diff --git a/Makefile b/Makefile index 21533a4f..fcb9cda5 100644 --- a/Makefile +++ b/Makefile @@ -59,10 +59,10 @@ pylintshort: @find . -name "*.py" -exec pylint $(PYLINT_ARGS) {} \; 2>/dev/null |perl -ne "print if(/(Your code has been rated)|(\*\*\*\* Module)/)" nose: - @cd /tmp; mkdir -p gtftk_test; cd gtftk_test; a=`python -c "import os,pygtftk; print(os.path.dirname(pygtftk.__file__))"`; cd $$a ; for i in `find . -name "*.py" | perl -ne 'print unless(/(setup)|(plugin)|(libgtftk.py)|(__)/)'`; do echo "================="; echo $$i; nosetests --with-doctest $$i; done + @cd /tmp; mkdir -p gtftk_test; cd gtftk_test; a=`python -c "import os,pygtftk; print(os.path.dirname(pygtftk.__file__))"`; cd $$a ; for i in `find . -name "*.py" | perl -ne 'print unless(/(setup)|(plugin)|(bwig)|(libgtftk.py)|(__)/)'`; do echo "================="; echo $$i; nosetests --with-doctest $$i; done nose_travis: - @ source activate pygtftk_py3k; mkdir -p ~/tmp; cd ~/tmp ; mkdir -p gtftk_test; cd gtftk_test; a=`python -c "import os,pygtftk; print(os.path.dirname(pygtftk.__file__))"`; echo $$a; cd $$a ; for i in `find . -name "*.py" | perl -ne 'print unless(/(setup)|(plugin)|(libgtftk.py)|(__)/)'`; do echo "================="; echo $$i; nosetests --with-doctest $$i; done + @ source activate pygtftk_py3k; mkdir -p ~/tmp; cd ~/tmp ; mkdir -p gtftk_test; cd gtftk_test; a=`python -c "import os,pygtftk; print(os.path.dirname(pygtftk.__file__))"`; echo $$a; cd $$a ; for i in `find . -name "*.py" | perl -ne 'print unless(/(setup)|(plugin)||(bwig)|(libgtftk.py)|(__)/)'`; do echo "================="; echo $$i; nosetests --with-doctest $$i; done install: @@ -94,10 +94,10 @@ test_cmd: make bats_cmd CMD=$(CMD) %.bats: - @gtftk -l > prgm_list.txt; gtftk -p > test_list.txt; for i in $$(cat prgm_list.txt); do cat test_list.txt | grep -E "@test \"$$i" -A 3 | grep -v "^\-\-$$" > $$i.bats; done + @gtftk -l |sort -r > prgm_list.txt; gtftk -p > test_list.txt; for i in $$(cat prgm_list.txt); do cat test_list.txt | grep -E "@test \"$$i" -A 3 | grep -v "^\-\-$$" > $$i.bats; done %.bats_travis: - @gtftk -l | grep -v select_by_go | grep -v retrieve > prgm_list.txt; gtftk -p > test_list.txt; for i in $$(cat prgm_list.txt); do cat test_list.txt | grep -E "@test \"$$i" -A 3 | grep -v "^\-\-$$" > $$i.bats; done + @gtftk -l |sort -r | grep -v select_by_go | grep -v retrieve > prgm_list.txt; gtftk -p > test_list.txt; for i in $$(cat prgm_list.txt); do cat test_list.txt | grep -E "@test \"$$i" -A 3 | grep -v "^\-\-$$" > $$i.bats; done %.completed : %.bats @bats -t $< @@ -107,13 +107,13 @@ test_cmd: @bats -t $< @echo "completed" > $@ -OUTPUT = $(eval OUTPUT := $$(shell gtftk -l 2>/dev/null))$(OUTPUT) +OUTPUT = $(eval OUTPUT := $$(shell gtftk -l |sort -r 2>/dev/null))$(OUTPUT) OUTPUT2 = $(addsuffix .completed, $(OUTPUT)) test_para: $(OUTPUT2) -OUTPUT3 = $(eval OUTPUT3 := $$(shell gtftk -l | grep -v select_by_go | grep -v retrieve 2>/dev/null))$(OUTPUT3) +OUTPUT3 = $(eval OUTPUT3 := $$(shell gtftk -l |sort -r | grep -v select_by_go | grep -v retrieve 2>/dev/null))$(OUTPUT3) OUTPUT4 = $(addsuffix .completed, $(OUTPUT3)) test_para_travis: $(OUTPUT4) @@ -121,7 +121,7 @@ test_para_travis: $(OUTPUT4) clean: @make bats_cmd CMD=clean - @git checkout docs/source/conf.py pygtftk/version.py; rm -rf simple* control_list_reference.txt control_list_data.txt add_attr_to_pos.tab test.py pygtftk.egg-info build airway_love.txt* ENCFF630HEX_Total_RNAseq_K562_count_mini.txt STDIN.e* closest_1.tsv STDIN.o* dist cmd_list.txt example_list.txt tmp_list.txt simple.chromInfo prgm_list.txt test_list.txt *.bats *.completed *mini_real* heatmap_* tx_classes* *~ \#* hh profile_* toto tott; cd docs/; make clean; cd ..; find . -type f -name '*~' -exec rm -f '{}' \; + @git checkout docs/source/conf.py pygtftk/version.py; rm -rf expected_s* ids* diff_fasta.py chr1_hg38_10M.fa* observed_s* order_fasta.py simple* control_list_reference.txt control_list_data.txt add_attr_to_pos.tab test.py pygtftk.egg-info build airway_love.txt* ENCFF630HEX_Total_RNAseq_K562_count_mini.txt STDIN.e* closest_1.tsv STDIN.o* dist cmd_list.txt example_list.txt tmp_list.txt simple.chromInfo prgm_list.txt test_list.txt *.bats *.completed *mini_real* heatmap_* tx_classes* *~ \#* hh profile_* toto tott; cd docs/; make clean; cd ..; find . -type f -name '*~' -exec rm -f '{}' \; check_cmd_has_example: @for i in $$(gtftk -l); do if grep -q "^$$i" docs/source/presentation.rst; then echo "" >/dev/null; else echo $$i; fi; done diff --git a/README.rst b/README.rst index be527b06..6f805361 100644 --- a/README.rst +++ b/README.rst @@ -129,3 +129,5 @@ Running unitary tests Several unitary tests have been implemented using doctests. You can run them using nose through the following command line: :: make nose + + diff --git a/bin/gtftk b/bin/gtftk index 37af8996..d678873d 100644 --- a/bin/gtftk +++ b/bin/gtftk @@ -24,6 +24,7 @@ from pygtftk.utils import flatten_list from pygtftk.utils import message from pygtftk.utils import silentremove from pygtftk.version import __version__ +from pygtftk.bwig.bw_coverage import TMP_FILE_POOL_MANAGER # Avoid warning message emitted by numpy # https://tinyurl.com/ybev6zrw @@ -92,9 +93,9 @@ def main(): if __name__ == "__main__": - from signal import signal, SIGPIPE, SIG_DFL + #from signal import signal, SIGPIPE, SIG_DFL - signal(SIGPIPE, SIG_DFL) + #signal(SIGPIPE, SIG_DFL) try: @@ -104,19 +105,21 @@ if __name__ == "__main__": # delete created temporary files - for i in flatten_list(TMP_FILE_LIST, outlist=[]): + for i in flatten_list(TMP_FILE_LIST + list(TMP_FILE_POOL_MANAGER), outlist=[]): # If the user ask to keep temp files if args.tmp_dir is not None: - message("Keeping temporary file :" + i) + message("Keeping temp file : " + i) base_name_i = os.path.basename(i) shutil.move(i, os.path.join(args.tmp_dir, base_name_i)) else: - message("Deleting temporary file :" + i, type="DEBUG") + message("Deleting temp file : " + i, type="DEBUG") silentremove(i) except KeyboardInterrupt: message("Canceled on user request.") sys.exit(0) + except BrokenPipeError: + pass sys.exit(0) diff --git a/changelog.md b/changelog.md index 68781d73..b2f4fca8 100644 --- a/changelog.md +++ b/changelog.md @@ -1,5 +1,34 @@ # Changelog +## v0.9.9 + +### Bug Fixes + +- Fix a critical bug in get_sequence that affected get_feat_seq and get_tx_seq. +- Select_by_key now throw an error when no key/val are available. +- No more function with mutable objects as default arguments. +- Fix temporary file deletion. + +### API Changes + +- Refactored arg_formatter by creating a single type (ranged_num) to test for numeric inputs. +- Refactored all plugins so that there is no more reference to unused arguments (tmp_dir, verbosity...). + + +### Code changes + +- No more reference to PY2. +- Added several test to get_tx_seq and get_feat_seq. +- Added several script to manipulate fasta files (see 'tools' folder). For pygtftk dev. +- Added 'extra_require' slot in setup(). +- The get-feature-seq program now relies on bedtools (not on internal C code). This may change in the future asa a more flexible C interface is available. + +### New Features + +- Added --list-bigwigs to profile (to display the content of a coverage file). +- Added a novel dataset (mini_real_10M) derived from mini_real and containing 10 Mb of chr1. +- The configuration directory now supports several subdirectories named based on a hash string computed from path to the gtftk program. + ## v0.9.8 diff --git a/docs/source/_static/example_01.png b/docs/source/_static/example_01.png index df8331e9..fbce1fad 100644 Binary files a/docs/source/_static/example_01.png and b/docs/source/_static/example_01.png differ diff --git a/docs/source/_static/example_01b.png b/docs/source/_static/example_01b.png index b22f767d..a63c47bc 100644 Binary files a/docs/source/_static/example_01b.png and b/docs/source/_static/example_01b.png differ diff --git a/docs/source/_static/example_02.png b/docs/source/_static/example_02.png index f7a57726..3de23c5e 100644 Binary files a/docs/source/_static/example_02.png and b/docs/source/_static/example_02.png differ diff --git a/docs/source/_static/example_05.png b/docs/source/_static/example_05.png index a6705ddc..962ebe4c 100644 Binary files a/docs/source/_static/example_05.png and b/docs/source/_static/example_05.png differ diff --git a/docs/source/_static/example_06.png b/docs/source/_static/example_06.png index 751bd06d..3f08ee0b 100644 Binary files a/docs/source/_static/example_06.png and b/docs/source/_static/example_06.png differ diff --git a/docs/source/_static/example_06b.png b/docs/source/_static/example_06b.png index 9e81172d..c51a456a 100644 Binary files a/docs/source/_static/example_06b.png and b/docs/source/_static/example_06b.png differ diff --git a/docs/source/_static/example_07.png b/docs/source/_static/example_07.png index 586a8f8d..935b48c2 100644 Binary files a/docs/source/_static/example_07.png and b/docs/source/_static/example_07.png differ diff --git a/docs/source/_static/example_08.png b/docs/source/_static/example_08.png index 1249ec41..6de5819f 100644 Binary files a/docs/source/_static/example_08.png and b/docs/source/_static/example_08.png differ diff --git a/docs/source/_static/example_13.png b/docs/source/_static/example_13.png index 67c26660..12c83599 100644 Binary files a/docs/source/_static/example_13.png and b/docs/source/_static/example_13.png differ diff --git a/docs/source/annotation.rst b/docs/source/annotation.rst new file mode 100644 index 00000000..9c86bc8e --- /dev/null +++ b/docs/source/annotation.rst @@ -0,0 +1,149 @@ +Commands from section 'annotation' +------------------------------------ + + +closest_gn_to_feat +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Find the n closest genes/transcripts for each peak (or the oppposite). + +**Example:** Find the closest tss to a set of peak + +.. command-output:: gtftk closest_gn_to_feat -t tss -r simple_peaks.bed6 -i simple.gtf -c simple.chromInfo -p 10 -K toto -n transcript_id,gene_id + :shell: + +**Example:** Find the closest tss to a set of peak. Use the gene-centric and uncollapsed outout. + +.. command-output:: gtftk closest_gn_to_feat -t tss -r simple_peaks.bed6 -i simple.gtf -c simple.chromInfo -p 10 -K toto -n transcript_id,gene_id -gu + :shell: + + +**Arguments:** + +.. command-output:: gtftk closest_gn_to_feat -h + :shell: + + +closest_genes +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Find the n closest genes for each transcript. + +**Example:** + +.. command-output:: gtftk get_example | bedtools sort | gtftk closest_genes -f + :shell: + + +**Arguments:** + +.. command-output:: gtftk closest_genes -h + :shell: + + +overlapping +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Find transcripts whose body/TSS/TTS region extended in 5' and 3' (-u/-d) overlaps with any transcript from another gene. Strandness is not considered by default. Used --invert-match to find those that do not overlap. If --annotate-gtf is used, all lines of the input GTF file will be printed and a new key containing the list of overlapping transcripts will be added to the transcript features/lines (key will be 'overlapping_*' with * one of body/TSS/TTS). The --annotate-gtf and --invert-match arguments are mutually exclusive. + + +**Example:** Find transcript whose promoter overlap transcript from other genes. + +.. command-output:: gtftk get_example -f chromInfo > simple_join_chromInfo.txt; gtftk get_example | gtftk overlapping -c simple_join_chromInfo.txt -t promoter -u 10 -d 10 -a | gtftk select_by_key -k feature -v transcript | gtftk tabulate -k transcript_id,overlap_promoter_u0.01k_d0.01k | head + :shell: + + +**Arguments:** + +.. command-output:: gtftk overlapping -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +divergent +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Find transcript with divergent promoters. These transcripts will be defined here +as those whose promoter region (defined by -u/-d) overlaps with the tss of +another gene in reverse/antisens orientation. This may be useful to select +coding genes in head-to-head orientation or LUAT as described in "Divergent +transcription is associated with promoters of transcriptional regulators" +(Lepoivre C, BMC Genomics, 2013). The ouput is a GTF with an additional key +('divergent') whose value is set to '.' if the gene has no antisens transcript +in its promoter region. If the gene has an antisens transcript in its promoter +region the 'divergent' key is set to the identifier of the transcript whose tss +is the closest relative to the considered promoter. The tss to tss distance is +also provided as an additional key (dist_to_divergent). + + +**Example:** Flag divergent transcripts in the example dataset. Select them and produce a tabulated output. + +.. command-output:: gtftk get_example -f chromInfo > simple_join_chromInfo.txt; gtftk get_example | gtftk divergent -c simple_join_chromInfo.txt -u 10 -d 10| gtftk select_by_key -k feature -v transcript | gtftk tabulate -k transcript_id,divergent,dist_to_divergent | head -n 7 + :shell: + +**Arguments:** + +.. command-output:: gtftk divergent -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +convergent +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Find transcript with convergent tts. These transcripts will be defined here +as those whose tts region (defined by -u/-d) overlaps with the tts of +another gene in reverse/antisens orientation. The ouput is a GTF with an +additional key ('convergent') whose value is set to '.' if the gene has no +convergent transcript in its tts region. If the gene has an antisens transcript +in its tts region the 'convergent' key is set to the identifier of the +transcript whose tts is the closest relative to the considered tts. +The tts to tts distance is also provided as an additional key (dist_to_convergent). + + +**Example:** Flag divergent transcripts in the example dataset. Select them and produce a tabulated output. + +.. command-output:: gtftk get_example -f chromInfo > simple_join_chromInfo.txt; gtftk get_example | gtftk convergent -c simple_join_chromInfo.txt -u 25 -d 25| gtftk select_by_key -k feature -v transcript | gtftk tabulate -k transcript_id,convergent,dist_to_convergent| head -n 4 + :shell: + +**Arguments:** + +.. command-output:: gtftk convergent -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +exon_sizes +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Add a new key to transcript features containing a comma separated list of exon sizes. + + +**Example:** + +.. command-output:: gtftk get_example | gtftk exon_sizes | gtftk select_by_key -t + :shell: + +**Arguments:** + +.. command-output:: gtftk exon_sizes -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + + +intron_sizes +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Add a new key to transcript features containing a comma separated list of intron sizes. + + +**Example:** + +.. command-output:: gtftk get_example | gtftk intron_sizes | gtftk select_by_key -t + :shell: + +**Arguments:** + +.. command-output:: gtftk intron_sizes -h + :shell: diff --git a/docs/source/conf.py b/docs/source/conf.py index 2b8de6da..a11860ee 100644 --- a/docs/source/conf.py +++ b/docs/source/conf.py @@ -55,10 +55,10 @@ # built documents. # # The short X.Y version. -version = u'0.9.8' +version = u'0.9.8.dev0+8f76' # The full version, including alpha/beta/rc tags. -release = u'0.9.8' +release = u'0.9.8.dev0+8f76' # The language for content autogenerated by Sphinx. Refer to documentation # for a list of supported languages. diff --git a/docs/source/convertion.rst b/docs/source/convertion.rst new file mode 100644 index 00000000..669e1e6d --- /dev/null +++ b/docs/source/convertion.rst @@ -0,0 +1,85 @@ +Commands from section 'convertion' +----------------------------------- + +convert +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** This command can be used to convert to various formats. Currently only a limited number is supported. + +* **bed**: classical bed6 format. +* **bed6**: classical bed6 format. +* **bed3**: bed3 format. + + +**Example:** Get the gene features and convert them to bed6. + +.. command-output:: gtftk get_example | gtftk select_by_key -k feature -v gene | gtftk convert -n gene_id -f bed6| head -n 3 + :shell: + + +**Arguments:** + +.. command-output:: gtftk convert -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +tabulate +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Extract key/values from the GTF and convert them to tabulated format. When requesting coordinates they will be provided in 1-based format. + + +**Example:** Simply get the list of transcripts and gene. + +.. command-output:: gtftk get_example -f gtf | gtftk select_by_key -k feature -v transcript| gtftk tabulate -k gene_id,transcript_id -s "|" + :shell: + +.. warning:: By default tabulate will discard any line for which one of the selected key is not defined. Use -x (--accept-undef) to print them. + + +**Arguments:** + +.. command-output:: gtftk tabulate -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + + +bed_to_gtf +~~~~~~~~~~~~~~~~~~~~~~ + + +**Description:** Convert a bed file to gtf-like format. + +**Example:** + +.. command-output:: gtftk get_example |gtftk convert| gtftk bed_to_gtf -t transcript | head -n 5 + :shell: + + +**Arguments:** + +.. command-output:: gtftk bed_to_gtf -h + :shell: + + +------------------------------------------------------------------------------------------------------------------ + + +convert_ensembl +~~~~~~~~~~~~~~~~~~~~~~ + + +**Description:** Convert the GTF file to ensembl format. Essentially add 'transcript'/'gene' features. + +**Example:** Delete gene and transcript feature. Regenerate them. + +.. command-output:: gtftk get_example | gtftk select_by_key -k feature -v gene,transcript -n| gtftk convert_ensembl | gtftk select_by_key -k gene_id -v G0001 + :shell: + + +**Arguments:** + +.. command-output:: gtftk bed_to_gtf -h + :shell: diff --git a/docs/source/coordinates.rst b/docs/source/coordinates.rst new file mode 100644 index 00000000..d44cee8f --- /dev/null +++ b/docs/source/coordinates.rst @@ -0,0 +1,121 @@ +Commands from section 'coordinates' +----------------------------------- + +midpoints +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Get the genomic midpoint of each features: genes, transcripts, exons or introns. Output is currently in bed format only. + + +**Example:** Get mipoints of all transcripts and exons. + +.. command-output:: gtftk get_example | gtftk midpoints -t transcript,exon -n transcript_id,feature | head -n 5 + :shell: + + +**Arguments:** + +.. command-output:: gtftk midpoints -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +get_5p_3p_coords +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Get the 5p or 3p coordinates for each feature (e.g TSS or TTS for a transcript). +Output is bed format. + +**Example:** Get the 5p ends of transcripts and exons. + +.. command-output:: gtftk get_example | gtftk get_5p_3p_coords -t transcript,exon -n transcript_id,gene_id,feature | head -n 5 + :shell: + + +**Arguments:** + +.. command-output:: gtftk get_5p_3p_coords -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + + +intergenic +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Extract intergenic regions. This command requires a chromInfo file to compute +the bed file boundaries. The command will print the coordinates of genomic +regions without transcript features. + + +**Example:** Simply get intergenic regions. + +.. command-output:: gtftk get_example -f chromInfo > simple_join_chromInfo.txt; gtftk get_example | gtftk intergenic -c simple_join_chromInfo.txt + :shell: + +**Arguments:** + +.. command-output:: gtftk intergenic -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +intronic +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Returns a bed file containing the intronic regions. If by_transcript is false +(default), returns merged genic regions with no exonic overlap ("strict" mode). +Otherwise, the intronic regions corresponding to each transcript are returned +(may contain exonic overlap and redundancy). + +**Example:** Simply get intronic regions. + +.. command-output:: gtftk get_example | gtftk intronic | head -n 5 + :shell: + + +**Arguments:** + +.. command-output:: gtftk intronic -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + + +splicing_site +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Compute the locations of donor and acceptor splice sites. This command will return a single position which corresponds to the most 5' and/or the most 3' intronic region. If the gtf file does not contain exon numbering you can compute it using the +add_exon_nb command. The score column of the bed file contain the number of the closest exon relative to the splice site. + +**Example:** + +.. command-output:: gtftk get_example | gtftk add_exon_nb -k exon_nbr | gtftk splicing_site -k exon_nbr| head + :shell: + +**Arguments:** + +.. command-output:: gtftk splicing_site -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +shift +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Shift coordinates in 3' or 5' direction. + +**Example:** + +.. command-output:: gtftk get_example| head -n 1 + :shell: + +.. command-output:: gtftk get_example -f chromInfo > simple.chromInfo; gtftk get_example | gtftk shift -s -10 -c simple.chromInfo | head -n 1 + :shell: + + +**Arguments:** + +.. command-output:: gtftk shift -h + :shell: + diff --git a/docs/source/coverage.rst b/docs/source/coverage.rst new file mode 100644 index 00000000..e39707ae --- /dev/null +++ b/docs/source/coverage.rst @@ -0,0 +1,191 @@ +Commands from section 'coverage' +---------------------------------- + +coverage +~~~~~~~~ + +**Description:** Takes a GTF as input to compute bigwig coverage in regions of interest (promoter, transcript body, intron, intron_by_tx, tts...) or a BED6 to focus on user-defined regions. If --n-highest is used the program will compute the coverage of each bigwig based on the average value of the n windows (--nb-window) with the highest coverage values. +Regions were signal can be computed (if GTF file as input) are promoter, tts, introns, intergenic regions or any feature available in the GTF file (transcript, exon, gene...). +If --matrix-out is selected, the signal for each bigwig will be provided in a dedicated column. Otherwise, signal for each bigwig is provided through a dedicated line. + + + **Example:** + +We will first request a lightweight example dataset (but more realistic than the 'simple' dataset). + + +.. command-output:: gtftk get_example -d mini_real_noov_rnd_tx -f '*' + :shell: + + +.. command-output:: gtftk get_example -d mini_real -f '*' + :shell: + + +Now we will compute coverage of promoters regions using 3 bigWig files as input. + + +.. command-output:: gtftk coverage -l H3K4me3,H3K79me2,H3K36me3 -u 5000 -d 5000 -i mini_real_noov_rnd_tx.gtf.gz -c hg38.genome -m transcript_id,gene_name -x ENCFF742FDS_H3K4me3_K562_sub.bw ENCFF947DVY_H3K79me2_K562_sub.bw ENCFF431HAA_H3K36me3_K562_sub.bw -k 4 > coverage.bed + :shell: + + +Now we can have a look at the result: + +.. command-output:: head -n 10 coverage.bed + :shell: + + +**Arguments:** + +.. command-output:: gtftk coverage -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + + +mk_matrix +~~~~~~~~~~ + +Description: Gtftk implements commands that can be used to produce coverage profiles around genomic features or inside user-defined regions. A coverage matrix need first to be produced from a bwig using the mk_matrix command. + +**Example:** + +We will used the same dataset (mini_real.gtf) as produced above (see help on *coverage* command). + +We can now create a coverage matrix around TSS/TTS or along the full transcript +(with or without 5' and 3' regions). Provide a BED file as *---inputfile* if you +want to use your own, user-specific, regions. +Will will create tree example datasets: + +First we will create a coverage matrix around promoter based on a subset of randomly choose transcripts (one per gene) from the 'mini_real' dataset (see section on the *coverage* command to get info about the construction of the *mini_real_noov_rnd_tx.gtf.gz* dataset). + +.. command-output:: gtftk get_example -f '*' -d mini_real + :shell: + + +.. command-output:: gtftk get_example -f '*' -d mini_real_noov_rnd_tx + :shell: + + +.. command-output:: gtftk mk_matrix -k 5 -i mini_real_noov_rnd_tx.gtf.gz -d 5000 -u 5000 -w 200 -c hg38.genome -l H3K4me3,H3K79me,H3K36me3 ENCFF742FDS_H3K4me3_K562_sub.bw ENCFF947DVY_H3K79me2_K562_sub.bw ENCFF431HAA_H3K36me3_K562_sub.bw -o mini_real_promoter + :shell: + + + +The following command compute coverage profil along the whole transcript. + + +.. command-output:: gtftk mk_matrix -k 5 --bin-around-frac 0.5 -i mini_real_noov_rnd_tx.gtf.gz -t transcript -d 5000 -u 5000 -w 200 -c hg38.genome -l H3K4me3,H3K79me,H3K36me3 ENCFF742FDS_H3K4me3_K562_sub.bw ENCFF947DVY_H3K79me2_K562_sub.bw ENCFF431HAA_H3K36me3_K562_sub.bw -o mini_real_tx + :shell: + + +.. command-output:: gtftk mk_matrix -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + + +profile +~~~~~~~ + + +Description: This command is used to create profil diagrams from a *mk_matrix* output. The two important arguments for +this command are *---group-by*, that defines the variable controling the set of colored lines and *---facet-var* that defines the variable controling the way the plot is facetted . Both *---group-by* and *---facet-var* should be set to one of *bwig*, *tx_classes* or *chrom*. + + +**Basic profiles** + +A simple overlayed profile of all epigenetic marks around promoter. Here *---group-by* is, by default set to *bwig* and *---facet-var* is set to None. Thus a single plot with several lines corresponding to bwig coverage is obtained. + + + +.. command-output:: gtftk profile -D -i mini_real_promoter.zip -o profile_prom -pf png -if example_01.png + :shell: + +.. image:: _static/example_01.png + :width: 75% + :target: _static/example_01.png + +Changing colors and applying color order can be done using the following syntax: + + +.. command-output:: gtftk profile -D -i mini_real_promoter.zip -c 'red,blue,violet' -d H3K79me,H3K4me3,H3K36me3 -o profile_prom -pf png -if example_01b.png + :shell: + + +.. image:: _static/example_01b.png + :width: 75% + :target: _static/example_01b.png + + +Transcript coverage is obtained using the *mini_real_tx.zip* matrix. This provides a simple overlayed profile of all epigenetic marks along the transcript body extended in 5' and 3' regions: + +.. command-output:: gtftk profile -D -i mini_real_tx.zip -o profile_tx -pf png -if example_02.png + :shell: + + +.. image:: _static/example_02.png + :width: 75% + :target: _static/example_02.png + +**Faceted profiles** + +Faceted plot of epigenetic profiles. The groups (i.e colors/lines) can be set to bwig classes and the facets to transcript classes. Things can be simply done by providing an additional file containing the transcript and their associated classes. + + +**Example:** + + +.. command-output:: gtftk profile -D -i mini_real_promoter.zip -f tx_classes -g bwig -t tx_classes.txt -o profile_prom -pf png -if example_05.png -e -V 2 -fc 2 + :shell: + + +.. image:: _static/example_05.png + :width: 75% + :target: _static/example_05.png + + +Alternatively, the groups can be set to chromosomes or transcript classes: + + +.. command-output:: gtftk profile -D -i mini_real_promoter.zip -g tx_classes -f bwig -t tx_classes.txt -o profile_prom -pf png -if example_06.png -V 2 -nm ranging + :shell: + + +.. image:: _static/example_06.png + :width: 75% + :target: _static/example_06.png + + +.. command-output:: gtftk profile -D -i mini_real_promoter.zip -g chrom -f bwig -t tx_classes.txt -o profile_prom -pf png -if example_06b.png -V 2 -nm ranging + :shell: + + +.. image:: _static/example_06b.png + :width: 75% + :target: _static/example_06b.png + + +Note that facets may also be associated to epigenetic marks. In this case each the --group-by can be set to *tx_classes* or *chrom*. + + +.. command-output:: gtftk profile -D -i mini_real_tx.zip -g tx_classes -t tx_classes.txt -f bwig -o profile_tx -pf png -if example_07.png -w -nm ranging + :shell: + + +.. image:: _static/example_07.png + :width: 75% + :target: _static/example_07.png + + +.. command-output:: gtftk profile -D -i mini_real_tx.zip -g chrom -f bwig -o profile_tx -pf png -if example_08.png -w -nm ranging + :shell: + + +.. image:: _static/example_08.png + :width: 75% + :target: _static/example_08.png + +.. command-output:: gtftk profile -h + :shell: + diff --git a/docs/source/editing.rst b/docs/source/editing.rst new file mode 100644 index 00000000..3836e898 --- /dev/null +++ b/docs/source/editing.rst @@ -0,0 +1,157 @@ +Commands from section 'Editing' +---------------------------------- + + +add_prefix +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Add a prefix (or suffix) to one of the attribute value (*e.g.* gene_id) + +**Example:** + +.. command-output:: gtftk get_example| gtftk add_prefix -k transcript_id -t "novel_"| head -2 + :shell: + +**Arguments:** + +.. command-output:: gtftk add_prefix -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +del_attr +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Delete an attribute and its corresponding values. + +**Example:** + +.. command-output:: gtftk get_example | gtftk del_attr -k transcript_id,gene_id,exon_id | head -3 + :shell: + +**Arguments:** + +.. command-output:: gtftk del_attr -h + :shell: + + +------------------------------------------------------------------------------------------------------------------ + +join_attr +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Add attributes from a file. This command can be used to import additional key/values into the gtf (e.g CPAT for coding potential, DESeq for differential analysis...). The imported file can be in 2 formats (2 columns or matrix): + +- With a 2-columns file: + + - value for joining (transcript_id or gene_id...). + - corresponding value. + +- With a matrix (see -m): + + - rows corresponding to joining keys (transcript_id or gene_id or...). + - columns corresponding to novel attributes name. + - Each cell of the matrix is a value for the corresponding attribute. + + +**Example:** With a 2-columns file. + +.. command-output:: gtftk get_example -f join > simple_join.txt + :shell: + +.. command-output:: cat simple_join.txt + :shell: + +.. command-output:: gtftk get_example -f gtf | gtftk join_attr -k gene_id -j simple_join.txt -n a_score -t gene| gtftk select_by_key -k feature -v gene + :shell: + +**Example:** With a matrix-like file. + +.. command-output:: gtftk get_example -f join_mat > simple_join_mat.txt + :shell: + +.. command-output:: cat simple_join_mat.txt + :shell: + +.. command-output:: gtftk get_example -f gtf | gtftk join_attr -k gene_id -j simple_join_mat.txt -m -t gene| gtftk select_by_key -k feature -v gene + :shell: + + +**Arguments:** + +.. command-output:: gtftk join_attr -h + :shell: + + +------------------------------------------------------------------------------------------------------------------ + +join_multi_file +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Join attributes from mutiple files. + + +**Example:** Add key/value to gene features. + +.. command-output:: gtftk get_example | gtftk join_multi_file -k gene_id -t gene simple.join_mat_2 simple.join_mat_3| gtftk select_by_key -g + :shell: + +**Arguments:** + +.. command-output:: gtftk join_multi_file -h + :shell: + + + +------------------------------------------------------------------------------------------------------------------ + +merge_attr +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Merge a set of attributes into a destination attribute. + + +**Example:** Merge gene_id and transcript_id into a new key associated to transcript features. + +.. command-output:: gtftk get_example | gtftk merge_attr -k transcript_id,gene_id -d txgn_id -s "|" -f transcript | gtftk select_by_key -t + :shell: + + +**Arguments:** + +.. command-output:: gtftk join_multi_file -h + :shell: + + +------------------------------------------------------------------------------------------------------------------ + + +discretize_key +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Create a new key by discretizing a numeric key. This can be helpful to create new classes of features on the fly. +The default is to create equally spaced interval. The intervals can also be created by computing the percentiles (-p) which will provide balanced classes most suitable generally. + + +**Example:** Let say we have the following matrix giving expression level of genes (rows) in samples (columns). We could join this information to the GTF and later choose to transform key *S1* into a new discretized key *S1_d*. We may apply particular labels to this factor using *-l*. + + +.. command-output:: gtftk get_example | gtftk join_attr -j simple.join_mat -k gene_id -m | gtftk discretize_key -k S1 -d S1_d -n 2 -l A,B | gtftk select_by_key -k feature -v gene + :shell: + +**Example:** We want to load RNA-seq data in the GTF (obtained through the get_example command) and discretize the expression values according to deciles (-p and -n set to 10). Classes will be labeled from A to J. The example below shows how balanced these classes will be. + +.. seealso:: The *profile* command that could be used to asses the associated epigenetic marks of these 10 gene classes. + + +.. command-output:: gtftk get_example -d mini_real -f "*" + :shell: + +.. command-output:: gtftk get_example -d mini_real | gtftk join_attr -H -j mini_real_counts_ENCFF630HEX.tsv -k gene_name -n exprs -t gene | gtftk discretize_key -k exprs -p -d exprs_class -n 10 -l A,B,C,D,E,F,G,H,I,J | gtftk tabulate -k exprs_class -Hn | sort | uniq -c + :shell: + +**Arguments:** + +.. command-output:: gtftk discretize_key -h + :shell: + diff --git a/docs/source/example_01.png b/docs/source/example_01.png index aff71a82..a94a5f39 100644 Binary files a/docs/source/example_01.png and b/docs/source/example_01.png differ diff --git a/docs/source/example_01b.png b/docs/source/example_01b.png index 67c7df5f..a63c47bc 100644 Binary files a/docs/source/example_01b.png and b/docs/source/example_01b.png differ diff --git a/docs/source/example_02.png b/docs/source/example_02.png index c7c2f230..d73f1040 100644 Binary files a/docs/source/example_02.png and b/docs/source/example_02.png differ diff --git a/docs/source/example_05.png b/docs/source/example_05.png index 72ec678e..309727a9 100644 Binary files a/docs/source/example_05.png and b/docs/source/example_05.png differ diff --git a/docs/source/example_06.png b/docs/source/example_06.png index 00c9ead6..893ef2cc 100644 Binary files a/docs/source/example_06.png and b/docs/source/example_06.png differ diff --git a/docs/source/example_06b.png b/docs/source/example_06b.png index b93da117..3e66dab1 100644 Binary files a/docs/source/example_06b.png and b/docs/source/example_06b.png differ diff --git a/docs/source/example_07.png b/docs/source/example_07.png index 44ae1a01..942d5260 100644 Binary files a/docs/source/example_07.png and b/docs/source/example_07.png differ diff --git a/docs/source/example_08.png b/docs/source/example_08.png index 7d9ea009..5ccfb3fe 100644 Binary files a/docs/source/example_08.png and b/docs/source/example_08.png differ diff --git a/docs/source/example_13.png b/docs/source/example_13.png index 15051923..10429e67 100644 Binary files a/docs/source/example_13.png and b/docs/source/example_13.png differ diff --git a/docs/source/gtftk_args.rst b/docs/source/gtftk_args.rst new file mode 100644 index 00000000..54a62874 --- /dev/null +++ b/docs/source/gtftk_args.rst @@ -0,0 +1,73 @@ +Help on gtftk Unix commands +============================ + + +Main parser arguments of gtftk +------------------------------- + + +Getting help with -h +~~~~~~~~~~~~~~~~~~~~~ + +The -h argument can be used to get a synopsis for implemented commands. + +.. command-output:: gtftk -h + :shell: + + +------------------------------------------------------------------------------------------------------------------ + + +Activating Bash completion +~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +The code provided below can be useful to activate bash completion. + +.. code-block:: bash + + # Use the -b argument of gtftk + # This will produce a script that you + # should store in your .bashrc + gtftk -b + +Or alternatively + +.. code-block:: bash + + echo "" >> ~/.bashrc + gtftk -b >> ~/.bashrc + + + +------------------------------------------------------------------------------------------------------------------ + + +Getting the list of funtional tests +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +One can access to the list of implemented tests through the -p/--plugin-tests arguments. These tests may be run using `bats `_ (Bash Automated Testing System). + + +.. code-block:: bash + + # gtftk --plugin-tests + + + +------------------------------------------------------------------------------------------------------------------ + + +Command-wide arguments +-------------------------- + +**Description:** The following arguments are available in almost all gtftk commands : + +- -h, --help : Argument list and details. +- -i, --inputfile: The input file (may be ). +- -o, --outputfile: The output file (may be ). +- -D, --no-date: Do not add date to output file names. +- -C, --add-chr: Add 'chr' to chromosome names before printing output. +- -V, --verbosity: Increases output verbosity (can take value from 0 to 4). +- -K --tmp-dir: Keep all temporary files into this folder. +- -L, --logger-file: Stores the values of all command line arguments into a file. + diff --git a/docs/source/index.rst b/docs/source/index.rst index 904b3765..698995e0 100644 --- a/docs/source/index.rst +++ b/docs/source/index.rst @@ -1,4 +1,3 @@ - Welcome to pygtftk documentation page -------------------------------------- @@ -25,7 +24,16 @@ Table of content about installation - presentation + gtftk_args + information + editing + selection + convertion + annotation + coordinates + sequence + coverage + miscellaneous api bwig_coverage developers diff --git a/docs/source/information.rst b/docs/source/information.rst new file mode 100644 index 00000000..48fd696d --- /dev/null +++ b/docs/source/information.rst @@ -0,0 +1,273 @@ +Commands from section 'information' +-------------------------------------- + + +apropos +~~~~~~~~~ + +**Description:** Search in all command description files those related to a user-defined keyword. + +**Example:** Search all commands related to promoters. + +.. command-output:: gtftk apropos -k promoter + :shell: + + +**Arguments:** + +.. command-output:: gtftk apropos -h + :shell: + + +------------------------------------------------------------------------------------------------------------------ + +retrieve +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Retrieves a GTF file from ensembl. + +**Example:** List the available GTF files in ensembl FTP. Bacteria are not listed at the moment. + +.. command-output:: # gtftk retrieve -l | head -5 + :shell: + +**Example:** Perform basic statistics on Vicugna pacos genomic annotations. + +.. command-output:: # gtftk retrieve -s vicugna_pacos -c -d | gtftk count -t vicugna_pacos + :shell: + +**Arguments:** + +.. command-output:: gtftk retrieve -h + :shell: + + +------------------------------------------------------------------------------------------------------------------ + +get_example +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Get an example GTF file (or any other kind of example available in the installation directory). This command is only provided for demonstration purpose. + +We can see from the example below that this gtf file **follows the ensembl format** and contains the **transcript and gene features** (column 3). + + +**Example:** The very basic (and artificial) example. + +.. command-output:: gtftk get_example| head -2 + :shell: + + +let's get all files from the *simple* dataset. + +.. command-output:: gtftk get_example -d simple -f '*' + :shell: + +**Arguments:** + +.. command-output:: gtftk get_example -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +add_exon_nb +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Add exon number transcript-wise (based on 5' to 3' orientation). + +**Example:** + +.. command-output:: gtftk get_example | gtftk add_exon_nb -k exon_number | gtftk select_by_key -k feature -v exon | gtftk tabulate -k chrom,start,end,exon_number,transcript_id | head -n 20 + :shell: + + +**Arguments:** + + +.. command-output:: gtftk add_exon_nb -h + :shell: + + +------------------------------------------------------------------------------------------------------------------ + +count +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Count the number of features (transcripts, genes, exons, introns). + +**Example:** + +.. command-output:: gtftk get_example | gtftk count -t example_gtf + :shell: + + +**Arguments:** + +.. command-output:: gtftk count -h + + +------------------------------------------------------------------------------------------------------------------ + +count_key_values +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Count the number of values for a set of keys. + + +**Example:** Count the number of non-redondant entries for chromosomes and transcript_id. + + +.. command-output:: gtftk get_example | gtftk count_key_values -k chrom,transcript_id -u + :shell: + + +**Arguments:** + +.. command-output:: gtftk count_key_values -h + + +------------------------------------------------------------------------------------------------------------------ + +get_attr_list +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Get the list of attributes from a GTF file. + +**Example:** Get the list of attributes in the "simple" dataset. + +.. command-output:: gtftk get_example | gtftk get_attr_list + :shell: + +**Arguments:** + +.. command-output:: gtftk get_attr_list -h + + +------------------------------------------------------------------------------------------------------------------ + +get_attr_value_list +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Get the list of values observed for an attributes. + + +**Example:** Get the number of time each gene_id is used. + +.. command-output:: gtftk get_example | gtftk get_attr_value_list -k gene_id -c -s ';' + :shell: + + +**Arguments:** + +.. command-output:: gtftk get_attr_value_list -h + + +------------------------------------------------------------------------------------------------------------------ + +get_feature_list +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Get the list of features enclosed in the GTF. + +**Example:** Get the list of features enclosed in the GTF. + +.. command-output:: gtftk get_example | gtftk get_feature_list + :shell: + +**Arguments:** + +.. command-output:: gtftk get_feature_list -h + + +------------------------------------------------------------------------------------------------------------------ + +nb_exons +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Count the number of exons and add it as a novel key/value. Output may also be in text format if requested. + +**Example:** + +.. command-output:: gtftk get_example -f gtf | gtftk nb_exons | head -n 5 + :shell: + +**Arguments:** + +.. command-output:: gtftk nb_exons -h + :shell: + + +------------------------------------------------------------------------------------------------------------------ + +nb_transcripts +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Count the number of transcript per gene. + +**Example:** Count the number of transcript per gene. + +.. command-output:: gtftk get_example | gtftk nb_transcripts | gtftk select_by_key -g + :shell: + + +**Arguments:** + +.. command-output:: gtftk nb_transcripts -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +seqid_list +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Return the chromosome list. + +**Example:** Return the chromosome list. + +.. command-output:: gtftk get_example | gtftk seqid_list + :shell: + + +**Arguments:** + +.. command-output:: gtftk seqid_list -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +tss_dist +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Compute the distance between TSSs of pairs of gene transcripts. The tss_num_1 and tss_num_2 columns contains the TSSs number (for transcript_id_1 and transcript_id_2 respectively). Numering starts from 1 (most 5' TSS for a gene) to the number of different TSS coordinates. Two or more transcripts will have the same tss_num if they share a TSS. + +**Example:** An example on the mini_real dataset. + +.. command-output:: gtftk get_example -d mini_real | gtftk tss_dist | head -n 10 + :shell: + + +**Arguments:** + +.. command-output:: gtftk tss_dist -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + + +feature_size +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Get the size and limits (start/end) of features enclosed in the GTF. If bed format is requested returns the limits in bed format and the size as a score. Otherwise output GTF file with 'feat_size' as a new key and size as value + + +**Example:** Add trancript size (mature RNA) to the gtf. + +.. command-output:: gtftk get_example | gtftk feature_size -t mature_rna | gtftk select_by_key -k feature -v transcript | head -n 5 + :shell: + +**Arguments:** + +.. command-output:: gtftk feature_size -h + :shell: + + diff --git a/docs/source/miscellaneous.rst b/docs/source/miscellaneous.rst new file mode 100644 index 00000000..fe073a9d --- /dev/null +++ b/docs/source/miscellaneous.rst @@ -0,0 +1,41 @@ +Commands from section 'miscellaneous' +------------------------------------- + +control_list +~~~~~~~~~~~~~~~~~~~~~ + + +**Description:** Returns a list of gene matched for expression based on reference values. Based on a reference gene list (or more generally IDs) this command tries to extract a set of other genes/IDs matched for signal/expression. The --reference-gene-file contains the list of reference IDs while the --inputfile contains a tuple gene/signal for all genes. + +**Example:** + +.. command-output:: gtftk control_list -i mini_real_counts_ENCFF630HEX.tsv -r mini_real_control_1.txt -D -V 2 -s -l -p 1 -ju -if example_13.png -pf png + :shell: + + +.. image:: _static/example_13.png + :target: _static/example_13.png + + +**Arguments:** + +.. command-output:: gtftk control_list -h + :shell: + + +col_from_tab +~~~~~~~~~~~~~~~~~~~~~~ + + +**Description:** Select columns from a tabulated file based on their names. + +**Example:** + +.. command-output:: gtftk get_example | gtftk select_by_key -t | gtftk tabulate -k '*' -x | gtftk col_from_tab -c transcript_id,gene_id + :shell: + + +**Arguments:** + +.. command-output:: gtftk col_from_tab -h + :shell: \ No newline at end of file diff --git a/docs/source/presentation.rst b/docs/source/presentation.rst deleted file mode 100644 index 36b18efb..00000000 --- a/docs/source/presentation.rst +++ /dev/null @@ -1,1394 +0,0 @@ -Help on gtftk Unix commands -============================ - - -Main parser arguments of gtftk -------------------------------- - - -Getting help with -h -~~~~~~~~~~~~~~~~~~~~~ - -The -h argument can be used to get a synopsis for implemented commands. - -.. command-output:: gtftk -h - :shell: - - ------------------------------------------------------------------------------------------------------------------- - - -Activating Bash completion -~~~~~~~~~~~~~~~~~~~~~~~~~~~ - -The code provided below can be useful to activate bash completion. - -.. code-block:: bash - - # Use the -b argument of gtftk - # This will produce a script that you - # should store in your .bashrc - gtftk -b - -Or alternatively - -.. code-block:: bash - - echo "" >> ~/.bashrc - gtftk -b >> ~/.bashrc - - - ------------------------------------------------------------------------------------------------------------------- - - -Getting the list of funtional tests -~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ - -One can access to the list of implemented tests through the -p/--plugin-tests arguments. These tests may be run using `bats `_ (Bash Automated Testing System). - - -.. code-block:: bash - - # gtftk --plugin-tests - - - ------------------------------------------------------------------------------------------------------------------- - - -Command-wide arguments --------------------------- - -**Description:** The following arguments are available in almost all gtftk commands : - -- -h, --help : Argument list and details. -- -i, --inputfile: The input file (may be ). -- -o, --outputfile: The output file (may be ). -- -D, --no-date: Do not add date to output file names. -- -C, --add-chr: Add 'chr' to chromosome names before printing output. -- -V, --verbosity: Increases output verbosity (can take value from 0 to 4). -- -K --tmp-dir: Keep all temporary files into this folder. -- -L, --logger-file: Stores the values of all command line arguments into a file. - - ------------------------------------------------------------------------------------------------------------------- - -Commands from section 'information' --------------------------------------- - - -apropos -~~~~~~~~~ - -**Description:** Search in all command description files those related to a user-defined keyword. - -**Example:** Search all commands related to promoters. - -.. command-output:: gtftk apropos -k promoter - :shell: - - -**Arguments:** - -.. command-output:: gtftk apropos -h - :shell: - - ------------------------------------------------------------------------------------------------------------------- - -retrieve -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Retrieves a GTF file from ensembl. - -**Example:** List the available GTF files in ensembl FTP. Bacteria are not listed at the moment. - -.. command-output:: # gtftk retrieve -l | head -5 - :shell: - -**Example:** Perform basic statistics on Vicugna pacos genomic annotations. - -.. command-output:: # gtftk retrieve -s vicugna_pacos -c -d | gtftk count -t vicugna_pacos - :shell: - -**Arguments:** - -.. command-output:: gtftk retrieve -h - :shell: - - ------------------------------------------------------------------------------------------------------------------- - -get_example -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Get an example GTF file (or any other kind of example available in the installation directory). This command is only provided for demonstration purpose. - -We can see from the example below that this gtf file **follows the ensembl format** and contains the **transcript and gene features** (column 3). - - -**Example:** The very basic (and artificial) example. - -.. command-output:: gtftk get_example| head -2 - :shell: - - -let's get all files from the *simple* dataset. - -.. command-output:: gtftk get_example -d simple -f '*' - :shell: - -**Arguments:** - -.. command-output:: gtftk get_example -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -add_exon_nb -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Add exon number transcript-wise (based on 5' to 3' orientation). - -**Example:** - -.. command-output:: gtftk get_example | gtftk add_exon_nb -k exon_number | gtftk select_by_key -k feature -v exon | gtftk tabulate -k chrom,start,end,exon_number,transcript_id | head -n 20 - :shell: - - -**Arguments:** - - -.. command-output:: gtftk add_exon_nb -h - :shell: - - ------------------------------------------------------------------------------------------------------------------- - -count -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Count the number of features (transcripts, genes, exons, introns). - -**Example:** - -.. command-output:: gtftk get_example | gtftk count -t example_gtf - :shell: - - -**Arguments:** - -.. command-output:: gtftk count -h - - ------------------------------------------------------------------------------------------------------------------- - -count_key_values -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Count the number of values for a set of keys. - - -**Example:** Count the number of non-redondant entries for chromosomes and transcript_id. - - -.. command-output:: gtftk get_example | gtftk count_key_values -k chrom,transcript_id -u - :shell: - - -**Arguments:** - -.. command-output:: gtftk count_key_values -h - - ------------------------------------------------------------------------------------------------------------------- - -get_attr_list -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Get the list of attributes from a GTF file. - -**Example:** Get the list of attributes in the "simple" dataset. - -.. command-output:: gtftk get_example | gtftk get_attr_list - :shell: - -**Arguments:** - -.. command-output:: gtftk get_attr_list -h - - ------------------------------------------------------------------------------------------------------------------- - -get_attr_value_list -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Get the list of values observed for an attributes. - - -**Example:** Get the number of time each gene_id is used. - -.. command-output:: gtftk get_example | gtftk get_attr_value_list -k gene_id -c -s ';' - :shell: - - -**Arguments:** - -.. command-output:: gtftk get_attr_value_list -h - - ------------------------------------------------------------------------------------------------------------------- - -get_feature_list -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Get the list of features enclosed in the GTF. - -**Example:** Get the list of features enclosed in the GTF. - -.. command-output:: gtftk get_example | gtftk get_feature_list - :shell: - -**Arguments:** - -.. command-output:: gtftk get_feature_list -h - - ------------------------------------------------------------------------------------------------------------------- - -nb_exons -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Count the number of exons and add it as a novel key/value. Output may also be in text format if requested. - -**Example:** - -.. command-output:: gtftk get_example -f gtf | gtftk nb_exons | head -n 5 - :shell: - -**Arguments:** - -.. command-output:: gtftk nb_exons -h - :shell: - - ------------------------------------------------------------------------------------------------------------------- - -nb_transcripts -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Count the number of transcript per gene. - -**Example:** Count the number of transcript per gene. - -.. command-output:: gtftk get_example | gtftk nb_transcripts | gtftk select_by_key -g - :shell: - - -**Arguments:** - -.. command-output:: gtftk nb_transcripts -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -seqid_list -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Return the chromosome list. - -**Example:** Return the chromosome list. - -.. command-output:: gtftk get_example | gtftk seqid_list - :shell: - - -**Arguments:** - -.. command-output:: gtftk seqid_list -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -tss_dist -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Compute the distance between TSSs of pairs of gene transcripts. The tss_num_1 and tss_num_2 columns contains the TSSs number (for transcript_id_1 and transcript_id_2 respectively). Numering starts from 1 (most 5' TSS for a gene) to the number of different TSS coordinates. Two or more transcripts will have the same tss_num if they share a TSS. - -**Example:** An example on the mini_real dataset. - -.. command-output:: gtftk get_example -d mini_real | gtftk tss_dist | head -n 10 - :shell: - - -**Arguments:** - -.. command-output:: gtftk tss_dist -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - - -feature_size -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Get the size and limits (start/end) of features enclosed in the GTF. If bed format is requested returns the limits in bed format and the size as a score. Otherwise output GTF file with 'feat_size' as a new key and size as value - - -**Example:** Add trancript size (mature RNA) to the gtf. - -.. command-output:: gtftk get_example | gtftk feature_size -t mature_rna | gtftk select_by_key -k feature -v transcript | head -n 5 - :shell: - -**Arguments:** - -.. command-output:: gtftk feature_size -h - :shell: - - ------------------------------------------------------------------------------------------------------------------- - -Commands from section 'Editing' ----------------------------------- - - -add_prefix -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Add a prefix (or suffix) to one of the attribute value (*e.g.* gene_id) - -**Example:** - -.. command-output:: gtftk get_example| gtftk add_prefix -k transcript_id -t "novel_"| head -2 - :shell: - -**Arguments:** - -.. command-output:: gtftk add_prefix -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -del_attr -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Delete an attribute and its corresponding values. - -**Example:** - -.. command-output:: gtftk get_example | gtftk del_attr -k transcript_id,gene_id,exon_id | head -3 - :shell: - -**Arguments:** - -.. command-output:: gtftk del_attr -h - :shell: - - ------------------------------------------------------------------------------------------------------------------- - -join_attr -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Add attributes from a file. This command can be used to import additional key/values into the gtf (e.g CPAT for coding potential, DESeq for differential analysis...). The imported file can be in 2 formats (2 columns or matrix): - -- With a 2-columns file: - - - value for joining (transcript_id or gene_id...). - - corresponding value. - -- With a matrix (see -m): - - - rows corresponding to joining keys (transcript_id or gene_id or...). - - columns corresponding to novel attributes name. - - Each cell of the matrix is a value for the corresponding attribute. - - -**Example:** With a 2-columns file. - -.. command-output:: gtftk get_example -f join > simple_join.txt - :shell: - -.. command-output:: cat simple_join.txt - :shell: - -.. command-output:: gtftk get_example -f gtf | gtftk join_attr -k gene_id -j simple_join.txt -n a_score -t gene| gtftk select_by_key -k feature -v gene - :shell: - -**Example:** With a matrix-like file. - -.. command-output:: gtftk get_example -f join_mat > simple_join_mat.txt - :shell: - -.. command-output:: cat simple_join_mat.txt - :shell: - -.. command-output:: gtftk get_example -f gtf | gtftk join_attr -k gene_id -j simple_join_mat.txt -m -t gene| gtftk select_by_key -k feature -v gene - :shell: - - -**Arguments:** - -.. command-output:: gtftk join_attr -h - :shell: - - ------------------------------------------------------------------------------------------------------------------- - -join_multi_file -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Join attributes from mutiple files. - - -**Example:** Add key/value to gene features. - -.. command-output:: gtftk get_example | gtftk join_multi_file -k gene_id -t gene simple.join_mat_2 simple.join_mat_3| gtftk select_by_key -g - :shell: - -**Arguments:** - -.. command-output:: gtftk join_multi_file -h - :shell: - - - ------------------------------------------------------------------------------------------------------------------- - -merge_attr -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Merge a set of attributes into a destination attribute. - - -**Example:** Merge gene_id and transcript_id into a new key associated to transcript features. - -.. command-output:: gtftk get_example | gtftk merge_attr -k transcript_id,gene_id -d txgn_id -s "|" -f transcript | gtftk select_by_key -t - :shell: - - -**Arguments:** - -.. command-output:: gtftk join_multi_file -h - :shell: - - ------------------------------------------------------------------------------------------------------------------- - - -discretize_key -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Create a new key by discretizing a numeric key. This can be helpful to create new classes of features on the fly. -The default is to create equally spaced interval. The intervals can also be created by computing the percentiles (-p) which will provide balanced classes most suitable generally. - - -**Example:** Let say we have the following matrix giving expression level of genes (rows) in samples (columns). We could join this information to the GTF and later choose to transform key *S1* into a new discretized key *S1_d*. We may apply particular labels to this factor using *-l*. - - -.. command-output:: gtftk get_example | gtftk join_attr -j simple.join_mat -k gene_id -m | gtftk discretize_key -k S1 -d S1_d -n 2 -l A,B | gtftk select_by_key -k feature -v gene - :shell: - -**Example:** We want to load RNA-seq data in the GTF (obtained through the get_example command) and discretize the expression values according to deciles (-p and -n set to 10). Classes will be labeled from A to J. The example below shows how balanced these classes will be. - -.. seealso:: The *profile* command that could be used to asses the associated epigenetic marks of these 10 gene classes. - - -.. command-output:: gtftk get_example -d mini_real -f "*" - :shell: - -.. command-output:: gtftk get_example -d mini_real | gtftk join_attr -H -j mini_real_counts_ENCFF630HEX.tsv -k gene_name -n exprs -t gene | gtftk discretize_key -k exprs -p -d exprs_class -n 10 -l A,B,C,D,E,F,G,H,I,J | gtftk tabulate -k exprs_class -Hn | sort | uniq -c - :shell: - -**Arguments:** - -.. command-output:: gtftk discretize_key -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -Commands from section 'selection' ---------------------------------- - - -select_by_key -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Extract lines from the gtf based on key and values. - - -**Example:** Select some features (genes) then some gene_id. - -.. command-output:: gtftk get_example |gtftk select_by_key -k feature -v gene | gtftk select_by_key -k gene_id -v G0002,G0003,G0004 - :shell: - - -**Arguments:** - -.. command-output:: gtftk select_by_key -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -select_by_regexp -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Select lines by testing values of a particular key with a regular expression - -**Example:** Select lines corresponding to gene_names matching the regular expression 'G.*9$'. - -.. command-output:: gtftk get_example | gtftk select_by_regexp -k gene_id -r 'G.*9$' - :shell: - -**Arguments:** - -.. command-output:: gtftk select_by_regexp -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -select_by_intron_size -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Delete genes containing an intron whose size is below s. If -m is selected, any gene whose sum of intronic region length is above s is deleted. Monoexonic genes are kept. - -**Example:** Some genes having transcripts containing an intron whose size is below 80 nucleotides - -.. command-output:: gtftk get_example -d mini_real | gtftk select_by_intron_size -s 80 -vd | gtftk intron_sizes | gtftk tabulate -k gene_name,transcript_id,intron_sizes -Hun - :shell: - -**Arguments:** - -.. command-output:: gtftk select_by_regexp -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -select_by_max_exon_nb -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** For each gene select the transcript with the highest number of exons. - - -**Example:** Select lines corresponding to gene_names matching the regular expression 'BCL.*'. - -.. command-output:: gtftk get_example | gtftk select_by_max_exon_nb | gtftk select_by_key -t - :shell: - -**Arguments:** - -.. command-output:: gtftk select_by_max_exon_nb -h - :shell: - - ------------------------------------------------------------------------------------------------------------------- - -select_by_loc -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Select transcripts/gene overlapping a given locations. A transcript is defined here as the genomic region from TSS to TTS including introns. This function will return the transcript and all its associated elements (exons, utr,...) even if only a fraction (e.g intron) of the transcript is overlapping the feature. If -/-ft-type is set to 'gene' returns the gene and all its associated elements. - -**Example:** Select transcripts at a given location. - -.. command-output:: gtftk get_example | gtftk select_by_key -k feature -v transcript | gtftk select_by_loc -l chr1:10-15 - :shell: - -**Arguments:** - -.. command-output:: gtftk select_by_loc -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -select_by_nb_exon -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Select transcripts based on the number of exons. - -**Example:** - -.. command-output:: gtftk get_example | gtftk select_by_nb_exon -m 2 | gtftk nb_exons| gtftk select_by_key -t - :shell: - -**Arguments:** - -.. command-output:: gtftk select_by_nb_exon -h - :shell: - - ------------------------------------------------------------------------------------------------------------------- - - -select_by_numeric_value -~~~~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Select lines from a GTF file based on a boolean test on numeric values. - -**Example:** - -.. command-output:: gtftk join_attr -i simple.gtf -j simple.join_mat -k gene_id -m| gtftk select_by_numeric_value -t 'start < 10 and end > 10 and S1 == 0.5555 and S2 == 0.7' -n ".,?" - :shell: - -**Arguments:** - -.. command-output:: gtftk select_by_numeric_value -h - :shell: - - ------------------------------------------------------------------------------------------------------------------- - -random_list -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Select a random list of genes or transcripts. - -**Example:** Select randomly 3 transcripts. - -.. command-output:: gtftk get_example | gtftk random_list -n 3| gtftk count - :shell: - - -**Arguments:** - -.. command-output:: gtftk random_list -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -random_tx -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Select randomly up to m transcript for each gene. - -**Example:** Select randomly 1 transcript per gene (*-m 1*). - -.. command-output:: gtftk get_example | gtftk random_tx -m 1| gtftk select_by_key -k feature -v gene,transcript| gtftk tabulate -k gene_id,transcript_id - :shell: - -**Arguments:** - -.. command-output:: gtftk random_tx -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -rm_dup_tss -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** If several transcripts of a gene share the same tss, select only one. - -**Example:** Use rm_dup_tss to select transcripts that will be used for mk_matrix -k 5 (see later). - -.. command-output:: gtftk get_example | gtftk rm_dup_tss| gtftk select_by_key -k feature -v transcript - :shell: - - -**Arguments:** - -.. command-output:: gtftk rm_dup_tss -h - :shell: - - ------------------------------------------------------------------------------------------------------------------- - -select_by_go -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Select genes from a GTF file using a Gene Ontology ID (e.g GO:0050789). - -**Example:** Select genes with transcription factor activity from the GTF. They could be used subsequently to test their epigenetic features (see later). - -.. command-output:: # gtftk get_example -d mini_real -f gtf| gtftk select_by_go -s hsapiens | gtftk select_by_key -k feature -v gene | gtftk tabulate -k gene_id,gene_name -Hun | head -6 - :shell: - -**Arguments:** - -.. command-output:: gtftk select_by_go -h - :shell: - - ------------------------------------------------------------------------------------------------------------------- - -select_by_tx_size -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Select transcript based on their size (i.e size of mature/spliced transcript). - -**Example:** - -.. command-output:: gtftk get_example | gtftk feature_size -t mature_rna | gtftk select_by_tx_size -m 14 | gtftk tabulate -n -k gene_id,transcript_id,feat_size - :shell: - - -**Arguments:** - -.. command-output:: gtftk select_by_tx_size -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -select_most_5p_tx -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Select the most 5' transcript of each gene. - -**Example:** - -.. command-output:: gtftk get_example | gtftk select_most_5p_tx | gtftk select_by_key -k feature -v transcript| gtftk tabulate -k gene_id,transcript_id - :shell: - -**Arguments:** - -.. command-output:: gtftk select_most_5p_tx -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -short_long -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Get the shortest or longest transcript of each gene - -**Example:** - -.. command-output:: gtftk get_example | gtftk short_long | gtftk select_by_key -k feature -v transcript| gtftk tabulate -k gene_id,transcript_id - :shell: - -**Arguments:** - -.. command-output:: gtftk short_long -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - - - -Commands from section 'convertion' ------------------------------------ - -convert -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** This command can be used to convert to various formats. Currently only a limited number is supported. - -* **bed**: classical bed6 format. -* **bed6**: classical bed6 format. -* **bed3**: bed3 format. - - -**Example:** Get the gene features and convert them to bed6. - -.. command-output:: gtftk get_example | gtftk select_by_key -k feature -v gene | gtftk convert -n gene_id -f bed6| head -n 3 - :shell: - - -**Arguments:** - -.. command-output:: gtftk convert -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -tabulate -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Extract key/values from the GTF and convert them to tabulated format. When requesting coordinates they will be provided in 1-based format. - - -**Example:** Simply get the list of transcripts and gene. - -.. command-output:: gtftk get_example -f gtf | gtftk select_by_key -k feature -v transcript| gtftk tabulate -k gene_id,transcript_id -s "|" - :shell: - -.. warning:: By default tabulate will discard any line for which one of the selected key is not defined. Use -x (--accept-undef) to print them. - - -**Arguments:** - -.. command-output:: gtftk tabulate -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - - -bed_to_gtf -~~~~~~~~~~~~~~~~~~~~~~ - - -**Description:** Convert a bed file to gtf-like format. - -**Example:** - -.. command-output:: gtftk get_example |gtftk convert| gtftk bed_to_gtf -t transcript | head -n 5 - :shell: - - -**Arguments:** - -.. command-output:: gtftk bed_to_gtf -h - :shell: - - ------------------------------------------------------------------------------------------------------------------- - - -convert_ensembl -~~~~~~~~~~~~~~~~~~~~~~ - - -**Description:** Convert the GTF file to ensembl format. Essentially add 'transcript'/'gene' features. - -**Example:** Delete gene and transcript feature. Regenerate them. - -.. command-output:: gtftk get_example | gtftk select_by_key -k feature -v gene,transcript -n| gtftk convert_ensembl | gtftk select_by_key -k gene_id -v G0001 - :shell: - - -**Arguments:** - -.. command-output:: gtftk bed_to_gtf -h - :shell: - - ------------------------------------------------------------------------------------------------------------------- - - -Commands from section 'annotation' ------------------------------------- - - -closest_genes -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Find the n closest genes for each transcript. - -**Example:** - -.. command-output:: gtftk get_example | bedtools sort | gtftk closest_genes -f - :shell: - - -**Arguments:** - -.. command-output:: gtftk closest_genes -h - :shell: - - -overlapping -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Find transcripts whose body/TSS/TTS region extended in 5' and 3' (-u/-d) overlaps with any transcript from another gene. Strandness is not considered by default. Used --invert-match to find those that do not overlap. If --annotate-gtf is used, all lines of the input GTF file will be printed and a new key containing the list of overlapping transcripts will be added to the transcript features/lines (key will be 'overlapping_*' with * one of body/TSS/TTS). The --annotate-gtf and --invert-match arguments are mutually exclusive. - - -**Example:** Find transcript whose promoter overlap transcript from other genes. - -.. command-output:: gtftk get_example -f chromInfo > simple_join_chromInfo.txt; gtftk get_example | gtftk overlapping -c simple_join_chromInfo.txt -t promoter -u 10 -d 10 -a | gtftk select_by_key -k feature -v transcript | gtftk tabulate -k transcript_id,overlap_promoter_u0.01k_d0.01k | head - :shell: - - -**Arguments:** - -.. command-output:: gtftk overlapping -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -divergent -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Find transcript with divergent promoters. These transcripts will be defined here -as those whose promoter region (defined by -u/-d) overlaps with the tss of -another gene in reverse/antisens orientation. This may be useful to select -coding genes in head-to-head orientation or LUAT as described in "Divergent -transcription is associated with promoters of transcriptional regulators" -(Lepoivre C, BMC Genomics, 2013). The ouput is a GTF with an additional key -('divergent') whose value is set to '.' if the gene has no antisens transcript -in its promoter region. If the gene has an antisens transcript in its promoter -region the 'divergent' key is set to the identifier of the transcript whose tss -is the closest relative to the considered promoter. The tss to tss distance is -also provided as an additional key (dist_to_divergent). - - -**Example:** Flag divergent transcripts in the example dataset. Select them and produce a tabulated output. - -.. command-output:: gtftk get_example -f chromInfo > simple_join_chromInfo.txt; gtftk get_example | gtftk divergent -c simple_join_chromInfo.txt -u 10 -d 10| gtftk select_by_key -k feature -v transcript | gtftk tabulate -k transcript_id,divergent,dist_to_divergent | head -n 7 - :shell: - -**Arguments:** - -.. command-output:: gtftk divergent -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -convergent -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Find transcript with convergent tts. These transcripts will be defined here -as those whose tts region (defined by -u/-d) overlaps with the tts of -another gene in reverse/antisens orientation. The ouput is a GTF with an -additional key ('convergent') whose value is set to '.' if the gene has no -convergent transcript in its tts region. If the gene has an antisens transcript -in its tts region the 'convergent' key is set to the identifier of the -transcript whose tts is the closest relative to the considered tts. -The tts to tts distance is also provided as an additional key (dist_to_convergent). - - -**Example:** Flag divergent transcripts in the example dataset. Select them and produce a tabulated output. - -.. command-output:: gtftk get_example -f chromInfo > simple_join_chromInfo.txt; gtftk get_example | gtftk convergent -c simple_join_chromInfo.txt -u 25 -d 25| gtftk select_by_key -k feature -v transcript | gtftk tabulate -k transcript_id,convergent,dist_to_convergent| head -n 4 - :shell: - -**Arguments:** - -.. command-output:: gtftk convergent -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -exon_sizes -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Add a new key to transcript features containing a comma separated list of exon sizes. - - -**Example:** - -.. command-output:: gtftk get_example | gtftk exon_sizes | gtftk select_by_key -t - :shell: - -**Arguments:** - -.. command-output:: gtftk exon_sizes -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - - -intron_sizes -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Add a new key to transcript features containing a comma separated list of intron sizes. - - -**Example:** - -.. command-output:: gtftk get_example | gtftk intron_sizes | gtftk select_by_key -t - :shell: - -**Arguments:** - -.. command-output:: gtftk intron_sizes -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - - -Commands from section 'coordinates' ------------------------------------ - -midpoints -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Get the genomic midpoint of each features: genes, transcripts, exons or introns. Output is currently in bed format only. - - -**Example:** Get mipoints of all transcripts and exons. - -.. command-output:: gtftk get_example | gtftk midpoints -t transcript,exon -n transcript_id,feature | head -n 5 - :shell: - - -**Arguments:** - -.. command-output:: gtftk midpoints -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -get_5p_3p_coords -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Get the 5p or 3p coordinates for each feature (e.g TSS or TTS for a transcript). -Output is bed format. - -**Example:** Get the 5p ends of transcripts and exons. - -.. command-output:: gtftk get_example | gtftk get_5p_3p_coords -t transcript,exon -n transcript_id,gene_id,feature | head -n 5 - :shell: - - -**Arguments:** - -.. command-output:: gtftk get_5p_3p_coords -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - - -intergenic -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Extract intergenic regions. This command requires a chromInfo file to compute -the bed file boundaries. The command will print the coordinates of genomic -regions without transcript features. - - -**Example:** Simply get intergenic regions. - -.. command-output:: gtftk get_example -f chromInfo > simple_join_chromInfo.txt; gtftk get_example | gtftk intergenic -c simple_join_chromInfo.txt - :shell: - -**Arguments:** - -.. command-output:: gtftk intergenic -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -intronic -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Returns a bed file containing the intronic regions. If by_transcript is false -(default), returns merged genic regions with no exonic overlap ("strict" mode). -Otherwise, the intronic regions corresponding to each transcript are returned -(may contain exonic overlap and redundancy). - -**Example:** Simply get intronic regions. - -.. command-output:: gtftk get_example | gtftk intronic | head -n 5 - :shell: - - -**Arguments:** - -.. command-output:: gtftk intronic -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - - -splicing_site -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Compute the locations of donor and acceptor splice sites. This command will return a single position which corresponds to the most 5' and/or the most 3' intronic region. If the gtf file does not contain exon numbering you can compute it using the -add_exon_nb command. The score column of the bed file contain the number of the closest exon relative to the splice site. - -**Example:** - -.. command-output:: gtftk get_example | gtftk add_exon_nb -k exon_nbr | gtftk splicing_site -k exon_nbr| head - :shell: - -**Arguments:** - -.. command-output:: gtftk splicing_site -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -shift -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Shift coordinates in 3' or 5' direction. - -**Example:** - -.. command-output:: gtftk get_example| head -n 1 - :shell: - -.. command-output:: gtftk get_example -f chromInfo > simple.chromInfo; gtftk get_example | gtftk shift -s -10 -c simple.chromInfo | head -n 1 - :shell: - - -**Arguments:** - -.. command-output:: gtftk shift -h - :shell: - - ------------------------------------------------------------------------------------------------------------------- - -Commands from section 'sequence' ---------------------------------- - - -get_tx_seq -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Get transcript sequences in fasta format. - -**Example:** Get sequences of transcripts in 5' to 3' orientation - -.. command-output:: gtftk get_example -f fa > simple.fa; gtftk get_example | gtftk get_tx_seq -g simple.fa | head -n 4 - :shell: - -Note that the format is rather flexible and any combination of key can be exported to the header. - -.. command-output:: gtftk get_example | gtftk get_tx_seq -g simple.fa -l gene_id,transcript_id,feature,chrom,start,end,strand | head -n 2 - :shell: - - -**Arguments:** - -.. command-output:: gtftk get_tx_seq -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - -get_feat_seq -~~~~~~~~~~~~~~~~~~~~~~ - -**Description:** Get feature sequence (e.g exon, UTR...). - - -**Example:** - -.. command-output:: gtftk get_feat_seq -i simple.gtf -g simple.fa -l feature,transcript_id,start -t exon -n | head -10 - :shell: - -**Arguments:** - -.. command-output:: gtftk get_feat_seq -h - :shell: - - ------------------------------------------------------------------------------------------------------------------- - - -Commands from section 'coverage' ----------------------------------- - -coverage -~~~~~~~~ - -**Description:** Takes a GTF as input to compute bigwig coverage in regions of interest (promoter, transcript body, intron, intron_by_tx, tts...) or a BED6 to focus on user-defined regions. If --n-highest is used the program will compute the coverage of each bigwig based on the average value of the n windows (--nb-window) with the highest coverage values. -Regions were signal can be computed (if GTF file as input) are promoter, tts, introns, intergenic regions or any feature available in the GTF file (transcript, exon, gene...). -If --matrix-out is selected, the signal for each bigwig will be provided in a dedicated column. Otherwise, signal for each bigwig is provided through a dedicated line. - - - **Example:** - -We will first request a lightweight example dataset (but more realistic than the 'simple' dataset). - - -.. command-output:: gtftk get_example -d mini_real_noov_rnd_tx -f '*' - :shell: - - -.. command-output:: gtftk get_example -d mini_real -f '*' - :shell: - - -Now we will compute coverage of promoters regions using 3 bigWig files as input. - - -.. command-output:: gtftk coverage -l H3K4me3,H3K79me2,H3K36me3 -u 5000 -d 5000 -i mini_real_noov_rnd_tx.gtf.gz -c hg38.genome -m transcript_id,gene_name -x ENCFF742FDS_H3K4me3_K562_sub.bw ENCFF947DVY_H3K79me2_K562_sub.bw ENCFF431HAA_H3K36me3_K562_sub.bw -k 4 > coverage.bed - :shell: - - -Now we can have a look at the result: - -.. command-output:: head -n 10 coverage.bed - :shell: - - -**Arguments:** - -.. command-output:: gtftk coverage -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - - -mk_matrix -~~~~~~~~~~ - -Description: Gtftk implements commands that can be used to produce coverage profiles around genomic features or inside user-defined regions. A coverage matrix need first to be produced from a bwig using the mk_matrix command. - -**Example:** - -We will used the same dataset (mini_real.gtf) as produced above (see help on *coverage* command). - -We can now create a coverage matrix around TSS/TTS or along the full transcript -(with or without 5' and 3' regions). Provide a BED file as *---inputfile* if you -want to use your own, user-specific, regions. -Will will create tree example datasets: - -First we will create a coverage matrix around promoter based on a subset of randomly choose transcripts (one per gene) from the 'mini_real' dataset (see section on the *coverage* command to get info about the construction of the *mini_real_noov_rnd_tx.gtf.gz* dataset). - -.. command-output:: gtftk get_example -f '*' -d mini_real - :shell: - - -.. command-output:: gtftk get_example -f '*' -d mini_real_noov_rnd_tx - :shell: - - -.. command-output:: gtftk mk_matrix -k 5 -i mini_real_noov_rnd_tx.gtf.gz -d 5000 -u 5000 -w 200 -c hg38.genome -l H3K4me3,H3K79me,H3K36me3 ENCFF742FDS_H3K4me3_K562_sub.bw ENCFF947DVY_H3K79me2_K562_sub.bw ENCFF431HAA_H3K36me3_K562_sub.bw -o mini_real_promoter - :shell: - - - -The following command compute coverage profil along the whole transcript. - - -.. command-output:: gtftk mk_matrix -k 5 --bin-around-frac 0.5 -i mini_real_noov_rnd_tx.gtf.gz -t transcript -d 5000 -u 5000 -w 200 -c hg38.genome -l H3K4me3,H3K79me,H3K36me3 ENCFF742FDS_H3K4me3_K562_sub.bw ENCFF947DVY_H3K79me2_K562_sub.bw ENCFF431HAA_H3K36me3_K562_sub.bw -o mini_real_tx - :shell: - - -.. command-output:: gtftk mk_matrix -h - :shell: - ------------------------------------------------------------------------------------------------------------------- - - -profile -~~~~~~~ - - -Description: This command is used to create profil diagrams from a *mk_matrix* output. The two important arguments for -this command are *---group-by*, that defines the variable controling the set of colored lines and *---facet-var* that defines the variable controling the way the plot is facetted . Both *---group-by* and *---facet-var* should be set to one of *bwig*, *tx_classes* or *chrom*. - - -**Basic profiles** - -A simple overlayed profile of all epigenetic marks around promoter. Here *---group-by* is, by default set to *bwig* and *---facet-var* is set to None. Thus a single plot with several lines corresponding to bwig coverage is obtained. - - - -.. command-output:: gtftk profile -D -i mini_real_promoter.zip -o profile_prom -pf png -if example_01.png - :shell: - -.. image:: _static/example_01.png - :width: 75% - :target: _static/example_01.png - -Changing colors and applying color order can be done using the following syntax: - - -.. command-output:: gtftk profile -D -i mini_real_promoter.zip -c 'red,blue,violet' -d H3K79me,H3K4me3,H3K36me3 -o profile_prom -pf png -if example_01b.png - :shell: - - -.. image:: _static/example_01b.png - :width: 75% - :target: _static/example_01b.png - - -Transcript coverage is obtained using the *mini_real_tx.zip* matrix. This provides a simple overlayed profile of all epigenetic marks along the transcript body extended in 5' and 3' regions: - -.. command-output:: gtftk profile -D -i mini_real_tx.zip -o profile_tx -pf png -if example_02.png - :shell: - - -.. image:: _static/example_02.png - :width: 75% - :target: _static/example_02.png - -**Faceted profiles** - -Faceted plot of epigenetic profiles. The groups (i.e colors/lines) can be set to bwig classes and the facets to transcript classes. Things can be simply done by providing an additional file containing the transcript and their associated classes. - - -**Example:** - - -.. command-output:: gtftk profile -D -i mini_real_promoter.zip -f tx_classes -g bwig -fo -t tx_classes.txt -o profile_prom -pf png -if example_05.png -e -V 2 -fc 2 - :shell: - - -.. image:: _static/example_05.png - :width: 75% - :target: _static/example_05.png - - -Alternatively, the groups can be set to chromosomes or transcript classes: - - -.. command-output:: gtftk profile -D -i mini_real_promoter.zip -g tx_classes -f bwig -fo -t tx_classes.txt -o profile_prom -pf png -if example_06.png -V 2 -nm ranging - :shell: - - -.. image:: _static/example_06.png - :width: 75% - :target: _static/example_06.png - - -.. command-output:: gtftk profile -D -i mini_real_promoter.zip -g chrom -f bwig -fo -t tx_classes.txt -o profile_prom -pf png -if example_06b.png -V 2 -nm ranging - :shell: - - -.. image:: _static/example_06b.png - :width: 75% - :target: _static/example_06b.png - - -Note that facets may also be associated to epigenetic marks. In this case each the --group-by can be set to *tx_classes* or *chrom*. - - -.. command-output:: gtftk profile -D -i mini_real_tx.zip -g tx_classes -t tx_classes.txt -f bwig -o profile_tx -pf png -if example_07.png -fo -w -nm ranging - :shell: - - -.. image:: _static/example_07.png - :width: 75% - :target: _static/example_07.png - - -.. command-output:: gtftk profile -D -i mini_real_tx.zip -g chrom -f bwig -o profile_tx -pf png -if example_08.png -fo -w -nm ranging - :shell: - - -.. image:: _static/example_08.png - :width: 75% - :target: _static/example_08.png - -.. command-output:: gtftk profile -h - :shell: - - ------------------------------------------------------------------------------------------------------------------- - - -Commands from section 'miscellaneous' -------------------------------------- - -control_list -~~~~~~~~~~~~~~~~~~~~~ - - -**Description:** Returns a list of gene matched for expression based on reference values. Based on a reference gene list (or more generally IDs) this command tries to extract a set of other genes/IDs matched for signal/expression. The --reference-gene-file contains the list of reference IDs while the --inputfile contains a tuple gene/signal for all genes. - -**Example:** - -.. command-output:: gtftk control_list -i mini_real_counts_ENCFF630HEX.tsv -r mini_real_control_1.txt -D -V 2 -s -l -p 1 -ju -if example_13.png -pf png - :shell: - - -.. image:: _static/example_13.png - :target: _static/example_13.png - - -**Arguments:** - -.. command-output:: gtftk control_list -h - :shell: - - -col_from_tab -~~~~~~~~~~~~~~~~~~~~~~ - - -**Description:** Select columns from a tabulated file based on their names. - -**Example:** - -.. command-output:: gtftk get_example | gtftk select_by_key -t | gtftk tabulate -k '*' -x | gtftk col_from_tab -c transcript_id,gene_id - :shell: - - -**Arguments:** - -.. command-output:: gtftk col_from_tab -h - :shell: \ No newline at end of file diff --git a/docs/source/selection.rst b/docs/source/selection.rst new file mode 100644 index 00000000..430d308d --- /dev/null +++ b/docs/source/selection.rst @@ -0,0 +1,251 @@ +Commands from section 'selection' +--------------------------------- + + +select_by_key +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Extract lines from the gtf based on key and values. + + +**Example:** Select some features (genes) then some gene_id. + +.. command-output:: gtftk get_example |gtftk select_by_key -k feature -v gene | gtftk select_by_key -k gene_id -v G0002,G0003,G0004 + :shell: + + +**Arguments:** + +.. command-output:: gtftk select_by_key -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +select_by_regexp +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Select lines by testing values of a particular key with a regular expression + +**Example:** Select lines corresponding to gene_names matching the regular expression 'G.*9$'. + +.. command-output:: gtftk get_example | gtftk select_by_regexp -k gene_id -r 'G.*9$' + :shell: + +**Arguments:** + +.. command-output:: gtftk select_by_regexp -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +select_by_intron_size +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Delete genes containing an intron whose size is below s. If -m is selected, any gene whose sum of intronic region length is above s is deleted. Monoexonic genes are kept. + +**Example:** Some genes having transcripts containing an intron whose size is below 80 nucleotides + +.. command-output:: gtftk get_example -d mini_real | gtftk select_by_intron_size -s 80 -vd | gtftk intron_sizes | gtftk tabulate -k gene_name,transcript_id,intron_sizes -Hun + :shell: + +**Arguments:** + +.. command-output:: gtftk select_by_regexp -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +select_by_max_exon_nb +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** For each gene select the transcript with the highest number of exons. + + +**Example:** Select lines corresponding to gene_names matching the regular expression 'BCL.*'. + +.. command-output:: gtftk get_example | gtftk select_by_max_exon_nb | gtftk select_by_key -t + :shell: + +**Arguments:** + +.. command-output:: gtftk select_by_max_exon_nb -h + :shell: + + +------------------------------------------------------------------------------------------------------------------ + +select_by_loc +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Select transcripts/gene overlapping a given locations. A transcript is defined here as the genomic region from TSS to TTS including introns. This function will return the transcript and all its associated elements (exons, utr,...) even if only a fraction (e.g intron) of the transcript is overlapping the feature. If -/-ft-type is set to 'gene' returns the gene and all its associated elements. + +**Example:** Select transcripts at a given location. + +.. command-output:: gtftk get_example | gtftk select_by_key -k feature -v transcript | gtftk select_by_loc -l chr1:10-15 + :shell: + +**Arguments:** + +.. command-output:: gtftk select_by_loc -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +select_by_nb_exon +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Select transcripts based on the number of exons. + +**Example:** + +.. command-output:: gtftk get_example | gtftk select_by_nb_exon -m 2 | gtftk nb_exons| gtftk select_by_key -t + :shell: + +**Arguments:** + +.. command-output:: gtftk select_by_nb_exon -h + :shell: + + +------------------------------------------------------------------------------------------------------------------ + + +select_by_numeric_value +~~~~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Select lines from a GTF file based on a boolean test on numeric values. + +**Example:** + +.. command-output:: gtftk join_attr -i simple.gtf -j simple.join_mat -k gene_id -m| gtftk select_by_numeric_value -t 'start < 10 and end > 10 and S1 == 0.5555 and S2 == 0.7' -n ".,?" + :shell: + +**Arguments:** + +.. command-output:: gtftk select_by_numeric_value -h + :shell: + + +------------------------------------------------------------------------------------------------------------------ + +random_list +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Select a random list of genes or transcripts. + +**Example:** Select randomly 3 transcripts. + +.. command-output:: gtftk get_example | gtftk random_list -n 3| gtftk count + :shell: + + +**Arguments:** + +.. command-output:: gtftk random_list -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +random_tx +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Select randomly up to m transcript for each gene. + +**Example:** Select randomly 1 transcript per gene (*-m 1*). + +.. command-output:: gtftk get_example | gtftk random_tx -m 1| gtftk select_by_key -k feature -v gene,transcript| gtftk tabulate -k gene_id,transcript_id + :shell: + +**Arguments:** + +.. command-output:: gtftk random_tx -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +rm_dup_tss +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** If several transcripts of a gene share the same tss, select only one. + +**Example:** Use rm_dup_tss to select transcripts that will be used for mk_matrix -k 5 (see later). + +.. command-output:: gtftk get_example | gtftk rm_dup_tss| gtftk select_by_key -k feature -v transcript + :shell: + + +**Arguments:** + +.. command-output:: gtftk rm_dup_tss -h + :shell: + + +------------------------------------------------------------------------------------------------------------------ + +select_by_go +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Select genes from a GTF file using a Gene Ontology ID (e.g GO:0050789). + +**Example:** Select genes with transcription factor activity from the GTF. They could be used subsequently to test their epigenetic features (see later). + +.. command-output:: # gtftk get_example -d mini_real -f gtf| gtftk select_by_go -s hsapiens | gtftk select_by_key -k feature -v gene | gtftk tabulate -k gene_id,gene_name -Hun | head -6 + :shell: + +**Arguments:** + +.. command-output:: gtftk select_by_go -h + :shell: + + +------------------------------------------------------------------------------------------------------------------ + +select_by_tx_size +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Select transcript based on their size (i.e size of mature/spliced transcript). + +**Example:** + +.. command-output:: gtftk get_example | gtftk feature_size -t mature_rna | gtftk select_by_tx_size -m 14 | gtftk tabulate -n -k gene_id,transcript_id,feat_size + :shell: + + +**Arguments:** + +.. command-output:: gtftk select_by_tx_size -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +select_most_5p_tx +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Select the most 5' transcript of each gene. + +**Example:** + +.. command-output:: gtftk get_example | gtftk select_most_5p_tx | gtftk select_by_key -k feature -v transcript| gtftk tabulate -k gene_id,transcript_id + :shell: + +**Arguments:** + +.. command-output:: gtftk select_most_5p_tx -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +short_long +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Get the shortest or longest transcript of each gene + +**Example:** + +.. command-output:: gtftk get_example | gtftk short_long | gtftk select_by_key -k feature -v transcript| gtftk tabulate -k gene_id,transcript_id + :shell: + +**Arguments:** + +.. command-output:: gtftk short_long -h + :shell: diff --git a/docs/source/sequence.rst b/docs/source/sequence.rst new file mode 100644 index 00000000..b5be6fe5 --- /dev/null +++ b/docs/source/sequence.rst @@ -0,0 +1,43 @@ +Commands from section 'sequence' +--------------------------------- + + +get_tx_seq +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Get transcript sequences in fasta format. + +**Example:** Get sequences of transcripts in 5' to 3' orientation + +.. command-output:: gtftk get_example -f fa > simple.fa; gtftk get_example | gtftk get_tx_seq -g simple.fa | head -n 4 + :shell: + +Note that the format is rather flexible and any combination of key can be exported to the header. + +.. command-output:: gtftk get_example | gtftk get_tx_seq -g simple.fa -l gene_id,transcript_id,feature,chrom,start,end,strand | head -n 2 + :shell: + + +**Arguments:** + +.. command-output:: gtftk get_tx_seq -h + :shell: + +------------------------------------------------------------------------------------------------------------------ + +get_feat_seq +~~~~~~~~~~~~~~~~~~~~~~ + +**Description:** Get feature sequence (e.g exon, UTR...). + + +**Example:** + +.. command-output:: gtftk get_feat_seq -i simple.gtf -g simple.fa -l feature,transcript_id,start -t exon -n | head -10 + :shell: + +**Arguments:** + +.. command-output:: gtftk get_feat_seq -h + :shell: + diff --git a/pygtftk/Line.py b/pygtftk/Line.py index a136da7b..c577d8e0 100644 --- a/pygtftk/Line.py +++ b/pygtftk/Line.py @@ -23,26 +23,10 @@ import pygtftk.utils import pygtftk.utils from pygtftk.utils import GTFtkError -from pygtftk.utils import PY3 from pygtftk.utils import write_properly ffi = FFI() -# --------------------------------------------------------------- -# Python2/3 compatibility -# --------------------------------------------------------------- - - -try: - basestring -except NameError: - basestring = str - -if PY3: - from io import IOBase - - file = IOBase - # --------------------------------------------------------------- # Classes FieldSet @@ -296,8 +280,10 @@ def __init__(self, ptr=None, alist=None): >>> from pygtftk.Line import Feature - >>> alist = ['chr1','Unknown','transcript', 100, 200] + >>> from pygtftk.utils import get_example_file + >>> from pygtftk.gtf_interface import GTF >>> from collections import OrderedDict + >>> alist = ['chr1','Unknown','transcript', 100, 200] >>> d = OrderedDict() >>> d['transcript_id'] = 'g1t1' >>> d['gene_id'] = 'g1' @@ -305,15 +291,10 @@ def __init__(self, ptr=None, alist=None): >>> a = Feature.from_list(alist) >>> assert a.get_tx_id() == 'g1t1' >>> assert a.get_gn_id() == 'g1' - >>> from pygtftk.utils import get_example_file - >>> import pygtftk - >>> from pygtftk.gtf_interface import GTF >>> a_file = get_example_file()[0] >>> a_gtf = GTF(a_file) >>> for i in a_gtf: pass - >>> assert type(i) == pygtftk.Line.Feature - - + >>> assert type(i) == Feature """ if ptr is not None: @@ -511,7 +492,7 @@ def format_tab(self, attr_list, sep="\t"): >>> assert feat.format_tab('transcript_id') == a """ - if isinstance(attr_list, basestring): + if isinstance(attr_list, str): attr_list = [attr_list] tok = list() @@ -580,7 +561,7 @@ def write_bed(self, pygtftk.utils.write_properly('\t'.join(token), outputfile) def write_gtf_to_bed6(self, - name=["transcript_id", "gene_id"], + name=("transcript_id", "gene_id"), sep="|", add_feature_type=False, outputfile=None): @@ -609,6 +590,11 @@ def write_gtf_to_bed6(self, """ + if isinstance(name, tuple): + name = list(name) + elif isinstance(name, str): + name = [name] + if pygtftk.utils.ADD_CHR == 1: chrom_out = "chr" + self.chrom else: @@ -840,7 +826,7 @@ def get_attr_value(self, attr_name, upon_none='continue'): """ - if isinstance(attr_name, basestring): + if isinstance(attr_name, str): attr_name = [attr_name] if not isinstance(attr_name, list): diff --git a/pygtftk/__init__.py b/pygtftk/__init__.py index 126b7d86..6b27d144 100644 --- a/pygtftk/__init__.py +++ b/pygtftk/__init__.py @@ -6,7 +6,7 @@ pygtftk.__NON_INTERACTIVE__ = False # ------------------------------------------------------------------------- -# We dont keep temp filesby default +# We dont keep temp files by default # ------------------------------------------------------------------------- pygtftk.__ARGS__ = dict() diff --git a/pygtftk/arg_formatter.py b/pygtftk/arg_formatter.py index d2d865c8..676c65f9 100644 --- a/pygtftk/arg_formatter.py +++ b/pygtftk/arg_formatter.py @@ -8,36 +8,20 @@ import argparse import glob +import io +import operator import os import re import sys -from builtins import object -from builtins import range from builtins import str -from collections import defaultdict +from functools import partial from pybedtools import BedTool -from pygtftk.utils import PY3 from pygtftk.utils import check_file_or_dir_exists from pygtftk.utils import chrom_info_as_dict from pygtftk.utils import message -# --------------------------------------------------------------- -# Python2/3 compatibility -# --------------------------------------------------------------- - - -try: - basestring -except NameError: - basestring = str - -if PY3: - from io import IOBase - - file = IOBase - # --------------------------------------------------------------- # ArgFormatter class @@ -86,7 +70,7 @@ def _get_help_string(self, action): if action.default is not argparse.SUPPRESS: defaulting_nargs = [argparse.OPTIONAL, argparse.ZERO_OR_MORE] if action.option_strings or action.nargs in defaulting_nargs: - if isinstance(action.default, file): + if isinstance(action.default, io.IOBase): help_str += ' (default: ' + \ str(action.default.name) + ')' else: @@ -153,8 +137,8 @@ def _format_usage(self, usage, actions, groups, prefix): positionals.append(action) # build full usage string - format = self._format_actions_usage - action_usage = format(optionals + positionals, groups) + format_fun = self._format_actions_usage + action_usage = format_fun(optionals + positionals, groups) usage = ' '.join([s for s in [prog, action_usage] if s]) # wrap the usage parts if it's too long @@ -163,8 +147,8 @@ def _format_usage(self, usage, actions, groups, prefix): # break usage into wrappable parts part_regexp = r'\(.*?\)+|\[.*?\]+|\S+' - opt_usage = format(optionals, groups) - pos_usage = format(positionals, groups) + opt_usage = format_fun(optionals, groups) + pos_usage = format_fun(positionals, groups) opt_parts = re.findall(part_regexp, opt_usage) pos_parts = re.findall(part_regexp, pos_usage) assert ' '.join(opt_parts) == opt_usage @@ -220,76 +204,75 @@ def get_lines(parts, indent, prefix=None): return '%s%s\n\n' % (prefix, usage) -class NumericRange(object): - """To be used in argparse. Ensure float is between start and end. - - :param start: lower range - :param end: upper range. - - :Example: - - >>> from pygtftk.arg_formatter import NumericRange - >>> assert 100 == NumericRange(100,200) - >>> assert 99 != NumericRange(100,200) - >>> assert 200 == NumericRange(100,200) - >>> assert 201 != NumericRange(100,200) - - """ - - def __init__(self, start, end): - self.start = start - self.end = end - - def __repr__(self): - msg = '{0} to {1}' - msg = msg.format(self.start, self.end) - return msg - - def __eq__(self, other): - return self.start <= other <= self.end +# --------------------------------------------------------------- +# Ensure a numeric is in range +# --------------------------------------------------------------- +def get_truth(inp, relate, cut): + ops = {'>': operator.gt, + '<': operator.lt, + '>=': operator.ge, + '<=': operator.le, + '=': operator.eq} + return ops[relate](inp, cut) -class NumericGreaterOrEqual(object): - """To be used in argparse. Ensure the numeric is greater or equal a define - value. - :param start: lower range +def ranged_num(lowest=-1, highest=1, val_type=("int", "float"), + linc=False, hinc=False): + """Check a numeric is in expected range. - :Example: + :param lowest: The lowest accepted value. + :param highest: The highest accepted value. + :param val_type: A float of int. + :param linc: The lowest value is included (<=). + :param hinc: The highest value is included (>=). - >>> from pygtftk.arg_formatter import NumericGreaterOrEqual - >>> assert str(NumericGreaterOrEqual(100)) == "100 or more" - >>> assert 100 == NumericGreaterOrEqual(100) - >>> assert 200 == NumericGreaterOrEqual(100) - >>> assert 20 != NumericGreaterOrEqual(100) """ - def __init__(self, start): - self.start = start + if linc: + lt = '<' + else: + lt = '<=' - def __repr__(self): - msg = '{0} or more' - msg = msg.format(str(self.start)) - return msg + if hinc: + gt = '>' + else: + gt = '>=' - def int(self): - return int(self.start) + def type_func(a_value): + if val_type == "int": + try: + a_value = int(a_value) + except: + raise argparse.ArgumentTypeError("Not an int.") + else: + try: + a_value = float(a_value) + except: + raise argparse.ArgumentTypeError("Not a float.") - def __eq__(self, other): - return int(other) >= int(self.start) + if lowest is None: + if highest is None: + return a_value + else: + if get_truth(a_value, gt, highest): + raise argparse.ArgumentTypeError("Value not in range.") + else: + if highest is None: + if get_truth(a_value, lt, lowest): + raise argparse.ArgumentTypeError("Value not in range.") + else: + if get_truth(a_value, lt, lowest) or get_truth(a_value, gt, highest): + raise argparse.ArgumentTypeError("Value not in range.") + return a_value -def int_ge_to_null(a_value): - """Check a numeric is an int greater or equal to 0.""" - try: - a_value = int(a_value) - except: - raise argparse.ArgumentTypeError("An integer with min value 1.") + return type_func - if a_value < 0: - raise argparse.ArgumentTypeError("Minimum value is 1.") - return a_value +# --------------------------------------------------------------- +# Check a numeric is an int greater than 0 +# --------------------------------------------------------------- def int_greater_than_null(a_value): """Check a numeric is an int greater than 0.""" @@ -302,126 +285,11 @@ def int_greater_than_null(a_value): return a_value -def int_greater_than_null_or_None(a_value): - """Check a numeric is an int greater than 0.""" - - if a_value is not None: - try: - a_value = int(a_value) - except: - raise argparse.ArgumentTypeError("An integer with min value 1.") - if a_value <= 0: - raise argparse.ArgumentTypeError("Minimum value is 1.") - return a_value - - -def float_greater_than_null(a_value): - """Check a numeric is a float greater than 0.""" - try: - a_value = float(a_value) - except: - raise argparse.ArgumentTypeError("Should be a float greater than 0.") - if a_value <= 0: - raise argparse.ArgumentTypeError("Should be a float greater than 0.") - return a_value - - -def float_grt_than_null_and_lwr_than_one(a_value): - """Check a numeric is a float greater than 0.""" - try: - a_value = float(a_value) - except: - raise argparse.ArgumentTypeError("Should be a float greater than 0.") - if a_value <= 0: - raise argparse.ArgumentTypeError("Should be a float greater than 0.") - if a_value > 1: - raise argparse.ArgumentTypeError( - "Should be a float lower or equal to 1.") - return a_value - - -class SeparatedList(object): - """To be used in argparse. Ensure this is a comma separated list of - the required type and required length. - - :param length: the required length. - :param type_arg: the required type. - :param sep: the separator. - :param check: also check that for two elements l[i] and l[+i] of the splited - list, 'l[i] op l[+i]' is True. The operator op can be one of ">", "<", "!=", - ">=" or ">=". - - :Example: - - >>> from pygtftk.arg_formatter import SeparatedList - >>> assert "1,2" == SeparatedList(length=2, type_arg=int, sep=",", check="<") - >>> assert "2,1" == SeparatedList(length=2, type_arg=int, sep=",", check=">") - >>> assert "2,1" == SeparatedList(length=2, type_arg=int, sep=",", check=None) - >>> assert "1-2" != SeparatedList(length=3, type_arg=int, sep="-") - """ - - def __init__(self, - length=2, - type_arg=int, - sep=",", - check=None): - self.length = length - self.type_arg = type_arg - self.sep = sep - self.check = check - - assert check in [">", "<", "!=", ">=", ">=", None] - - def __repr__(self): - sep = self.sep - if sep == " ": - sep = "space" - - msg = ': a separated list ("{2}") of {1} with {0} element(s)' - msg = msg.format(str(self.length), - re.sub("'.*", - "", - re.sub("^.*?'", - "", - str(self.type_arg))), sep) - if self.check is not None: - msg += ". Constrain: " + "list[i] " + self.check + "list[i + 1]." - - return msg - - def __eq__(self, other): - - assert isinstance(other, basestring) - other = other.split(self.sep) - - if self.type_arg == int: - try: - for i in range(len(other)): - other[i] = int(other[i]) - except: - return False - - if self.check is not None: - if len(other) > 1: - for i in range(len(other) - 1): - val_1 = other[i] - val_2 = other[i + 1] - to_test = str(val_1) + self.check + str(val_2) - - if not eval(to_test): - return False - - return len(other) == self.length - - -class NonChromFileError(Exception): - """ - Raised when we expect a chromosome file and did not get one - """ - pass - +# --------------------------------------------------------------- +# Check the chrom file format +# --------------------------------------------------------------- -class checkChromFile(argparse.Action): +class CheckChromFile(argparse.Action): """ Check the chromosome file exists and has the proper format. """ @@ -463,6 +331,11 @@ def __call__(self, setattr(namespace, self.dest, values) +# --------------------------------------------------------------- +# Returns chromfile as a dict +# --------------------------------------------------------------- + + class chromFileAsDict(argparse.Action): """ Check the chromosome file exists and has the proper format. @@ -505,9 +378,13 @@ def __call__(self, setattr(namespace, self.dest, values) -class bedFileList(argparse.Action): +# --------------------------------------------------------------- +# Check file is in bed6 format +# --------------------------------------------------------------- + +class bed6(argparse.Action): """ - Check these are bed files. + Check the BED file exist and has proper format. """ def __init__(self, @@ -540,122 +417,50 @@ def __call__(self, values, option_string=None): - values = values.split(",") - - for i in values: - - check_file_or_dir_exists(i) - - file_bo = BedTool(i) - try: - a = len(file_bo) - except IndexError: - msg = "Unable to load file: " + i + "." - message(msg, type="ERROR") - sys.exit() - - if len(file_bo) == 0: - msg = "It seems that file " + i.fn + " is empty." - message(msg, type="ERROR") - sys.exit() - - if file_bo.file_type != 'bed': - msg = "File {f} is not a valid bed file." - msg = msg.format(f=i.fn) - message(msg, type="ERROR") - sys.exit() - - values = [open(i, "r") for i in values] - - # Add the attribute - setattr(namespace, self.dest, values) - - -class bedFile(argparse.FileType): - """ - Check the BED file exist and has proper format. - """ - - def __init__(self, **kwargs): - - super(bedFile, self).__init__(**kwargs) - - def __call__(self, string): - - i = string - - check_file_or_dir_exists(i) - - try: - file_bo = BedTool(i) - a = len(file_bo) - except: - msg = "Unable to load file: " + i.fn + "." - message(msg, type="ERROR") - sys.exit() - - if len(file_bo) == 0: - msg = "It seems that file " + i.fn + " is empty." - message(msg, type="ERROR") - sys.exit() - - if file_bo.file_type != 'bed': - msg = "File {f} is not a valid bed file." - msg = msg.format(f=i.fn) - message(msg, type="ERROR") - sys.exit() - - return super(bedFile, self).__call__(string) - - -class bedFileWithUnambiguousNames(argparse.FileType): - """ - Check the BED file exist and has proper format. - """ - - def __init__(self, **kwargs): - - super(bedFileWithUnambiguousNames, self).__init__(**kwargs) - - def __call__(self, string): - - bedfile = string - - check_file_or_dir_exists(bedfile) + check_file_or_dir_exists(values) try: - file_bo = BedTool(bedfile) + file_bo = BedTool(values) a = len(file_bo) except: - msg = "Unable to load file: " + bedfile + "." + msg = "Unable to load file: " + values + "." message(msg, type="ERROR") sys.exit() if len(file_bo) == 0: - msg = "It seems that file " + bedfile + " is empty." + msg = "It seems that file " + values + " is empty." message(msg, type="ERROR") sys.exit() if file_bo.file_type != 'bed': msg = "File {f} is not a valid bed file." - msg = msg.format(f=bedfile) + msg = msg.format(f=values) message(msg, type="ERROR") sys.exit() - names = defaultdict(int) + names = set() for line in file_bo: - if len(line.fields) < 6: - message("Need a BED6 file.", type="ERROR") + if len(line.fields) != 6: + message("File -- " + values + " --Need a BED6 file.", type="ERROR") sys.exit() - names[line.name] += 1 - if names[line.name] > 1: - message("File -- " + bedfile + " -- Names (4th columns of the bed file) should be unambiguous.", + if line.strand not in ['-', '+', '.']: + message("File -- " + values + " -- strand is not in proper format", type="ERROR") + if line.name not in names: + names.add(line.name) + else: + message("File -- " + values + " -- Names (4th columns of the bed file) should be unambiguous.", type="ERROR") sys.exit() - return super(bedFileWithUnambiguousNames, self).__call__(string) + # Add the attribute + setattr(namespace, self.dest, values) + + +# --------------------------------------------------------------- +# Check all files exist in a glob +# --------------------------------------------------------------- class globbedFileList(argparse.Action): @@ -692,16 +497,27 @@ def __call__(self, namespace, values, option_string=None): - values = glob.glob(values) + + if "*" in values: + values = glob.glob(values) + else: + values = [values] check_file_or_dir_exists(values) + # values = [ io.TextIOWrapper(gzip.GzipFile(i, 'r')) if ".gz" in i else open(i, "r") for i in values] + values = [open(i, "r") for i in values] # Add the attribute setattr(namespace, self.dest, values) +# --------------------------------------------------------------- +# Check file extension +# --------------------------------------------------------------- + + class FileWithExtension(argparse.FileType): """ Declare and check file extensions. @@ -714,7 +530,7 @@ def __init__(self, mode='r', valid_extensions=None, **kwargs): def __call__(self, string): match = False if self.valid_extensions: - if isinstance(self.valid_extensions, basestring): + if isinstance(self.valid_extensions, str): if not string.endswith(self.valid_extensions): if re.search(self.valid_extensions, string): match = True @@ -731,7 +547,7 @@ def __call__(self, string): break if not match: - message('Not a valid filename extension', type="WARNING") + message('Not a valid filename extension :' + string, type="WARNING") message('Extension expected: ' + str(self.valid_extensions), type="ERROR") sys.exit() @@ -744,8 +560,57 @@ def __call__(self, string): os.makedirs(outputdir) # we will work with string - if PY3: - if 'w' in self._mode: - self._mode = 'w' + if 'w' in self._mode: + self._mode = 'w' return super(FileWithExtension, self).__call__(string) + + +# --------------------------------------------------------------- +# Pre-defined file types with extension constrains +# --------------------------------------------------------------- + + +# gtf +gtf_rwb = partial(FileWithExtension, valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$') + +# gtf file not gz +gtf_rw = partial(FileWithExtension, valid_extensions='\.[Gg][Tt][Ff]$') + +# gtf file or txt file +gtf_or_txt_rw = partial(FileWithExtension, valid_extensions=('\.[Gg][Tt][Ff]$', + '\.[Tt][Xx][Tt]', + '\.[Cc][Ss][Vv]', + '\.[Tt][Aa][Bb]', + '\.[Tt][Ss][Vv]')) + +# bed file not gz +bed_rw = partial(FileWithExtension, valid_extensions=('\.[Bb][Ee][Dd]$', + '\.[Bb][Ee][Dd]3$', + '\.[Bb][Ee][Dd]6$')) +# txt file +txt_rw = partial(FileWithExtension, valid_extensions=('\.[Tt][Xx][Tt]', + '\.[Cc][Ss][Vv]', + '\.[Dd][Ss][Vv]', + '\.[Tt][Aa][Bb]', + '\.[Tt][Ss][Vv]')) +# bigwig file +bw_rw = partial(FileWithExtension, valid_extensions=('\.[Bb][Ww]$', + '\.[Bb][Ii][Gg][Ww][Ii][Gg]$')) + +# bigwig file +gtf_or_bed_rwb = partial(FileWithExtension, valid_extensions=('\.[Gg][Tt][Ff](\.[Gg][Zz])?$', + '\.[Bb][Ee][Dd]$', + '\.[Bb][Ee][Dd]3$', + '\.[Bb][Ee][Dd]6$')) + +# fasta file +fasta_rw = partial(FileWithExtension, valid_extensions=('\.[Ff][Aa][Ss][Tt][Aa]$', + '\.[Ff][Nn][Aa]$', + '\.[Ff][Aa]$', + '\.[Ff][Aa][Ss]$', + '\.[Ff][Ff][Nn]$', + '\.[Ff][Rr][Nn]$')) + +# zip file +zip_rw = partial(FileWithExtension, valid_extensions='\.[Zz][Ii][Pp]$') diff --git a/pygtftk/biomart.py b/pygtftk/biomart.py index 504367af..3d9297db 100644 --- a/pygtftk/biomart.py +++ b/pygtftk/biomart.py @@ -2,7 +2,7 @@ import re import textwrap -import xml.etree.ElementTree as elmt_tree +import xml.etree.ElementTree as ElementTree from builtins import object from builtins import str from collections import defaultdict @@ -34,6 +34,7 @@ def __init__(self, self.databases = [] self.datasets = defaultdict(list) self._get_databases() + self.response = None def __repr__(self, *args, **kwargs): @@ -63,10 +64,10 @@ def _get_databases(self): message("Listing available databases", type="DEBUG") try: self.query(query={'type': 'registry'}) - except ConnectionError as err: + except ConnectionError: message("Raised a connection Error.", type="ERROR") - tree = elmt_tree.fromstring(self.response.content) + tree = ElementTree.fromstring(self.response.content) for child in tree: if child.tag == 'MartURLLocation': diff --git a/pygtftk/bwig/bw_coverage.py b/pygtftk/bwig/bw_coverage.py index a3ed012c..23ebe339 100644 --- a/pygtftk/bwig/bw_coverage.py +++ b/pygtftk/bwig/bw_coverage.py @@ -7,14 +7,16 @@ import os import pyBigWig import sys -from itertools import repeat - -import numpy as np from builtins import range from builtins import str from builtins import zip +from itertools import repeat +from tempfile import NamedTemporaryFile + +import numpy as np from pybedtools import BedTool +import pygtftk from pygtftk.utils import GTFtkError from pygtftk.utils import add_prefix_to_file from pygtftk.utils import close_properly @@ -23,6 +25,63 @@ from pygtftk.utils import make_tmp_file from pygtftk.utils import message +# ------------------------------------------------------------------------- +# TMP_FILE_POOL_MANAGER stores temporary file name +# make_tmp_file_pool is function that add temporary files to TMP_FILE_POOL_MANAGER +# TMP_FILE_POOL_MANAGER will be updated by workers (in contrast to a global +# variable) +# ------------------------------------------------------------------------- + +TMP_FILE_POOL_MANAGER = multiprocessing.Manager().list() + + +def make_tmp_file_pool(prefix='tmp', + suffix='', + store=True, + dir=None): + """ + This + + :Example: + + >>> from pygtftk.utils import make_tmp_file_pool + >>> tmp_file = make_tmp_file_pool() + >>> assert os.path.exists(tmp_file.name) + >>> tmp_file = make_tmp_file_pool(prefix="pref") + >>> assert os.path.exists(tmp_file.name) + >>> tmp_file = make_tmp_file_pool(suffix="suf") + >>> assert os.path.exists(tmp_file.name) + + """ + + dir_target = None + + if dir is None: + if pygtftk.utils.TMP_DIR is not None: + if not os.path.exists(pygtftk.utils.TMP_DIR): + msg = "Creating directory {d}." + message(msg.format(d=pygtftk.utils.TMP_DIR), type="INFO") + os.mkdir(pygtftk.utils.TMP_DIR) + dir_target = pygtftk.utils.TMP_DIR + + else: + if not os.path.exists(dir): + msg = "Creating directory {d}." + message(msg.format(d=dir), type="INFO") + os.mkdir(dir) + dir_target = dir + + tmp_file = NamedTemporaryFile(delete=False, + mode='w', + prefix=prefix + "_pygtftk_", + suffix=suffix, + dir=dir_target) + + if store: + TMP_FILE_POOL_MANAGER.append(tmp_file.name) + + return tmp_file + # ------------------------------------------------------------------------- # Define the job of a single worker whose job is to compute mean coverage @@ -57,8 +116,6 @@ def _big_wig_coverage_worker(input_values): :param verbose: run in verbose mode. """ - from pygtftk.utils import WARN_REGION_SIZE - from pygtftk.utils import WARN_UNDEF (span, bw_list, region_bed_file_name, @@ -75,7 +132,7 @@ def _big_wig_coverage_worker(input_values): else: if bin_nb < 1: bin_nb = 1 - matrix_file = make_tmp_file(prefix="worker_coverage_") + matrix_file = make_tmp_file_pool(prefix="worker_coverage_", suffix=".txt") for cpt, big_wig in enumerate(bw_list): @@ -106,15 +163,13 @@ def _big_wig_coverage_worker(input_values): nb += 1 if nb == nb_to_do: - message(str(multiprocessing.current_process().name) + - " has processed " + - str(nb) + - " regions") + p_name = str(multiprocessing.current_process().name) + message(p_name + " has processed " + str(nb) + " regions") if (i.end - i.start) < bin_nb: - if WARN_REGION_SIZE: - WARN_REGION_SIZE = False + if pygtftk.utils.WARN_REGION_SIZE: + pygtftk.utils.WARN_REGION_SIZE = False message("Encountered regions shorter than bin number.", type="WARNING") message(i.name + @@ -169,18 +224,19 @@ def _big_wig_coverage_worker(input_values): out = [pc if np.isnan(k) else k + pc for k in out] except: - if WARN_UNDEF: + if pygtftk.utils.WARN_UNDEF: + pygtftk.utils.WARN_UNDEF = False + mesg = "Encountered regions undefined in bigWig file." message(mesg, type="WARNING") - mesg = '%s:%s-%s' % (i.chrom, - str(i.start), str(i.end)) + mesg = '%s:%s-%s' % (i.chrom, str(i.start), str(i.end)) message(mesg) - WARN_UNDEF = False if zero_to_na: out = ['NA'] * bin_nb else: out = [pc] * bin_nb + # Prepare output if i.name in ["", "."]: name = "|".join([i.chrom, @@ -400,7 +456,6 @@ def bw_profile_mp(in_bed_file=None, repeat(stat), repeat(verbose))) - for res_file_list in pool.map_async(_big_wig_coverage_worker, argss).get(999999): diff --git a/pygtftk/cmd_manager.py b/pygtftk/cmd_manager.py index e8eeb16f..b3748237 100644 --- a/pygtftk/cmd_manager.py +++ b/pygtftk/cmd_manager.py @@ -7,7 +7,7 @@ import argparse import errno import glob -import imp +import io import logging import os import re @@ -19,7 +19,7 @@ from builtins import object from builtins import range from builtins import str -from subprocess import Popen, PIPE +from importlib.machinery import SourceFileLoader from sys import platform import cloudpickle @@ -31,26 +31,12 @@ import pygtftk.settings import pygtftk.utils from pygtftk.arg_formatter import ArgFormatter -from pygtftk.utils import PY2 -from pygtftk.utils import PY3 -from pygtftk.utils import add_r_lib -from pygtftk.utils import check_r_packages from pygtftk.utils import left_strip_str from pygtftk.utils import make_tmp_dir from pygtftk.utils import message from pygtftk.utils import mkdir_p -from pygtftk.utils import print_table from pygtftk.version import __version__ -# --------------------------------------------------------------- -# Python2/3 compatibility -# --------------------------------------------------------------- - -if PY3: - from io import IOBase - - file = IOBase - # --------------------------------------------------------------- # Changing argparse._SubParsersAction to allow subgroups of @@ -109,7 +95,6 @@ def __init__(self, option_strings, dest, nargs=None, **kwargs): option_strings, dest, **kwargs) def __call__(self, parser, namespace, values, option_string=None): - reload(pygtftk.settings) print(pygtftk.settings.get_completion_script()) sys.exit() @@ -131,35 +116,6 @@ def __call__(self, parser, namespace, values, option_string=None): sys.exit() -# --------------------------------------------------------------- -# An additional action that print required R libraries -# --------------------------------------------------------------- -# Deprecated - -class RequiredRLib(argparse._StoreTrueAction): - """A class to be used by argparser to get bash completion.""" - - def __init__(self, option_strings, dest, nargs=None, **kwargs): - super(RequiredRLib, self).__init__( - option_strings, dest, **kwargs) - - def __call__(self, parser, namespace, values, option_string=None): - - table = [] - table += [("Plugin", "R_library", "Found")] - print("") - - for i in pygtftk.utils.R_LIB: - for j in pygtftk.utils.R_LIB[i]: - found = check_r_packages([j], no_error=True) - if found: - table += [(i, j, "YES")] - else: - table += [(i, j, "NO")] - print_table(table) - sys.exit() - - # --------------------------------------------------------------- # An additional action to get all tests # --------------------------------------------------------------- @@ -343,16 +299,16 @@ def __call__(self, parser, namespace, values, option_string=None): # An additional action to get information about the environment # --------------------------------------------------------------- -class getSysInfo(argparse._StoreTrueAction): +class GetSysInfo(argparse._StoreTrueAction): """A class to be used by argparser to get information about the environment.""" def __init__(self, option_strings, dest, nargs='+', **kwargs): - super(getSysInfo, self).__init__(option_strings, dest, **kwargs) + super(GetSysInfo, self).__init__(option_strings, dest, **kwargs) def __call__(self, parser, namespace, values, option_string=None): from pandas import __version__ as pandas_ver from pybedtools import __version__ as pybedtools_ver - from pyBigWig import __version__ as pyBigWig_ver + from pyBigWig import __version__ as bigwig_ver from pygtftk import __path__ as pygtftk_path import subprocess from pygtftk.utils import chomp @@ -367,7 +323,7 @@ def __call__(self, parser, namespace, values, option_string=None): stdout=subprocess.PIPE).stdout.read().decode()) info_sys += ['- Bedtools version : ' + bedtools_ver] info_sys += ['- pybedtools version : ' + pybedtools_ver] - info_sys += ['- pyBigWig version : ' + pyBigWig_ver] + info_sys += ['- pyBigWig version : ' + bigwig_ver] info_sys += ['- uname : ' + str(os.uname())] print("\n".join(info_sys)) sys.exit() @@ -377,11 +333,11 @@ def __call__(self, parser, namespace, values, option_string=None): # An additional action to get plugin path # --------------------------------------------------------------- -class getPluginPath(argparse._StoreTrueAction): +class GetPluginPath(argparse._StoreTrueAction): """A class to be used by argparser to plugin path.""" def __init__(self, option_strings, dest, nargs='+', **kwargs): - super(getPluginPath, self).__init__(option_strings, dest, **kwargs) + super(GetPluginPath, self).__init__(option_strings, dest, **kwargs) def __call__(self, parser, namespace, values, option_string=None): print(CmdManager.config_dir) @@ -435,19 +391,11 @@ class CmdManager(object): """ - if PY2: - parser = argparse.ArgumentParser( - formatter_class=ArgFormatter, - description=prg_desc, - epilog="------------------------\n", - version='%(prog)s v{0}'.format(__version__) - ) - if PY3: - parser = argparse.ArgumentParser( - formatter_class=ArgFormatter, - description=prg_desc, - epilog="------------------------\n" - ) + parser = argparse.ArgumentParser( + formatter_class=ArgFormatter, + description=prg_desc, + epilog="------------------------\n" + ) parser._optionals.title = "Main command arguments" @@ -469,36 +417,16 @@ class CmdManager(object): parser.add_argument('-s', '--system-info', nargs=0, help="Display some info about the system.", - action=getSysInfo) + action=GetSysInfo) parser.add_argument('-d', '--plugin-path', nargs=0, help="Print plugin path", - action=getPluginPath) - - if PY3: - parser.add_argument('-v', '--version', - action='version', - version='%(prog)s v{0}'.format(__version__)) - - """ - parser.add_argument('-r', '--r-libs', - nargs=0, - help="Print required R libraries.", - action=RequiredRLib) - - - parser.add_argument('-a', '--add-plugin', - nargs=3, - help="Add plugins from a git repository: -a repository[,relative/path][,*.py].", - action=AddPlugin) + action=GetPluginPath) - parser.add_argument('-u', '--update-plugins', - nargs=0, - help="Enforce gtftk to search for new plugins in dedicated folders.", - action=UpdatePlugin) - - """ + parser.add_argument('-v', '--version', + action='version', + version='%(prog)s v{0}'.format(__version__)) parser.add_argument('-l', '--list-plugins', nargs=0, @@ -522,16 +450,11 @@ class CmdManager(object): # Declare subparser groups # geno_info, edition, selection, conversion, annotation, info, coverage, sequence - grp_editing = sub_parsers.add_parser_group( - '\n------- Editing --------\n') - grp_info = sub_parsers.add_parser_group( - '\n----- Information ------\n') - grp_select = sub_parsers.add_parser_group( - '\n------ Selection -------\n') - grp_convert = sub_parsers.add_parser_group( - '\n------ Conversion ------\n') - grp_annot = sub_parsers.add_parser_group( - '\n------ Annotation ------\n') + grp_editing = sub_parsers.add_parser_group('\n------- Editing --------\n') + grp_info = sub_parsers.add_parser_group('\n----- Information ------\n') + grp_select = sub_parsers.add_parser_group('\n------ Selection -------\n') + grp_convert = sub_parsers.add_parser_group('\n------ Conversion ------\n') + grp_annot = sub_parsers.add_parser_group('\n------ Annotation ------\n') grp_seq = sub_parsers.add_parser_group('\n------- Sequence -------\n') grp_coord = sub_parsers.add_parser_group('\n----- Coordinates ------\n') grp_cov = sub_parsers.add_parser_group('\n------- Coverage -------\n') @@ -770,91 +693,44 @@ def add_command(cls, cmd): # Update the global argument parser + arg_dict = {'name': cmd.name, + 'formatter_class': ArgFormatter, + 'parents': [cmd.parser], + 'help': cmd.message, + 'add_help': False, + 'description': cmd.desc} if cmd.group == 'editing': - cls.grp_editing.add_parser( - cmd.name, - formatter_class=ArgFormatter, - parents=[cmd.parser], - help=cmd.message, - add_help=False, - description=cmd.desc) + cls.grp_editing.add_parser(**arg_dict) elif cmd.group == 'information': - cls.grp_info.add_parser( - cmd.name, - formatter_class=ArgFormatter, - parents=[cmd.parser], - help=cmd.message, - add_help=False, - description=cmd.desc) + cls.grp_info.add_parser(**arg_dict) elif cmd.group == 'selection': - cls.grp_select.add_parser( - cmd.name, - formatter_class=ArgFormatter, - parents=[cmd.parser], - help=cmd.message, - add_help=False, - description=cmd.desc) + cls.grp_select.add_parser(**arg_dict) elif cmd.group == 'conversion': - cls.grp_convert.add_parser( - cmd.name, - formatter_class=ArgFormatter, - parents=[cmd.parser], - help=cmd.message, - add_help=False, - description=cmd.desc) + cls.grp_convert.add_parser(**arg_dict) elif cmd.group == 'coordinates': - cls.grp_coord.add_parser( - cmd.name, - formatter_class=ArgFormatter, - parents=[cmd.parser], - help=cmd.message, - add_help=False, - description=cmd.desc) + cls.grp_coord.add_parser(**arg_dict) elif cmd.group == 'annotation': - cls.grp_annot.add_parser( - cmd.name, - formatter_class=ArgFormatter, - parents=[cmd.parser], - help=cmd.message, - add_help=False, - description=cmd.desc) + cls.grp_annot.add_parser(**arg_dict) elif cmd.group == 'sequences': - cls.grp_seq.add_parser( - cmd.name, - formatter_class=ArgFormatter, - parents=[cmd.parser], - help=cmd.message, - add_help=False, - description=cmd.desc) + cls.grp_seq.add_parser(**arg_dict) elif cmd.group == 'coverage': - cls.grp_cov.add_parser( - cmd.name, - formatter_class=ArgFormatter, - parents=[cmd.parser], - help=cmd.message, - add_help=False, - description=cmd.desc) + cls.grp_cov.add_parser(**arg_dict) elif cmd.group == 'miscellaneous': - cls.grp_misc.add_parser( - cmd.name, - formatter_class=ArgFormatter, - parents=[cmd.parser], - help=cmd.message, - add_help=False, - description=cmd.desc) + cls.grp_misc.add_parser(**arg_dict) else: raise ValueError("Unknow group for commande : %s" % cmd.name) - def _find_plugins(self): + @staticmethod + def _find_plugins(): message("Searching plugins", force=True) config_file = CmdManager.config_file @@ -887,7 +763,8 @@ def _find_plugins(self): try: - imp.load_source(module_name, plug) + SourceFileLoader(module_name, plug).load_module() + except Exception as e: message("Failed to load plugin :" + plug, type="WARNING") print(e) @@ -906,10 +783,7 @@ def dump_plugins(self): message("Dumping plugins", force=True) - if PY2: - f_handler = open(CmdManager.dumped_plugin_path, "w") - if PY3: - f_handler = open(CmdManager.dumped_plugin_path, "wb") + f_handler = open(CmdManager.dumped_plugin_path, "wb") pick = cloudpickle.CloudPickler(f_handler) pick.dump((self.cmd_obj_list, self.parser)) @@ -934,25 +808,16 @@ def load_plugins(self): self._load_dumped_plugins() - def _load_dumped_plugins(self): + @staticmethod + def _load_dumped_plugins(): - if PY2: - f_handler = open(CmdManager.dumped_plugin_path, "r") - CmdManager.cmd_obj_list, CmdManager.parser = cloudpickle.load(f_handler) - if PY3: - f_handler = open(CmdManager.dumped_plugin_path, "rb") - CmdManager.cmd_obj_list, CmdManager.parser = cloudpickle.load(f_handler) + f_handler = open(CmdManager.dumped_plugin_path, "rb") + CmdManager.cmd_obj_list, CmdManager.parser = cloudpickle.load(f_handler) f_handler.close() for cur_cmd in sorted(CmdManager.cmd_obj_list): - # Update the list of required R libraries - - # message("Loading " + cur_cmd, type="DEBUG", force=True) - if CmdManager.cmd_obj_list[cur_cmd].rlib is not None: - add_r_lib(libs=CmdManager.cmd_obj_list[cur_cmd].rlib, - cmd=cur_cmd) - + # fix some issues related to dumping of the parser for cur_arg in CmdManager.cmd_obj_list[cur_cmd].parser._option_string_actions: obj = CmdManager.cmd_obj_list[ @@ -1016,7 +881,7 @@ def run(cls, args): # .pyc -> .py fun_path = cmd_ob.fun.rstrip("c") - tmp_module = imp.load_source('tmp_module', fun_path) + tmp_module = SourceFileLoader('tmp_module', fun_path).load_module() fun = getattr(tmp_module, args['command']) # Save args to log file @@ -1048,34 +913,14 @@ def run(cls, args): cmd_ob.logger.info("Command: " + " ".join(sys.argv)) cmd_ob.logger.info("Argument: " + 'command=' + args['command']) - del args['command'] - for key, value in list(args.items()): - if isinstance(value, file): + if isinstance(value, io.IOBase): value = value.name else: value = str(value) cmd_ob.logger.info("Argument: " + key + "=" + value) - try: - del args['command'] - except KeyError: - pass - - # Delete arg that won't be used by supparsers - for key_arg in ['bash_comp', 'add_chr', 'version', 'help', - 'plugin_tests', 'list_plugins', 'plugin_tests_no_conn', - 'r_libs', 'add_plugin', 'update_plugins', 'system_info', - 'plugin_path']: - try: - del args[key_arg] - except: - pass - - # Call the command function - if cmd_ob.lang == "Python": - # Set the level of verbosity # Can be None if -V is used without value # (nargs) @@ -1088,26 +933,20 @@ def run(cls, args): # output file if args['no_date']: pygtftk.utils.ADD_DATE = False - del args['no_date'] - del args['keep_all'] + arg_list_to_del = ['bash_comp', 'add_chr', 'version', 'help', + 'plugin_tests', 'list_plugins', 'plugin_tests_no_conn', + 'r_libs', 'add_plugin', 'update_plugins', 'system_info', + 'plugin_path', 'no_date', 'keep_all', 'logger_file', + 'tmp_dir', 'verbosity', 'command'] + for cur_arg in arg_list_to_del: + try: + del args[cur_arg] + except KeyError: + pass + # Run the command fun(**args) - elif cmd_ob.lang == "R": - - sys_cmd = "" - for k, a_value in list(args.items()): - - if a_value is not False and a_value is not True: - sys_cmd += " --" + k.replace("_", "-") + " " + str(a_value) - else: - sys_cmd += " --" + k.replace("_", "-") + " " - - sys_cmd = "Rscript " + cmd_ob.fun + " " + sys_cmd - shell_out = Popen(sys_cmd, shell=True, stdout=PIPE) - - for line in shell_out.stdout: - sys.stderr.write(line) else: raise ValueError("Unknow language.") diff --git a/pygtftk/cmd_object.py b/pygtftk/cmd_object.py index ff45fee5..11d1da92 100644 --- a/pygtftk/cmd_object.py +++ b/pygtftk/cmd_object.py @@ -8,6 +8,7 @@ from builtins import object from builtins import range +import pygtftk import pygtftk.cmd_manager diff --git a/pygtftk/data/mini_real_10M/chr1_hg38_10M.fa.gz b/pygtftk/data/mini_real_10M/chr1_hg38_10M.fa.gz new file mode 100644 index 00000000..3f8b904a Binary files /dev/null and b/pygtftk/data/mini_real_10M/chr1_hg38_10M.fa.gz differ diff --git a/pygtftk/data/mini_real_10M/expected_sequence_minus_exon.fa b/pygtftk/data/mini_real_10M/expected_sequence_minus_exon.fa new file mode 100644 index 00000000..b4a379e2 --- /dev/null +++ b/pygtftk/data/mini_real_10M/expected_sequence_minus_exon.fa @@ -0,0 +1,266 @@ +>ENSE00001611509 +ATCAAGTTCGAGAAAGACCTGAGGCGCATCTGGCTGAAGGCGGGGCTAAAGGAAGCCCCCGAAGGCTGGCAGACCCCCAAGATCTACCTGCGGGGCAAATGAGTCTGGCGCCGCCCTTCCCGCCCGTTGCTGCTGTGATCCGTAGTAATAAATTCTCAGAGGACTCAGCCTTT +>ENSE00001790281 +ATCAAGTTCGAGAAAGACCTGAGGCGCATCTGGCTGAAGGCGGGGCTAAAGGAAGCCCCCGAAGGCTGGCAGACCCCCAAGATCTACCTGCGGGGCAAATGAGTCTGGCGCCGCCCTTCCCGCCCGTTGCTGCTGTGATCCGTAGTAATAAATTCTCAGAGGACTCAGCCT +>ENSE00001842703 +ATCAAGTTCGAGAAAGACCTGAGGCGCATCTGGCTGAAGGCGGGGCTAAAGGAAGCCCCCGAAGGCTGGCAGACCCCCAAGATCTACCTGCGGGGCAAATGAGTCTGGCGCCGCCCTTCCCGCCCGTTGCTGCTGTGATCCGTAGTAATAAATTCTCAGAGGACTC +>ENSE00001629775 +GCGGCCGCCCGCCTTGGCCCGTCTCTGGAGTGCTGGGCAGCCGGGTCTGCGGGCCCCTTTACAGCACATCGCCGGCCGGCCCAGGTAGGGCGGCCTCTCTCCCTCGCAAGGGGGCCCAGCTGGAGCTGGAGGAGATGCTGGTCCCCAGGAAGATGTCCGTCAGCCCCCTGGAGAGCTGGCTCACGGCCCGCTGCTTCCTGCCCAGACTGGATACCGGGACCGCAGGGACTGTGGCTCCACCGCAATCCTACCAGTGTCCGCCCAGCCAGATAGGGGAAGGGGCCGAGCAGGGGGATGAAGGCGTCGCGGATGCGCCTCAAATTCAGTGCAAAAACGTGCTGAAGATCCGCCGGCGGAAGATGAACCACCACAAGTACCGGAAGCTGGTGAAGAAGACGCGGTTCCTGCGGAGGAAGGTCCAGGAGGGACGCCTGAGACGCAAGCAG +>ENSE00001922199 +CTCCCCTGGGACCTGTGGCCGCCGCCCACAGACCATGCTCCTGGGGCGCCTGACTTCCCAGCTGTTGAGGGCCGTTCCTTGGGCAGGTAGGAAGCCGCGCGGGGGCGGATGGGAGGATGCACACCTGGTTAGGAGTGCGGGTCTCAGCAGCTCCGCTGGGGCAGGGCCGGTGGCCACACACACACTCTTTCCCCTCTAAGCTTCCGATGCTCACAGAGGGAACCTCAGGGGTTCAGGCCAGGAATGAGGTGCGGGGGATCCTCGCTGGGACGAACCTGCTGCTCCTCAACCCGACGGGCCTGTGTGGTCTCGCGAGCGGTGACCGTGGCGTCTGGTTTTCTGCAGGCGGCCGCCCGCCTTGGCCCGTCTCTGGAGTGCTGGGCAGCCGGGTCTGCGGGCCCCTTTACAGCACATCGCCGGCCGGCCCAGGTAGGGCGGCCTCTCTCCCTCGCAAGGGGGCCCAGCTGGAGCTGGAGGAGATGCTGGTCCCCAGGAAGATGTCCGTCAGCCCCCTGGAGAGCTGGCTCACGGCCCGCTGCTTCCTGCC +>ENSE00001821535 +CTTCCGATGCTCACAGAGGGAACCTCAGGGGTTCAGGCCAGGAATGAGGTGCGGGGGATCCTCGCTGGGACGAACCTGCTGCTCCTCAACCCGACGGGCCTGTGTGGTCTCGCGAGCGGTGACCGTGGCGTCTGGTTTTCTGCAGGCGGCCGC +>ENSE00001789693 +CTCCCCTGGGACCTGTGGCCGCCGCCCACAGACCATGCTCCTGGGGCGCCTGACTTCCCAGCTGTTGAGGGCCGTTCCTTGGGCAG +>ENSE00001896016 +GTCGAGGTCGGGCTTGGGAAGGGTCAGCGGGAGGCCTGAGGGCGCCGGGCGCTGCGGCAGGCGGGCCCGGGGTCCAGCCGAGAGGGTCCGGGCGCCAGGCAACGCGATTCGCGCGGGGGTGAACCCGGGGAGGGGGCCGGCCTCCCCGTTCTGGGACCTTTCGGTGCGTCCGAGCGCGACACCGCCCGCGTCGGGGGCTTGGGAGCCTCGGGGCGCGAGCTGTGTTGGAAGCAAAGTCCTCCTTGTGGGTTGGGGTGGCGGAGGGAGAAGGGAAGCGAGGGTCGCGGCGGGACCAGACGCCCCAGTCCCGGCCCGCCCGCGACTACTGAAGGCGCTGCCGCCTGACCTGAACGGGCACTTGTGTTCCAGCTCCCCTGGGACCTGTGGCCGCCGCCCACAGACCATGCTCCTGGGGCGCCTGACTTCCCAGCTGTTGAGGGCCGTTCCTTGGGCAG +>ENSE00001223521 +CGAGGTCGGGCTTGGGAAGGGTCAGCGGGAGGCCTGAGGGCGCCGGGCGCTGCGGCAGGCGGGCCCGGGGTCCAGCCGAGAGGGTCCGGGCGCCAGGCAACGCGATTCGCGCGGGGGTGAACCCGGGGAGGGGGCCGGCCTCCCCGTTCTGGGACCTTTCGGTGCGTCCGAGCGCGACACCGCCCGCGTCGGGGGCTTGGGAGCCTCGGGGCGCGAGCTGTGTTGGAAGCAAAGTCCTCCTTGTGGGTTGGGGTGGCGGAGGGAGAAGGGAAGCGAGGGTCGCGGCGGGACCAGACGCCCCAGTCCCGGCCCGCCCGCGACTACTGAAGGCGCTGCCGCCTGACCTGAACGGGCACTTGTGTTCCAGCTCCCCTGGGACCTGTGGCCGCCGCCCACAGACCATGCTCCTGGGGCGCCTGACTTCCCAGCTGTTGAGGGCCGTTCCTTGGGCAG +>ENSE00001921648 +GGGAAGGGTCAGCGGGAGGCCTGAGGGCGCCGGGCGCTGCGGCAGGCGGGCCCGGGGTCCAGCCGAGAGGGTCCGGGCGCCAGGCAACGCGATTCGCGCGGGGGTGAACCCGGGGAGGGGGCCGGCCTCCCCGTTCTGGGACCTTTCG +>ENSE00001479025 +TCAATTTGAGCCGCGTCGAGGTCGGGCTTGGGAAGGGTCAGCGGGAGGCCTGAGGGCGCCGGGCGCTGCGGCAGGCGGGCCCGGGGTCCAGCCGAGAGGGTCCGGGCGCCAGGCAACGCGATTCGCGCGGGGGTGAACCCGGGGAGGGGGCCGGCCTCCCCGTTCTGGGACCTTTCG +>ENSE00001479027 +TTTGAGCCGCGTCGAGGTCGGGCTTGGGAAGGGTCAGCGGGAGGCCTGAGGGCGCCGGGCGCTGCGGCAGGCGGGCCCGGGGTCCAGCCGAGAGG +>ENSE00001697866 +GGAATCCGGCCCCTGGGTGGTCCGGAAACGATTCTGGACCTGCGGGTATATCCAGGGCCCGCACCCCCTGGGATTGTGGGAAATGTAGTTTTTTGCCTCCGTAAGGGACCAGGCGGAGCTGAGGAACCGCGCGAGGACTGGGACCGTGATTCCACTAACCGGAAACCGTCGCCTTTCGGGCCCGGCGGGGCCTGAGCCAATGCAGAATCGGGGGCCGCGAGGACGCCAGCGGGCGCTGTGCGTAGGAACCGCCGGGTGGCCGCTGCCGATCGGGGCCGACTTGGGGACGGACCGGAAGTGCCCGAGGGCGGCCGCAGAACGGTCAATTTGAGCCGCGTCGAG +>ENSE00001478064 +CCTACAGCTCCGTGCAGTACCCACTGGGCATGCGGTTGCCCCTGCCCTTTGGGGAGCTGGACCTGGACTCCATGGCTCCTCCTGCCTACAGCCTGTACACCCCGGAGCCTCCACCCTCCTACGATGAAGCTGTCAAGATGGCCAAGCCCAGAGAGGAAGGACCAGCACTCTCCCAGAAACCCAGCCCTCTCCTTGGGGCCTCGGGCCTAGAGACCACTCCAGTGCCCCAGGAGTCGGGCCCCAATACTCAACTACCACCTTGTAGCCCTGGTGCCCCTTGAAGGAGGTAGGAGAACGGACCAGAGCTTGGAGAACTAATGCTTGGAGCCAAGGGCCCCAGCCCACCCCACCGTCCCACACATTGCTGTGGCCCCAACCTCGGTGCCATGTTACACCGGCCCCTGGCGTCACCCACTAGGCAGGCTGCTGCTTTCAGCCTCAGCCCCTGGCCCAGCCCCAGCAGGCCCTCAGCCTGGAAGAGGCCCCTTGGGCCTAAGCCTCGGGTGGGAGCTCAGGGCCACCTGTGACGTCTGCATCTTCTTGGAGAGAGAATAAAGTTTGTATTTAAGTGGT +>ENSE00001754010 +CCTACAGCTCCGTGCAGTACCCACTGGGCATGCGGTTGCCCCTGCCCTTTGGGGAGCTGGACCTGGACTCCATGGCTCCTCCTGCCTACAGCCTGTACACCCCGGAGCCTCCACCCTCCTACGATGAAGCTGTCAAGATGGCCAAGCCCAGAGAGGAAGGACCAGCACTCTCCCAGAAACCCAGCCCTCTCCTTGGGGCCTCGGGCCTAGAGACCACTCCAGTGCCCCAGGAGTCGGGCCCCAATACTCAACTACCACCTTGTAGCCCTGGTGCCCCTTGAAGGAGGTAGGAGAACGGACCAGAGCTTGGAGAACTAATGCTTGGAGCCAAGGGCCCCAGCCCACCCCACCGTCCCACACATTGCTGTGGCCCCAACCTCGGTGCCATGTTACACCGGCCCCTGGCGTCACCCACTAGGCAGGCTGCTGCTTTCAGCCTCAGCCCCTGGCCCAGCCCCAGCAGGCCCTCAGCCTGGAAGAGGCCCCTTGGGCCTAAGCCTCGGGTGGGAGCTCAGGGCCACCTGTGACGTCTGCATCTTCTTGGAGAGAGAATAAAGTTTGTATTTAAGTGG +>ENSE00001478051 +CCTGTACACCCCGGAGCCTCCACCCTCCTACGATGAAGCTGTCAAGATGGCCAAGCCCAGAGAGGAAGGACCAGCACTCTCCCAGAAACCCAGCCCTCTCCTTGGGGCCTCGGGCCTAGAGACCACTCCAGTGCCCCAGGAGTCGGGCCCCAATACTCAACTACCACCTTGTAGCCCTGGTGCCCCTTGAAGGAGGTAGGAGAACGGACCAGAGCTTGGAGAACTAA +>ENSE00001810932 +CCTACAGCTCCGTGCAGTACCCACTGGGCATGCGGTTGCCCCTGCCCTTTGGGGAGCTGGACCTGGACTCCATGGCTCCTCCTGCCTACAGCCTGTACACCCCGGAGCCTCCACCCTCCTACGATGAAGCTGTCAAGATGGCCAAGCCCAGAGAGGAAGGACCAGCACTCTCCCAGAAACCCAGCCCTCTCCTTGGGGCCTCGGGCCTAGAGACCACTCCAGTGCC +>ENSE00003350147 +CCTACAGCTCCGTGCAGTACCCACTGGGCATGCGGTTGCCCCTGCCCTTTGGGGAGCTGGACCT +>ENSE00003428438 +GTGCCCGCCCCAGGCCCGCTGGAGCAGCCTGTGGCACGTGGGGTAAGTGGAGGCCGCGGCGGAGCCGTGCGTCCGACGGTTCTGGGGCGGGGGTCACCGGGGCCAGGCCCGCCAGGCCCTTACCTCACCAGGCCGCCTCCGCTGTCGCCCAGTCCCGGCCGCTGGCGGGAACTGACCTGGAGCAAGCAGGACCTTCCCTCCCACCTCTCCCGCCTGGCCTCCGCGGGAGTCCCCTACGATCCCGCTCAGCAGTGGGGCACTCGCTGAGGACAGCGAGTCCTGGGAGTGAGCCCAAGGCCACCCCTGGCCAGCCCAGGAGAGATAGCCAGGGCAGGCCCAGCAGCCCGAGGCCAGGCTCTGGCCACGGCGGTCTCCGACATGGAGAGACATTGTCTGCTTTTTATCCTGTTAACCTGTCTTCGGTGGTTGTGCCACGACATTCCCCAGGGTGCAGGTGCCCGGTGGCCGAGGGTCAGTCCAGTGGTAGAGCCTTGCTCTCCTAGGCTCATCCTGCTGGCGGTCCTCCTGCTTCTGCTGTGTGGTGTCACAGCTGGTTGTGTCCGGTTCTGCTGCCTCCGGAAGCAGGCACAGGCCCAGCCACATCTGCCACCAGCACGGCAGCCCTGCGACGTGGCAGTCATCCCTATGGACAGTGACAGCCCTGTACACAGCACTGTGACCT +>ENSE00003652520 +GCTCATCCTGCTGGCGGTCCTCCTGCTTCTGCTGTGTGGTGTCACAGCTGGTTGTGTCCGGTTCTGCTGCCTCCGGAAGCAGGCACAGGCCCAGCCACATCTGCCACCAGCACGGCAGCCCTGCGACGTGGCAGTCATCCCTATGGACAGTGACAGCCCTGTACACAGCACTGTGACCT +>ENSE00003675447 +GCTCATCCTGCTGGCGGTCCTCCTGCTTCTGCTGTGTGGTGTCACAGCTGGTTGTGTCCGGTTCTGCTGCCTCCGGAAGCAGGCACAGGCCCAGCCACATCTGCCACCAGCACGGCAGCCCTGCGACGTGGCAGTCATCCCTATGGACAGTGACAGCCCTGTACACAGCACTGTGACCT +>ENSE00001858191 +TCCGCTGTCGCCCAGTCCCGGCCGCTGGCGGGAACTGACCTGGAGCAAGCAGGACCTTCCCTCCCACCTCTCCCGCCTGGCCTCCGCGGGAGTCCCCTACGATCCCGCTCAGCAGTGGGGCACTCGCTGAGGACAGCGAGTCCTGGGAGTGAGCCCAAGGCCACCCCTGGCCAGCCCAGGAGAGATAGCCAGGGCAGGCCCAGCAGCCCGAGGCCAGGCTCTGGCCACGGCGGTCTCCGACATGGAGAGACATTGTCTGCTTTTTATCCTGTTAACCTGTCTTCGGTGGTTGTGCCACGACATTCCCCAGGGTGCAGGTGCCCGGTGGCCGAGGGTCAGTCCAGTGGTAGAGCCTTGCTCTCCTAGGCTCATCCTGCTGGCGGTCCTCCTGCTTCTGCTGTGTGGTGTCACAGCTGGTTGTGTCCGGTTCTGCTGCCTCCGGAAGCAGGCACAGGCCCAGCCACATCTGCCACCAGCACGGCAGCCCTGCGACGTGGCAGTCATCCCTATGGACAGTGACAGCCCTGTACACAGCACTGTGACCT +>ENSE00001682091 +GCTCATCCTGCTGGCGGTCCTCCTGCTTCTGCTGTGTGGTGTCACA +>ENSE00003599669 +GTGCCCGCCCCAGGCCCGCTGGAGCAGCCTGTGGCACGTGGG +>ENSE00003634508 +GTGCCCGCCCCAGGCCCGCTGGAGCAGCCTGTGGCACGTGGG +>ENSE00001937932 +GTGGCGCTGGGCTTCGCGGACGGCAGCTGCGACCCCTCGGACCAGTAAGTCGGGGGGGAGGGAGCCGGGGCCTGGCCCCGCCCTATGGGGAGGCACGGGTGGCGAGGTCGGCCGTCCCATGCCCCGCCTGCTCCAGGTGCCGCCGTCCCCACAGGTGCCCGCCCCAGGCCCGCTGGAGCAGCCTGTGGCACGTGGG +>ENSE00001767147 +GAGCATGGCCCGGGGGCCGCTGGCCGCCCGCGGACTGCGGCTGCTGCTGCCGCTCCTGCCGCTCCTGCCGCTCCTGCCGCTGCCGCAGGTGGGTCGGGCGGCGTTCTCTCTCGGTTCGGCCACCGCGGGGCGGGTCCCTGCTCGGACCACGCCCCTCCCGGGCTCACCCTTGTCCCCACAGGTGGCGCTGGGCTTCGCGGACGGCAGCTGCGACCCCTCGGACCA +>ENSE00001736550 +GGGGGCCGCTGGCCGCCCGCGGACTGCGGCTGCTGCTGCCGCTCCTGCCGCTCCTGCCGCTCCTGCCGCTGCCGCAGGTGGGTCGGGCGGCGTTCTCTCTCGGTTCGGCCACCGCGGGGCGGGTCCCTGCTCGGACCACGCCCCTCCCGGGCTCACCCTTGTCCCCACAGGTGGCGCTGGGCTTCGCGGACGGCAGCTGCGACCCCTCGGACCA +>ENSE00003473336 +GTGGCGCTGGGCTTCGCGGACGGCAGCTGCGACCCCTCGGACCA +>ENSE00003561172 +GTGGCGCTGGGCTTCGCGGACGGCAGCTGCGACCCCTCGGACCA +>ENSE00003343061 +GAGCATGGCCCGGGGGCCGCTGGCCGCCCGCGGACTGCGGCTGCTGCTGCCGCTCCTGCCGCTCCTGCCGCTCCTGCCGCTGCCGCAG +>ENSE00003293243 +AGAGCATGGCCCGGGGGCCGCTGGCCGCCCGCGGACTGCGGCTGCTGCTGCCGCTCCTGCCGCTCCTGCCGCTCCTGCCGCTGCCGCAG +>ENSE00001239803 +CTCAGAGCATGGCCCGGGGGCCGCTGGCCGCCCGCGGACTGCGGCTGCTGCTGCCGCTCCTGCCGCTCCTGCCGCTCCTGCCGCTGCCGCAG +>ENSE00003475992 +GTACTTCAACTCCCGCCCCCACCTGTGTCCCGCTGGCTCCTAAGCTGCCCCCCTACGTGTGGGTTGCGTCTGAGATGTGGGGCAGGCGCCACTCACGGAAAAAAGGCATCAGAGGAGCTTCCACATCATCGGAACATTTTATTCCTCAGGACGCTACACGCTCACTTTCCTGGCGGAGCAGGTCAGTGCATCGAGTTCTGTTTCCGTGGAAAATGTGCACCTTGGAAACCGCATGACAGCCCCCTCGGCAGGGTCCCCGCGGATCCGCCGCGACGCAGGCACAGCAGCAAGTTCCTCCAGCACGAAGCTGGCCTGCCCGGGCCCAGGTGTGAGGGACTGTTCTGCTCCCAGCAGCGCCCGCTGACGCTTCCCTCTGCGGTCTCGGCGCAAGCGTCTGTCCCTGGCCGCCCTCGGAGCCGTGCCCAGCCTGGCATGCATATGCGGTGGTTAAGGATACAGTTAAAGGGTCAATCACGCGTGTCCACGACAGAGACGCACGCGGCCTCACACCGACTCCTCGGTGGACAGCAATAATGGGTTGATATACTCAAAGCCTTCGAACTCTGACTGGTCGATCCTCTTTATGGCATCCCTGTGGGCAAAGGTGGCAGGGGGGAGGGGGGTGACCGTGTGTTCATTCCCTTGGGGGAAGCGGAGTCACGTTCGCATAAGAATCCTCCCCCAACGCCCACTGGAGAGATGACACCAGGCGGGTGGGACTCAAGGGCAGGCTGGGTCACCAGCTGCCCAAGGTGCCGGCCTGCCATGGGGCTGCCCGAGGGGTGCTCCAGGGACCCGCACCCAGTGGGACTCACTCATCGTCTGGGGTCAGCTGCACGGGCTCGCTGGTGAACTGTGTGTCAAAGTTGTCCAGACCGTAGTCGTCTGTGATCTGTGGCTGGAATGGAGGGAGCGCCTGCTTCTTCTCCAGCTTGGAAAAACAATAGGAGAAGGGTCAGCTCCGCGCGGGCATCATCCCTACCAGATTGAGTGTTTTGCACGCACTTCAATCACAAAATGAAACAGTGAGAAAGTCAGCATTTCAATCTGCCT +>ENSE00001817609 +GTACTTCAACTCCCGCCCCCACCTGTGTCCCGCTGGCTCCTAAGCTGCCCCCCTACGTGTGGGTTGCGTCTGAGATGTGGGGCAGGCGCCACTCACGGAAAAAAGGCATCAGAGGAGCTTCCACATCATCGGAACATTTTATTCCTCAGGACGCTACACGCTCACTTTCCTGGCGGAGCAGGTCAGTGCATCGAGTTCTGTTTCCGTGGAAAATGTGCACCTTGGAAACCGCATGACAGCCCCCTCGGCAGGGTCCCCGCGGATCCGCCGCGACGCAGGCACAGCAGCAAGTTCCTCCAGCACGAAGCTGGCCTGCCCGGGCCCAGGTGTGAGGGACTGTTCTGCTCCCAGCAGCGCCCGCTGACGCTTCCCTCTGCGGTCTCGGCGCAAGCGTCTGTCCCTGGCCGCCCTCGGAGCCGTGCCCAGCCTGGCATGCATATGCGGTGGTTAAGGATACAGTTAAAGGGTCAATCACGCGTGTCCACGACAGAGACGCACGCGGCCTCACACCGACTCCTCGGTGGACAGCAATAATGGGTTGATATACTCAAAGCCTTCGAACTCTGACTGGTCGATCCTCTTTATGGCATCCCTGTGGGCAAAGGTGGCAGGGGGGAGGGGGGTGACCGTGTGTTCATTCCCTTGGGGGAAGCGGAGTCACGTTCGCATAAGAATCCTCCCCCAACGCCCACTGGAGAGATGACACCAGGCGGGTGGGACTCAAGGGCAGGCTGGGTCACCAGCTGCCCAAGGTGCCGGCCTGCCATGGGGCTGCCCGAGGGGTGCTCCAGGGACCCGCACCCAGTGGGACTCACTCATCGTCTGGGGTCAGCTGCACGGGCTCGCTGGTGAACTGTGTGTCAAAGTTGTCCAGACCGTAGTCGTCTGTGATCTGTGGCTGGAATGGAGGGAGCGCCTGCTTCTTCTCCAGCTTGGAAAAACAATAGGAGAAGGGTCAGCTCCGCGCGGGCATCATCCCTACCAGATTGAGTGTTTTGCACGCACTTCAATCACAAAATGAAACAGTGAGAAAGTCAGCATTTCAATCTG +>ENSE00003589214 +GTACTTCAACTCCCGCCCCCACCTGTGTCCCGCTGGCTCCTAAGCTGCCCCCCTACGTGTGGGTTGCGTCTGAGATGTGGGGCAGGCGCCACTCACGGAAAAAAGGCATCAGAGGAGCTTCCACATCATCGGAACATTTTATTCCTCAGGACGCTACACGCTCACTTTCCTGGCGGAGCAGGTCAGTGCATCGAGTTCTGTTTCCGTGGAAAATGTGCACCTTGGAAACCGCATGACAGCCCCCTCGGCAGGGTCCCCGCGGATCCGCCGCGACGCAGGCACAGCAGCAAGTTCCTCCAGCACGAAGCTGGCCTGCCCGGGCCCAGGTGTGAGGGACTGTTCTGCTCCCAGCAGCGCCCGCTGACGCTTCCCTCTGCGGTCTCGGCGCAAGCGTCTGTCCCTGGCCGCCCTCGGAGCCGTGCCCAGCCTGGCATGCATATGCGGTGGTTAAGGATACAGTTAAAGGGTCAATCACGCGTGTCCACGACAGAGACGCACGCGGCCTCACACCGACTCCTCGGTGGACAGCAATAATGGGTTGATATACTCAAAGCCTTCGAACTCTGACTGGTCGATCCTCTTTATGGCATCCCTGTGGGCAAAGGTGGCAGGGGGGAGGGGGGTGACCGTGTGTTCATTCCCTTGGGGGAAGCGGAGTCACGTTCGCATAAGAATCCTCCCCCAACGCCCACTGGAGAGATGACACCAGGCGGGTGGGACTCAAGGGCAGGCTGGGTCACCAGCTGCCCAAGGTGCCGGCCTGCCATGGGGCTGCCCGAGGGGTGCTCCAGGGACCCGCACCCAGTGGGACTCACTCATCGTCTGGGGTCAGCTGCACGGGCTCGCTGGTGAACTGTGTGTCAAAGTTGTCCAGACCGTAGTCGTCTGTGATCTGTGGCTGGAATGGAGGGAGCGCCTGCTTCTTCTCCAGCTTGGAAAAACAATAGGAGAAGGGTCAGCTCCGCGCGGGCATCATCCCTACCAGATTGAGTGTTTTGCACGCACTTCAATCACAAAATGAAACAGTGAGAAAGTC +>ENSE00001635485 +GTACTTCAACTCCCGCCCCCACCTGTGTCCCGCTGGCTCCTAAGCTGCCCCCCTACGTGTGGGTTGCGTCTGAGATGTGGGGCAGGCGCCACTCACGGAAAAAAGGCATCAGAGGAGCTTCCACATCATCGGAACATTTTATTCCTCAGGACGCTACACGCTCACTTTCCTGGCGGAGCAGGTCAGTGCATCGAGTTCTGTTTCCGTGGAAAATGTGCACCTTGGAAACCGCATGACAGCCCCCTCGGCAGGGTCCCCGCGGATCCGCCGCGACGCAGGCACAGCAGCAAGTTCCTCCAGCACGAAGCTGGCCTGCCCGGGCCCAGGTGTGAGGGACTG +>ENSE00003459358 +CCACCAGCCGCACAATGGGGTGGAGCGGCCCCTGAGTCATGGAGGCCTGGGGTCTCTGCGCCTGGCCAAGAGGGCTGCGTGGCAATTTCCACACCTGTGCACCAGGCCTCACTCAGAGGCATGAGGTGGCGCGACCCCCTCTCCCAGGGAGCTCAGAAGACGGCTCTGCCACACCTGACACCTGGCAGCTGGCAGCCCTGCCTCTAGGAAGCCTCAGCTCTGGACAGCTGTGCCTTCACCTGAGGG +>ENSE00003626371 +TCTTTCATGGATGTGCAAGACTTTGAATGACCCTGGCAGTCAAGGGTGAGTGTCATCCACAGGAGAGCCGGCCAGCCACGGGCTCCATGGGCAGTTGCCCCGCACCACGCCCACGCAGGCCCACTGTGCAGCCCCCAAGTCACCAGAGTTTTCGAGAACCACTTCCAAAAGACACCGTCGTGACCGGAGCCATTAGCAAATATCAGGATTTTTCAAACCACACTTCAATACATCCTTCACTTTAATTTATAAAACAAATTACTGAATATAAAAGTCTCCCCTCTGATGAGCACAGCATTACTCACATATTGTGTACAAGAACGGCCAAACTGGTAACCGGCACGCTACTGGCAACACGGCAGTATTTAG +>ENSE00003526713 +TCTTTCATGGATGTGCAAGACTTTGAATGACCCTGGCAGTCAAGGGTGAGTGTCATCCACAGGAGAGCCGGCCAGCCACGGGCTCCATGGGCAGTTGCCCCGCACCACGCCCACGCAGGCCCACTGTGCAGCCCCCAAGTCACCAGAGTTTTCGAGAACCACTTCCAAAAGACACCGTCGTGACCGGAGCCATTAGCAAATATCAGGATTTTTCAAACCACACTTCAATACATCCTTCACTTTAATTTATAAAACAAATTACTGAATATAAAAGTCTCCCCTCTGATGAGCACAGCATTACTCACATATTGTGTACAAGAACGGCCAAACTGGTAACCGGCACGCTACTGGCAACACGGCAGTATTTAG +>ENSE00001862783 +GAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGTGAGTAGGCCACCCCTGCGCCCGGCCCGGTTATCCATCCGTGTTTGGAAACCACAGCCGTTCAGAAGGTCAAGAGGTGGCCGAGCTCAGCGCTGGCTTTTAAAGCCCTGTTTCACACTGGAAAGGTGGCCCAGTGCTGTGGCCTGGCATGTCCAGGTGGCTCTCTGTCACGGGTCTGGGGTCCACCTGCTTGCCGTGCTCTGTGGGCAGGGCAGGCTGGGGGCCCACAGAACAGCACAGAAGGAAGGCTGGGAGCACTGGCCCCGGGTCCACCTGGCCATCCTGGAATCTGGTGGCACCAGCGTCCCCAGGCCCAGAGCACAGGAACACCTTCCCGAGAGTGCGTCATGGGTTTTAAAAATGAAGATCGTCTTTTTTGTCTGGAGATGCTTTTTCTTATTTTTGAAACCCAACGTATATTTTTATGTATTTTTTAAGTAAAGGGGAATGGAACCCAGTTTTGCTAACAAGATAACCCAAACTGCCCAGTGCCTGGCCTTGTGTCTGGCGACCTCTGGGCCCTTGGCCTCCGGAGCAGGTCCTGGGGCTGGGGTGGTGTGAATGATGCTGGTTCGTAACTTTTGGTTGAGTTAATGGGCGGCAGGTTTCAGAGCTTATGGAGACCAGGTCCTTCAGTCATGCCTGATGCCCCTGGTCTTCCAGAAGCAAAAACAGCTCGGGAATGCGAAGGCACCGGAGTCCAAAGTTGGCAGCCAACAACAACAACAACAAAAGAAAAGGCCGGGCACGGTGGCTCACGCCTGTAATCCCAGCCCTTTGAGAGGCTGAGGCAGGTGGGTTGCTGGAGCCCAGGAGTTTGAGACCAGCCTGGGCAACATGGCAAGATCCCATCTTTACATGCCTGGGCGTGGTGGCGCGTGCCTGTGGTCCTAGCTACTCTGGAGGCTGAAGTGGGAGGATTCCCTTGAGCCAGGAATTGGAGGCTGTAGTGAAGTATGATTGCACCACTGCACTCCAGCCTGGGTGACAGAGTAAGACCCTGAATCACGGACAGAGGGTACTGTTGGGAGCCCTGGGGAGAAATCCATGCTCTTGGCTGAAGCTCTGAGATCCTTGTTGCTGTCAGGGTGCTGCCCCCCGCCCCCCGGGGAGGGGCTTTTGTCTTTGCATCGCCTGCTTTTCCAGATAGTCTAAAAAAAGACTTCTGAAGACAAGGACGTTCACGAGGAAAAACTTGCCATTTTGAGCTTTTTAAGCAGTTGCTGAAAGCTTGGCAGACTGCCTCAATTTTTCCTAAGTAGGCGTCAATGAAGTCAGGTCCAGGCCTTGGTGTGTCTGGAATGCTTCAAGCACATTCGAACACTTGATCGTAAGGGAGAGCCGGTACTTTGGAACCGGAACTCACCCGAGGCTGTGGCCACCGCATGGGCAGGCTAGCTGGGGGACAAGCCCCATATCTTTGGGAACAAGGGTTTGCACAGCCACCCTGGGATGCCCTGGGACTCCTGACCGCACAGGACCCCAGCAGGGAGGCCGCCTGGATTGGAGGGTCTGGTCTAACAGCCGGACTTGGTCTTGAACCGTCGCCCTGTCCCGCACAGGCGCCTGCTGAGCCTGGAGCCCTGGCAGAGGCGGGTCTGGGGAGTGGAGCTGCCAGGAGGCCTCCCATTTCTCACAGCCTTGGTGTTCTCCGGGTCACCCAGAGGACCGTCAAATGCTGGATTTGACAAACTATGTAGAATGTTCTTTGTGTCTTTAAGATCTTCTTGTGGTCCTATTTGGACATTTTGTGCATTTTCAGACACCTGCGGGTCACGTGGGTGGATGGGAAGCTGGGCACCTGGTGAGGGGTGAGGATGTTGAGAGCCAGAGCTGCGTTTTGTCTCTGTTGATGTGGCGAGGCCCTGGGTTGGTCACTGGGATTTTTTTTTTTTTTTGAGACGGTGTCTCGCTCTGTCGCCCAGGCTGGAGTGCAGTGGCATGATCTCGGCTCACTGCAACATCTGCCTCCCGGGTTCAAGCGATTCTCCTGCCTCAGTCTCCTGAGTAGCTGGGATTACAGGCGTCACCACACCTGGCTAATTTTTGTATTTTTAGTAGAGACAGGGTTTCACCATGTTGGTCAGGCTGGTCTTGAACTGATCTCAGGTGATCCGCCCGTCTCGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACCGCGCCCGGCCGGTCGTTGGGATTTTAACAGCCCTGAGGCCCCTCACGCTGCCAGGTGCCAGCCCACCCTGCAGCCCTGCTCCCCTGCCCACACGCAGAAGCCACCAGAGGCTTCTGGACTGAGCCCCCACTGTCCTGCAGCCGGGCTGGCCTGTCCACACCACAGGGCGTGCTCAGCTACTGAGCAGAAGCGTCACGGACAGGGCAGATCAGGCCAGGACAAAGCTCTTCCGCCACAGGCGGGGGTCTGAAGGCATCTCAGAGGGCCCCCAAACAAGGGACGCTGCCTGGAAACCCCGGGACAAGATGACCTCGGTTCAGATCTTAGCACCTTCTGGCAACCTTAGAGAAAGCTTCTGGAGGGAGGGGCTGGTTCCCAGGATGGGCAGAAGCCGGAAAGTCTCAGACTGAGTGACCCTCGGGGGCTTCAGAAGGCACTGGGTGGGCTCTGCCAGAGTGAGAAGGCAGCTGATGGCTGCTGGAGCCAGCCCCGGGAGTGGGGGTCCAGCTATGGTCTGGAGAGGGGGACTTGAGGGTTGCAGTGGCCACACAGACGGGGCACAGGAGCCAAAGGAAGGGACACAGCAAAGCCCAAGGGTAAAACGGCGCGCCGTGGACTGGTCTGAGGGCAGAGGCTGTAGGGGAGCGAGGGGCGGTGTGGCTGACAGGTGGACACAGGGACACGTGTCCTGTGGACTTGGCCGCTCAGTGGGGGTGTGTCCCCCAGCAGTGGCGTGTGAGGGATGGTCACTCTGATGGGACACTGACCACTTGGCCTCCAGCAAGATCTAGGCCCAAGTCTAGGCTGAAGCCGCCCACTCAGCCCCGGGACATCGTCCCCGGCAGCTCTGCTGAGCACGCCAGCTCCGGCACTCTCCGGGAGTCATGGCCGGAAGTCAACTGTCCTGGCTTCCAGGGCCACACCTTGGCCAGGCCTGGTGATGGTCATTTCCAGCCGCTCCAGTTGGGCTGATGGGGCCACATGAGGCCGGGGATAGAAGGTGGCTGCGCTCAGACACCCCTCCCGGCCCCACTGGATGCCCAGGGCGCTGACCTGCAGGACTCGGATGGGTTTTCTCCTGCCACCCCTGCCTGGCCGGCCACCATCCCAGCGCCAGCGCCCTCCTGAGAGGTGCAGGGGCCGCGTGGGGCCTCCCAGAGTGGCAGGTTGGCAGCCTGCACGCCGGTGACGGCGTCCTTCTCCGTGGTGAGGCTTGGTCCCTCCTCGCCAGAAACACCAATTCTCTGACGTGAGCTGCACATCCACTGCCCAGCCATGTTTACTCTTCTGCCTCCTGTAGACGCAGCCGCGGCGGCTCTCCCTGGCAGGCCACCCGCCGTCCTGCCTTTTCTCCGGGTCAGGCCGCCTGTCTGCCGGGCTCCACGATGAGCGCGTTCTCAAGCTGAGCAGGCGCCAGAATCCCATAGAGAGGCTTGTTGAGACACAGCTTCCCCACCCCCAGCTCGGACGCAGGGGCCTGGCGTGGCCTCCTCACGGGCACGGTGTGGAAACACCACTGGCGGTTACCGTGGTCTGCCGGGTGCATGAGCCCCTGGGGTGGCCCCGTCCCTTGTTTCTGACCAGCCGGATCCTCTCCAGCGGCAGGAGCAGAGAGGGCCCGGAGGTCCAGACGGTGCTCTCTGCGGCCAGCATGCCGCGGAGGTGGCCGAGTGAGTGTGGCCCCTCCCTTGCAGGCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGCGGGCTCCTGTCTGTCTCTGTGTTGTGATGAAACGTC +>ENSE00003569320 +GCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGCGGGCTCCTGTCTGTCTCTGTGTTGTGATGAAA +>ENSE00003681657 +GCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGCGGGCTCCTGTCTGTCTCTGTGTTGTGATGAAA +>ENSE00003483048 +GCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGCGGGCTCCTGTCTGTCTCTGTGTTGTGATGAAA +>ENSE00001951400 +GCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGCGGGCTCCTGTC +>ENSE00002033745 +GCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGC +>ENSE00003636009 +GCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTG +>ENSE00003529933 +GCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTG +>ENSE00001602311 +AAGCAAAAACAGCTCGGGAATGCGAAGGCACCGGAGTCCAAAGTTGGCAGCCAACAACAACAACAACAAAAGAAAAGGCCGGGCACGGTGGCTCACGCCTGTAATCCCAGCCCTTTGAGAGGCTGAGGCAGGTGGGTTGCTGGAGCCCAGGAGTTTGAGACCAGCCTGGGCAACATGGCAAGATCCCATCTTTACATGCCTGGGCGTGGTGGCGCGTGCCTGTGGTCCTAGCTACTCTGGAGGCTGAAGTGGGAGGATTCCCTTGAGCCAGGAATTGGAGGCTGTAGTGAAGTATGATTGCACCACTGCACTCCAGCCTGGGTGACAGAGTAAGACCCTGAATCACGGACAGAGGGTACTGTTGGGAGCCCTGGGGAGAAATCCATGCTCTTGGCTGAAGCTCTGAGATCCTTGTTGCTGTCAGGGTGCTGCCCCCCGCCCCCCGGGGAGGGGCTTTTGTCTTTGCATCGCCTGCTTTTCCAGATAGTCTAAAAAAAGACTTCTGAAGACAAGGACGTTCACGAGGAAAAACTTGCCATTTTGAGCTTTTTAAGCAGTTGCTGAAAGCTTGGCAGACTGCCTCAATTTTTCCTAAGTAGGCGTCAATGAAGTCAGGTCCAGGCCTTGGTGTGTCTGGAATGCTTCAAGCACATTCGAACACTTGATCGTAAGGGAGAGCCGGTACTTTGGAACCGGAACTCACCCGAGGCTGTGGCCACCGCATGGGCAGGCTAGCTGGGGGACAAGCCCCATATCTTTGGGAACAAGGGTTTGCACAGCCACCCTGGGATGCCCTGGGACTCCTGACCGCACAGGACCCCAGCAGGGAGGCCGCCTGGATTGGAGGGTCTGGTCTAACAGCCGGACTTGGTCTTGAACCGTCGCCCTGTCCCGCACAGGCGCCTGCTGAGCCTGGAGCCCTGGCAGAGGCGGGTCTGGGGAGTGGAGCTGCCAGGAGGCCTCCCATTTCTCACAGCCTTGGTGTTCTCCGGGTCACCCAGAGGACCGTCAAATGCTGGATTTGACAAACTATGTAGAATGTTCTTTGTGTCTTTAAGATCTTCTTGTGGTCCTA +>ENSE00001720216 +AAGCAAAAACAGCTCGGGAATGCGAAGGCACCGGAGTCCAAAGTTGGCAGCCAACAACAACAACAACAAAAGAAAAGGCCGGGCACGGTGGCTCACGCCTGTAATCCCAGCCCTTTGAGAGGCTGAGGCAGGTGGGTTGCTGGAGCCCAGGAGTTTGAGACCAGCCTGGGCAACATGGCAAGATCCCATCTTTACATGCCTGGGCGTGGTGGCGCGTGCCTGTGGTCCTAGCTACTCTGGAGGCTGAAGTGGGAGGATTCCCTTGAGCCAGGAATTGGAGGCTGTAGTGAAGTATGATTGCACCACTGCACTCCAGCCTGGGTGACAGA +>ENSE00003630334 +AAGCAAAAACAGCTCGGGAATGCGAAGGCACCGGAGTCCAAAGTTGGCAGCCAACAACAACAACAACAAAAGAAAAGGCCGGGCACGGTGGCTCACGCCTGTAATCCCAGCCCTTTGAGAGGCTGAGGCAG +>ENSE00003481862 +GAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAG +>ENSE00003510741 +GAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAG +>ENSE00003548540 +GAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAG +>ENSE00003634783 +GCCTTCTGGCGGCCGCCCCTGGTTTCTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAG +>ENSE00003467961 +GCCTTCTGGCGGCCGCCCCTGGTTTCTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAG +>ENSE00001841545 +CTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAG +>ENSE00001816369 +GCCCCAGGCCCTCCCGGGTCTCCCCACCATAGCGTTTCCGCTACTGAGTACCCCCTGTCTGCCCTCTCTGTCTGCCCCAGGCCTTCTGGCGGCCGCCCCTGGTTTCTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAG +>ENSE00003618179 +GGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGG +>ENSE00001545345 +TGGAGGCGGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGG +>ENSE00001822711 +TCACTTCCGCCCGGCGCGGGCTTGGATGGAGGCGGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGG +>ENSE00002226200 +CTCACTTCCGCCCGGCGCGGGCTTGGATGGAGGCGGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGG +>ENSE00001477870 +GATGGAGGCGGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGG +>ENSE00001816144 +GGATGGAGGCGGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGG +>ENSE00001720995 +CGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGG +>ENSE00002040955 +CGGGGTTTCACTATGTTGGCCAGGCTGGTCTAGAACTCCTGACCTCAAGTGATCTGCCCGCCTCGGCCTCCCAAAGTGCTGGGATTGCAGGCGTGAGACACTGCACCCGGACAATTTTCCTTTTCTTACAAGAACACTGCTCACACTGCATTCAGGGCCAACCCTAACCCAGTATCGCCTCATCCTGGTTTGATTATATCGGCACAGACCTTGCTTCCGAGCGAGGCCACTTTCTCAGGTACTGGTGGACATGAGTCTTCGGAGACGCTGCTCAACCCACAGTGCTCCTCCAGCTTGGTTTCTGTGACTTGCCTTCCCCAGAGGAGGGGTGCCCTGAGAGGTCTCCACTCCCTGACCGGCTCCTTGGTGCCGCGCACTCTGAGAGGCTTCCCAGGGAACAGAGCACACAGGACCGCCCTCCTGGGTAGACCAATCAGCATCTGAGCTCACAATTTCCCAGCAGGGCAGTGGGGTGGAGAGAGAAGCCTGGGCTGGGCTGGGCTGGGCTGGGCTGGGGAAGCTTCTCCGGGCGGGGGGACGTCAGAGCAGGATCTGGGGCTGATAAAAGCCCGCCCCTGGGTGGGGGCTGAGTGGTGCGGAAGCTGAGCCCGACACGTGGGGATGGAGGACAGGCTGTGGGAGGGTGTGAACCGGATACTGCTTGAAGGGGTGCTGGGGACTTTGAGAGAGGGCGGCTGGCCCTGTCTGGTCGGGGATGCTGGCCCAGACACAGGCCATGGCTGGGATGGGGTTCAGAAACAGGACCGCTGTCTCTCCCGGGCCAGGGCCCTCCCCAGCTGCTCCTGGCTTTCTGGTTCTTGGGGTCAGGGGCAGGCCTGTGCCATGACCCCGCCACTGAGGCTGTGAGGAGGCTGTCGGTGCCCAAGGGCACCAAGGCACACCCCTACTCTTGCACCCCATGTGTGGGCCCGAGCACCTGCTCTGCTGCCCCAAAGATCTGGCGATGTTTCCCAGGCAACTGTCTCTCACAGCCTGTCTGCCTGGCACTCCCGTATCCCATAAATGCCACCACATCTGGCTATGGGTGGGCGTGCCTGCCTGGCATCCACGGGCCAGCAGGTGTGGTGGAGCACAGCCCAGTTCCTGGCTGCGTCAGAAGGCTGCCCGGGCCTTTTGGCTGTCCTTGCCAGCAGGTGAGCACTGCCAGGGCACCGTGTGTGGGTGCTGGGCCATTTAGCCACATGGGAAGGGGTGGAGGCAGCCCAGTGCCTTCAGCATGTGCCCAGGGTGCCTGTCGGCCACAGGTCTCATTTGGAAATTGGGAGGGTGCACGGCCACCGGGCTGCTTAGGCCTGCCAGCCTCAGGGCCCGTCACCGCTGTCTTAGCCTGATTTGCAGGGTGTCAGCGCTGGGCAGAGATGAACATTTGGGTGACTCTGAGGATGCCAGTGGCTGGGACACTTGTTCTTCCGCGGTGGAAGGAGTTGGAGAGGCCTGGCTCCCTGACCTACGGCCAGCCTGGCTTCTGAAACCAGCTCAGTGGGCTGGGGCCTGATTCATCATCCATAAATGTGTCCTTTTTTGCCACAGAGGGTAAGGGGCCTCCTAGCCCACCGGTCTGCAGGTGCGGGAGTAGGAGATGGGTGGCTCTGATGCCCCCACCCACTCGATCACCTTCTGCTCTGCCTGGGATGCAAACTCCCACAGCTGAAACGTTCTTTTGTAAACATGAATTTTGGCTTAGAAAAAACTCATTTCCACTGTGCACGTGTCAGTCCCAACCAGAAATTATTTTCCAATAAAGCAAAACTCCGTCACCACAGCAGCAGATGGCTCCGAAGAAGTGGAGCGTTTTCATCAGGTTCAACTTTGAAACCTCCACCATCACCATCACCAGCACCGCTGTGTCATGCTGATAACTTGAGGACAGGCAGGACAAG +>ENSE00003615416 +CAAAACTCCGTCACCACAGCAGCAGATGGCTCCGAAGAAGTGGAGCGTTTTCATCAGGTTCAACTTTGAAACCTCCACCATCACCATCACCAGCACCGCTGTGTCATGCTGATAACTTGAGGACAGGCAGGACAAG +>ENSE00002044438 +CAAAACTCCGTCACCACAGCAGCAGATGGCTCCGAAGAAGTGGAGCGTTTTCATCAGGTTCAACTTTGAAACCTCCACCA +>ENSE00001853635 +GGGCAGCGAGGGAGGCGTTGGATGGAGCCACCCCACGGCTCCTCTGTGAAGGTCTGCACGTCACTCAGAAAGTTGAAGCAAACCAAGCAGGGTTGGAGCCCACAGTTCACAGCCGGCTGCACAGGGGATGCACCAAGCACAGTTTCCTATGACAAGTGGAAACCTGTGCGCCACAGGTGAGCTGGGTCCTGGAAGGTGCAGGGACCAGGCAGCATCTCATCTCAGGACATCAAGGGCTGTCCCCAGCCAGCAGATTTCCCATAAAAACGTGCTGAACTGGGGACAAAGCTGATTCTACAGAGCCGAGAAGCCAGACCTTCCCTGGGGACTCCCGAGGGGGTCCCAGCCACCCTCTCCACCTGCAGAGGTTTCCTGGCCCACTTGGAGGACCTTGGGGGATCCTCCAAGGGCCCCCTTCCAGCTCTTGGCCCATGGGGGAGCCTCTTCCTCAGCTCCGGGTGTGGTGGACAGGAGACCGAGGGCTCCCCGCACCCAGCTGGGCTCAGCGTTTTCAAGCTGAACTTGGTGCGTGGCGGCTTGGAAAGCCGGGAGCCTGCTGCGTGTCTCCTGGGGCTGCTGTGAAAAAATGACCACACACTGGGAGCCTAAAACGAGTGACATGTATATTCTCACAGTTCAGGCAGCTGGTGTCCAAAATCAGTGGTTGGGAGGGTGGAGCTCCGCCTAAAGGCTCTGGGTGGCTGCTGCCTGCCCCTTCCAGCCCCGGGCCCCCGGCATTCCCTGGCGTGCAGCTGCTCCACCCCCAACCCCAAAGCCTCCTTCCTGTGTCTCTGTGTCCAAATTTTCCTTACCTTTTTTTTTTTTTTTTTGAGATAGAGTTTTGCTCTTGTCGCCCAGGCTGGAGTGCAACAGCACGATCTCGGCCTATCGCAACCTCCGCCTCCTGGGTTCAAGCGATTCTCCTGCCTCAGCCTCCTAAGTAGCTGGGATTACAGGTGCCCACCACCACACCCAGCTAATTTTGTATCTTTAGTAGAGATGGGGTTTCACGATGTCTTTCAGGCTGGTCTCGAACTCCTGACCTCACATGATCCACCTGCCTCGGCCTCCCAAAGTGCTGAAATTACAGGCATGAGCCACAGCACCTGGCCAATTTTCCTTTTCTTTCTCTCTCTCTTTTTTTTTTGAGACGGAGTCTTGCTCTGTTGCCCAGGCTGGAGTAAAATGGCACAATCTTGGCTCACTGCAACCTCTGCCTTCTGGGTTCAAGCGATTCTCCTGCCTCAGCCTCCCGAGTAGCTGAGACTACAGGCGCCCACCACCACACCCAGCTAATTTTTGTGTTTTTTAGTAGAGACGGGGTTTCACTATGTTGGCCAGGCTGGTCTAGAACTCCTGACCTCAAGTGATCTGCCCGCCTCGGCCTCCCAAAGTGCTGGGATTGCAGGCGTGAGACACTGCACCCGGACAATTTTCCTTTTCTTACAAGAACACTGCTCACACTGCATTCAGGGCCAACCCTAACCCAGTATCGCCTCATCCTGGTTTGATTATATCGGCACAGACCTTGCTTCCGAGCGAGGCCACTTTCTCAGGTACTGGTGGACATGAGTCTTCGGAGACGCTGCTCAACCCACAGTGCTCCTCCAGCTTGGTTTCTGTGACTTGCCTTCCCCAGAGGAGGGGTGCCCTGAGAGGTCTCCACTCCCTGACCGGCTCCTTGGTGCCGCGCACTCTGAGAGGCTTCCCAGGGAACAGAGCACACAGGACCGCCCTCCTGGGTAGACCAATCAGCATCTGAGCTCACAATTTCCCAGCAGGGCAGTGGGGTGGAGAGAGAAGCCTGGGCTGGGCTGGGCTGGGCTGGGCTGGGGAAGCTTCTCCGGGCGGGGGGACGTCAGAGCAGGATCTGGGGCTGATAAAAGCCCGCCCCTGGGTGGGGGCTGAGTGGTGCGGAAGCTGAGCCCGACACGTGGGGATGGAGGACAGGCTGTGGGAGGGTGTGAACCGGATACTGCTTGAAGGGGTGCTGGGGACTTTGAGAGAGGGCGGCTGGCCCTGTCTGGTCGGGGATGCTGGCCCAGACACAGGCCATGGCTGGGATGGGGTTCAGAAACAGGACCGCTGTCTCTCCCGGGCCAGGGCCCTCCCCAGCTGCTCCTGGCTTTCTGGTTCTTGGGGTCAGGGGCAGGCCTGTGCCATGACCCCGCCACTGAGGCTGTGAGGAGGCTGTCGGTGCCCAAGGGCACCAAGGCACACCCCTACTCTTGCACCCCATGTGTGGGCCCGAGCACCTGCTCTGCTGCCCCAAAGATCTGGCGATGTTTCCCAGGCAACTGTCTCTCACAGCCTGTCTGCCTGGCACTCCCGTATCCCATAAATGCCACCACATCTGGCTATGGGTGGGCGTGCCTGCCTGGCATCCACGGGCCAGCAGGTGTGGTGGAGCACAGCCCAGTTCCTGGCTGCGTCAGAAGGCTGCCCGGGCCTTTTGGCTGTCCTTGCCAGCAG +>ENSE00001859055 +GGGCAGCGAGGGAGGCGTTGGATGGAGCCACCCCACGGCTCCTCTGTGAAGGTCTGCACGTCACTCAGAAAGTTGAAGCAAACCAAGCAGGGTTGGAGCCCACAGTTCACAGCCGGCTGCACAGGGGATGCACCAAGCACAGTTTCCTATGACAAGTGGAAACCTGTGCGCCACAG +>ENSE00002034769 +CCGCTCACTGTCATGACAAGTGGACAGATGCCCCGGGCCTCAGTTGACCCATCTGTAAGTGGGGCCACGCGACAGCACCTCTGTCACAGGGCTGGGTGTGGGGTGAACAGGCTGGTCCCTGGAGGCAAGTAGTGTGGTGCCCTGAGGCCTGAGGCCAGGCTCCAGGACCGCTCAAGGAACAGGGGATTTGAGGCAACTCAGAGAGGACAGGCCCAGCAGCCGGCCCCAGCCTGATATCTTCCCTCCGCTCAGGCCCCAGACGCAGCTGCATCCTGGAGTCCTTCTGAGAAATGTGGGACCTGCCCCAGCTCCACCCCAGGTGAGGGGCACCAGCCAGCTCCAGAGCTGCCTACCTTCCCTGTCAGGTGCACAGGTCAGCGCCAGGCCAACCCCAGAGCGAGAACACCTGTGCTGGACTGAGCTGGAGCAGCAGGGTGGCCTGCACCG +>ENSE00001916683 +GCCCCAGACGCAGCTGCATCCTGGAGTCCTTCTGAGAAATGTGGGACCTGCCCCAGCTCCACCCCAGGTGAGGGGCACCAGCCAGCTCCAGAGCTGCCTACCTTCCCTGTCAGGTGCACAGGTCAGCGCCAGGCCAACCCCAGAGCGAGAACACCTGTGCTGGACTGAGCTGGAGCAGCAGGGTGGCCTGCACCG +>ENSE00001937728 +GCCCCAGACGCAGCTGCATCCTGGAGTCCTTCTGAGAAATGTGGGACCTGCCCCAGCTCCACCCCAG +>ENSE00001845014 +CCCAGGGCGTCTGTCACAGCTTTCCAATCCATGAGCCCATCAATCGGACTGGACACAGATAAACTGGGACAGGACGCCGGGTGGCAAAGGCCGGGAGAGCTGGGCCACTCCCTCCAAAAG +>ENSE00001908868 +TAGAGACAGGGTTTCACCGTGTTAGCCAGGATGGTCTCGATCTCCTGACCTCGTGATCCGCCCGCCTCGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACCACGCCCGGCCCCCAGAGCCTTAGTCTCAGAATCACACCCACCCCACG +>ENSE00001934415 +CTTTTGTGGGGTCAGTGCCCACAGGGTTGAGCACCACGTGCCTGGCTGGGCAGTGCTCCTGCCAGGGTCCCCTTCTCCACTGTAGGAAACACGGCTGCTCCTGCAGCCGCGTCTGCTCTGCTGCATCTCCAGCTCCTGCCAGGCATGGTGTGCGCGGCCCCAAGACAGGGAGTTTCCA +>ENSE00001714381 +AGATCCAAGGCCTGTGGGCCACGGCTGCGCCTCTCCTGACTCCAGCTTGCCCGTCTGTCCTTGGGGGCAGCGTCCTTCCTTCTCTCGGCCCCTTGGAGCAGCTCTGCGGGAACCCCACAGCAGCCCAGCGGATTGAACGCAAAAGACAGCCACCCTCCTGCTCCGGATCCTGGGAGGAGGCTACACGCTGGCGCTGAGACAGCAACCTGCCTGGCCTGGGAAGCCCCCCGCAGCCCCTACATCAGAAGCTTGCTCTTGGCGCAGTGGCTCACGCCTGTAATCCCAGCA +>ENSE00001821386 +AGATCCAAGGCCTGTGGGCCACGGCTGCGCCTCTCCTGACTCCAGCTTGCCCGTCTGTCCTTGGGGGCAGCGTCCTTCCTTCTCTCG +>ENSE00001724829 +CCTTTCCTGCCGCCCAGGCCTTGGAG +>ENSE00001927358 +GAACATGGATGCCTCGCTTTTCAGAGACTCGCGTTCTTGGAACTTACACCCTTTTGGGTTTGCTATTTTTACCCACCCTGAGCCTTCCGGTCTCCATGGCGACGCCTCCAAACAGCAGATTCCAGGCGGCAATGACGTCATCTCTCCCTTTCCTGCCGCCCAGGCCTTGGAG +>ENSE00001755234 +ACAACATTCCCAATGCCGTCTGGGTCTGGGACATTCAGAAGCTGAGGCTGTTCGCGGTGCTCGAGCAGCTGTCCCCAGTGCGCGCATTTCAGTGGGACCCGCAGCAGCCGCGGCTGGCCATCTGCACGGGAGGCAGCAGGCTCTACCTGTGGTCCCCAGCGGGCTGCATGTCGGTGCAGGTGCCTGGGGAAGGTAAGCACATCCCCGAGGCCACGGACGTGGCAGCCTTGCTGTGTGCAGTCTGGCATCACACGGGCTGAACTGTTGAAGCCCAGCTGCTGTCTCCGGCAGCACTCCAGGGAAACTGCCCTCAGAGTCTTTGCGTAAACCTCAAGACGGACACACAGGGGACCCGCTGCCCTCAGCTTTATGGGCTAGAAGCAGCCTCTCCCTGACTTGAGGCAGCTCTGGGGCTCCACCCTGGCTCTGCCTATGTGGGTCACTCCAGGCACTGTGCTGGCCTGCAGGACAAGGGGGTGCCCATCCCCCAGAATCTGGGCCTCCCCTGCTGTAATCCTCTGGCCACCTGTCTCTCTCTAGGCGACTTTGCAGTGCTCTCTCTGTGCTGGCATTTAAGCGGAGACTCGATGGCCCTCCTCAGCAAGGATCACTTCTGCCTCTGCTTCCTGGAGACAGAGGCAGTGGTCGGCACAGCCTGCAGACAGCTGGGCGGCCACACGTAGCAGCGGTGCACTAACGTGTGCAGAAACAGGGCTACTCTGTGTTTCCAGTGTGGGAAAAAACACAGCTTCACCAGGAGGTTCTCCACTGTGGTGGTCTGGATTCAGTGATTGATTCTATTTTTCTATAGCAAAGCATTTTTGTAAATATGTATGGTATAAAACTGTAGTTTTATTATTTAAAATAAATACTTGCTGATTTATACAACTA +>ENSE00001697450 +GCGACTTTGCAGTGCTCTCTCTGTGCTGGCATTTAAGCGGAGACTCGATGGCCCTCCTCAGCAAGGATCACTTCTGCCTCTGCTTCCTGGAGACAGAGGCAGTGGTCGGCACAGCCTGCAGACAGCTGGGCGGCCACACGTAGCAGCGGTGCACTAACGTGTGCAGAAACAGGGCTACTCTGTGTTTCCAGTGTGGGAAAAAACACAGCTTCACCAGGAGGTTCTCCACTGTGGTGGTCTGGATTCAGTGATTGATTCTATTTTTCTATAGCAAAGCATTTTTGTAAATATGTATGGTATAAAACTGTAGTTTTATTATTTAAAATAAATACTTGCTGATTTATACAACTA +>ENSE00001797222 +ACAACATTCCCAATGCCGTCTGGGTCTGGGACATTCAGAAGCTGAGGCTGTTCGCGGTGCTCGAGCAGCTGTCCCCAGTGCGCGCATTTCAGTGGGACCCGCAGCAGCCGCGGCTGGCCATCTGCACGGGAGGCAGCAGGCTCTACCTGTGGTCCCCAGCGGGCTGCATGTCGGTGCAGGTGCCTGGGGAAG +>ENSE00001862304 +GAATCACCTTCACCAGGGACGGCCGCTACATGGCGCTGGCAGAACGGCGCGACTGCAAAGATTACGTGAGCATCTTCGTCTGCAGTGATTGGCAGCTCCTGCGGGTAAGGCGTCCCCCAGACTGGAATAAAGTTGTCCTGCTGACTGTGGAGGGATCGAGTGAAGTAGATCCTTCCAGATTCCAGGGGATCTTTGGTAGGATATGGAGCAAGGTGATGTTGTATTAACAAAGGGCAGGTGCGCTGCGAATCACTTCCAGTGGCACCCGGTTGTGTGTTCAGGAGACTTGGTGAAAAGGACGCGTGCCCAGGTGTTTTAAAAGTGAATATGCTGTCACATTTGAGCCCTTTTCCTTGTCCTGTGTGATGGTGTTTGCGCATGTGTGTGCCACGTCGGGAGTTGGGGGGACGTGGAAGTTCACCTTGACTGAGGGCCTGCATTAGGCAGGGCGCTCTGCCAGGTGCCCAGGCACAGAGGGCACTGCCCCCACAGCAGACATATGAACACGATTCCAGCACAATCCATCATTAAGGTAGAGCAACCTCTGGAATGCTGTCAGAGTGCAGAACCCGGGATCCAGGCAGTGCTCTGGAAGGGACTTGTCTGAGCTGGGTCTAAAGGAGTGAGCCTGGCCAGGCAAGGAAAGGTGAGGGGGAGAGTGTGCACATGAGTGCAGGTGCGGGGAGACCAAGCCACCTTCGGGGGCTGGCCAGGCAAGGAAAGGTGAGGGGGAGAGTGTGCACACGAGTGCAGGCGCGGGGAGACCAAGCCGCCCTCGGGGGCTGGCCAGGCAAGGAAAGGTGAGGGGGAGAGTGTGCACACGAGTGCAGGCGCGGGGAGACCAAGCCGCCCTTGGGGGCTGGCCAGGCACTGACGCTGGCATCTGTGGCGGTGCAGCCCCAGCAGCAGCTCTACAGGGATTTCATGCATTTCCAGGATAGAGCTGTTGAGATTTTGTCAATTTCTATATAAGGAAATTAAGTGCGTTAAGAACATCAGTCATAAATGCAATTATTTATTTACGAAAATATTTTCCAAATTTAATGTTTCCCCCCCTTCCTTTGGAAGCATTTTGATACGGACACCCAGGATCTCACAGGGATTGAGTGGGCCCCAAACGGCTGTGTGCTGGCAGTGTGGGACACCTGCTTGGAGGTATGAAGATGACCAGGTGACATGTTTGCTTTCGAGAGCTTTTCCCGGAATTTCATGCTTTCTGAATGCTGCAATATAGTTTGCTTTATCTTATTTCAGATAACAAGTTGAGCTTTGTTTTAAAAGACAGGGTCTTGCTCTGTCACCCAGGCTGGAGTGCAGTGGTGTGATCACGGCCCACTGCAGCCTCGACCTCCTGGACTCAAGTGATCCTCCTACCTCAGCCTCCCAAGTAGCTGGGACCACAAGCATGCACCACCACGCCCGGCTAATTTTTGTATTCTTTGTAGAGATGGGGTTTCACCGTGTTGCCCAGACTGCTCTTGAACTTCTGTGTTCAAGTGATCTGCCAGCTTCGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACAGTGCCCGGCCGAGTTGAACTTTTATCAGCGAGCCATTAGGTTGACCTCCCAATTTCCCCTTTTTCCTCATGCTCTCACTGCCTCTCCGTGACTATCTCAGTACTAGCTGGCAGTTCCAGCTTTTCCACGGCCACGCGGACAGTCCTGCCAGCTTTGTGCTATCTGCACCAATGTCACTCTGCAGCACCCGCGTCTGTGGTGTGTTCCTGGCGACGGGGGTGTATTCATTATTAACTGAAATGTCTCATCTGCAGTACAAGATTCTGCTGTACTCATTGGATGGCCGGTTGTTGTCCACGTACAGCGCTTACGAGTGGTCCCTGGGCATCAAGTCTGTGGCCTGGAGCCCCAGCAGTCAGTTCCTGGCAGTTGGGAGCTATGATGGAAAGGTGGGAACCAGTGCAGGGCACTCAGGAAGTCCGACCGCCCAGCGGGCCGGGCCCTGCCTCACCTGTGCATGGTTTCCTTCCTCAGGTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCATTAATGATCCCAAGATAGTAAGTCTGGAACACGTGTTTCTGCCTGAGCAGGCTGTTGGGGAGGGCGGTGGGAAACTGCTCCTTCACTTTGCTTTCTTGATTGTGGTTTATTATTTAACCGGGCACTTCCATCACCGTAAACTTGCTACTGTGACATTTCACGCGTCTGGCCCTGCCCTGGCCTTTGTTCTTCCTCCTCCACGCTGCCCAAAGGGTCTGAAGTGGGCCTTGCCCTGGCCTGTCCTCTGCCGCTGCCACCCCAGTCCAGTTTTCTCCTTTGTGGTCTGTCTGGATGCAGATCCCTGTGCTGTACAGAGTGGCCAGGGTCTCCTGCCCCCAAACACTGGGCATCTGCTGTCGTGCCAGGCACTGTGCTCTGGGCCGCAGCCAGAGAAGAAGAGACAGACCCCTGCACTTGCAGAGTGCGGCTGGAGAGACAGGGAAGGGGCTGGAGAGCTGGGTGTCTCCACGGGGTGGCAGGGAGTGGCCACCAGCGAGGGATCGCAGGCACAGATGCTGCACCAGTGATCAGGGACTCGGGGAGGGAGCGTTCCAGGCCAAGGGAACAGGAAATGCAAAGGCCCCGAGGAGTGGGCCACGCATCCATGTGTGCAGCGGGCACTGCGCTGGGAGCCAGAGACAAATGCTGCCCTCCTGGTGTTGACCTGTAACCGACAGAGCTGAGTGAAAGGCGGCTTGGATTCGATGAAGAGGCCAGTGAGTGGCTGGGGCTGCGCATGCCAGATCAGCCACTGCCGGGGATGCATCCTGGAGGGGTGTTTAAGTGAAGACCAGGAGGAGGAGCTGCGCGGTGTCTGGGCAGAAAGGGTGTTTCAGGCAGAGGGGCCTCCTGACGTGGCCAGTGGCTTGTGTGGCTGGAGGCCAGGGTGTCTGGACAGGTGAGCCCGAGCAGGGCTGGCCACACAGGTCCTGAAGGTTTGCCTGTGATTCCTGCATTCTCCAAATCCCTTCGCCACACAGCAGCAGAGCATGCTTTAAAGGCATGAACCAGGCCAGGTGACTCCCTTACCTGGGGCTCTTCAGGGGCGTAGGGGCTGCCCGCCTTCCACTGAGCCTGGGCCGCTGTCCTTTGCTTGCCAGGCTCTCGGGCACAGATGCCCCCACCTCGGGTCTGTGTCTGCTGCTCCCGGGGCCTCTGCTGTGTTGGTGCAAGTGTTCTCTGTATCCTCTTATCACGGAGGGAAGGCTGAGCCCACTCCCTTGCTGGATGATGGTGGCTGCAGTGGTCTCCCGTCTGTAATCACAGGGCACACATTTGCTGCCTGTGTCTCAAAGGGTGGGCTCCTCAGCAGGACACGAGAGAGGGTGGCTGGGTGATCTCAGCTCTCGGGACTGCGGGGTTCGTGCTTCCGTCTCTCCCGGTGGCAGCAGGACCAGCTGTCATGGCAGGCACACCTGTTGACCATGCGCTGTCATGGGCATTTGCCACGTCCATCCTTGGCTTCCGGGTCCCTGTCCTGAGCCGGGCGTGGCCACCTTGTGTCTTTCAGGTGGTGTATAAGGAGGCCGAGAAGAGCCCACAGCTGGGACTGGGCTGCCTCTCCTTCCCGCCGCCCCGGGCCGGGGCCGGCCCTCTCCCGAGCTCAGAGAGTAAATGTAAGTAGCACATGTGATGTCATTTGTTTTCCTTTTTTAATGCAAGATTCCTCGTTGTCCAGATAAACTTCGGATGTTCCTTATGTTTAAAAAAAAAAACTTTTTTTCCCTTCCATGCTTCCAGCCAGTGTGCCCCTCAGCCTGTTGGCTGGAGGTTGACTAGGGTCTGAATTGCGCAGTGGGCCGTGAAGGTGCGGCTTCTGTTACTGAATATGAGCCCTGGAGACCCGGATCTGACAGCGGGAGCTCCGAGGGGATGTTTTTCCGGAGCTCCGAGAATGATGTTTTTCAAAGAAACACTTTTCCGTGGGTGGCGCTCAGAGTGGGTCTGGAACCCGGCGGTGCTCCCGAGCGCTGTCTCCGGCTTGAGGCCCGGTTCTGATGCAGCCTCTTGACTCTGGGCATTTCCTATGTGTCTGTTTCCTCATCGCTGAAATGGGCATAGTAAAAGCACCCATCCCACAGGGGCATGAGGGCATCTGAAGGTTGCAGGTAGAGGAAGCGGTGCCCCAAGTGCCGACGGGCCCACCCCGGGGCTCGGTGTGTGCTCAGGATGGGGGTCAGGACAGGTGCAGCCTGGCACACAGGAGGCGCTCCCCAGGAGCCCAGGGGCGTCCTTGTTCCACAGCCCCTGCTTCTGCTGTGATGATGGTTCTTCCACAGCCGGAAAGTCTAAGGGTACTGACGCTGAGGTGGAAGGGATTGTGAACTCAGATGCTGGTAGTCGACAGAAAAGTGCTGAGGAGTTGGAGCTGCTGAGATTGCAGCTAGGACCTGTCCATGTCCCTCTCCAGTCAGCCCCTGGCACGTGGGGTCCACCCCCCACCTAGTCGGGCCTGGCAGGTGATGGTGCCACTCTCATCCGGGGCACTTGCGGGCAGGCCCCTCGCTGCGGCTGCCAGGCTTTGCTTAGCTCTTCCTGCCCTTGGGCCGCACTTTCCTCCCCTTTGAACAGAGGAGCTGGGTTCGCGATGCCCGATGCAGGCACAGCAGCCTCTCAGCCGCGTGCGTACTTCCCGAAAGGGTGACAATGGCGTGTTCTTCCTGTTGGTGTTCTAGATGAGATCGCCTCTGTCCCAGTCTCCTTACAGACACTGAAACCTGTTACCGACAGAGCAAACCCGAAAATCGGCATAGGAATGCTGGCATTTAGTCCTGACAGCTACTTCCTGGCGACAAGGAACGGTCAGTTGTGCTGACGCAGGTGCTGTCTCACCCTTTACTGTGTCCTGTGGCCCCAGGTGTAGAAGCGACTGGAAAAGAAAATGAAGTTGGGGGTTTCCGACACGTCACCTCCTTTCACGTTTCTGCAGTAGCCGAGGTGCTCACAGAAGCTCCTTGGAGGCGCTGGGCCTTTGTCCTGCAGCAGCCGCAGGTCCGCGCATGAGTCAGGAGGCCTCCACCCTGCTCACTTGCTCCACTCTGCTGAGTAGAAAGCAGGGCTGGGCACACTGCAGCCCGCCTTTTGTTAAGGGTTTCTCCATTTGTAAAGGGCTAAAAAAAAAAAAAAAA +>ENSE00003789737 +ATGAGATCGCCTCTGTCCCAGTCTCCTTACAGACACTGAAACCTGTTACCGACAGAGCAAACCCGAAAATCGGCATAGGAATGCTGGCATTTAGTCCTGACAGCTACTTCCTGGCGACAAGGAACG +>ENSE00001852362 +GTGGTGTATAAGGAGGCCGAGAAGAGCCCACAGCTGGGACTGGGCTGCCTCTCCTTCCCGCCGCCCCGGGCCGGGGCCGGCCCTCTCCCGAGCTCAGAGAGTAAATGTAAGTAGCACATGTGATGTCATTTGTTTTCCTTTTTTAATGCAAGATTCCTCGTTGTCCAGATAAACTTCGGATGTTCCTTATGTTTAAAAAAAAAAACTTTTTTTCCCTTCCATGCTTCCAGCCAGTGTGCCCCTCAGCCTGTTGGCTGGAGGTTGACTAGGGTCTGAATTGCGCAGTGGGCCGTGAAGGTGCGGCTTCTGTTACTGAATATGAGCCCTGGAGACCCGGATCTGACAGCGGGAGCTCCGAGGGGATGTTTTTCCGGAGCTCCGAGAATGATGTTTTTCAAAGAAACACTTTTCCGTGGGTGGCGCTCAGAGTGGGTCTGGAACCCGGCGGTGCTCCCGAGCGCTGTCTCCGGCTTGAGGCCCGGTTCTGATGCAGCCTCTTGACTCTGGGCATTTCCTATGTGTCTGTTTCCTCATCGCTGAAATGGGCATAGTAAAAGCACCCATCCCACAGGGGCATGAGGGCATCTGAAGGTTGCAGGTAGAGGAAGCGGTGCCCCAAGTGCCGACGGGCCCACCCCGGGGCTCGGTGTGTGCTCAGGATGGGGGTCAGGACAGGTGCAGCCTGGCACACAGGAGGCGCTCCCCAGGAGCCCAGGGGCGTCCTTGTTCCACAGCCCC +>ENSE00001924010 +GTGGTGTATAAGGAGGCCGAGAAGAGCCCACAGCTGGGACTGGGCTGCCTCTCCTTCCCGCCGCCCCGGGCCGGGGCCGGCCCTCTCCCGAGCTCAGAGAGTAAATGTAAGTAGCACATGTGATGTCATTTGTTTTCCTTTTTTAATGCAAGATTCCTCGTTGTCCAGATAAACTTCGGATGTTCCTTATGTTT +>ENSE00001659258 +GTGGTGTATAAGGAGGCCGAGAAGAGCCCACAGCTGGGACTGGGCTGCCTCTCCTTCCCGCCGCCCCGGGCCGGGGCCGGCCCTCTCCCGAGCTCAGAGAGTAAAT +>ENSE00001813324 +GTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCATTAATGATCCCAAGATAGTAAGTCTGGAACACGTGTTTCTGCCTGAGCAGGCTGTTGGGGAGGGCGGTGGGAAACTGCTCCTTCACTTTGCTTTCTTG +>ENSE00003685083 +GTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCATTAATGATCCCAAGATA +>ENSE00003653006 +GTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCATTAATGATCCCAAGATA +>ENSE00001866903 +GTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCA +>ENSE00003492457 +TACAAGATTCTGCTGTACTCATTGGATGGCCGGTTGTTGTCCACGTACAGCGCTTACGAGTGGTCCCTGGGCATCAAGTCTGTGGCCTGGAGCCCCAGCAGTCAGTTCCTGGCAGTTGGGAGCTATGATGGAAAG +>ENSE00001896684 +CCAGCTTTTCCACGGCCACGCGGACAGTCCTGCCAGCTTTGTGCTATCTGCACCAATGTCACTCTGCAGCACCCGCGTCTGTGGTGTGTTCCTGGCGACGGGGGTGTATTCATTATTAACTGAAATGTCTCATCTGCAGTACAAGATTCTGCTGTACTCATTGGATGGCCGGTTGTTGTCCACGTACAGCGCTTACGAGTGGTCCCTGGGCATCAAGTCTGTGGCCTGGAGCCCCAGCAGTCAGTTCCTGGCAGTTGGGAGCTATGATGGAAAG +>ENSE00003669982 +TACAAGATTCTGCTGTACTCATTGGATGGCCGGTTGTTGTCCACGTACAGCGCTTACGAGTGGTCCCTGGGCATCAAGTCTGTGGCCTGGAGCCCCAGCAGTCAGTTCCTGGCAGTTGGGAGCTATGATGGAAAG +>ENSE00001839399 +AGTACTAGCTGGCAGTTCCAGCTTTTCCACGGCCACGCGGACAGTCCTGCCAGCTTTGTGCTATCTGCACCAATGTCACTCTGCAGCACCCGCGTCTGTGGTGTGTTCCTGGCGACGGGGGTGTATTCATTATTAACTGAAATGTCTCATCTGCAGTACAAGATTCTGCTGTACTCATTGGATGGCCGGTTGTTGTCCACGTACAGCGCTTACGAGTGGTCCCTGGGCATCAAGTCTGTGGCCTGGAGCCCCAGCAGTCAGTTCCTGGCAGTTGGGAGCTATGATGGAAAG +>ENSE00003387437 +TACAAGATTCTGCTGTACTCATT +>ENSE00003480267 +CATTTTGATACGGACACCCAGGATCTCACAGGGATTGAGTGGGCCCCAAACGGCTGTGTGCTGGCAGTGTGGGACACCTGCTTGGAG +>ENSE00003485438 +CATTTTGATACGGACACCCAGGATCTCACAGGGATTGAGTGGGCCCCAAACGGCTGTGTGCTGGCAGTGTGGGACACCTGCTTGGAG +>ENSE00001857368 +GAACGGCGCGACTGCAAAGATTACGTGAGCATCTTCGTCTGCAGTGATTGGCAGCTCCTGCGG +>ENSE00000734306 +GAATCACCTTCACCAGGGACGGCCGCTACATGGCGCTGGCAGAACGGCGCGACTGCAAAGATTACGTGAGCATCTTCGTCTGCAGTGATTGGCAGCTCCTGCGG +>ENSE00000734303 +CTGCGGATAACCGTCTGGTCCTTGTGCACAAAATCCGTGTCTTACATCAAATACCCGAAAGCTTGTCTGCAGG +>ENSE00001854631 +GTGGGAAGCAAGATGATTCCCTGGTAGGCTCCACGGGGTCTCAGTGGGAAATGCAGGTGGAGGGACACAGCAGCCCTGGAAGTCCCGCGGCGCTGCCACGGGGAGGGCTGGACCACCCACTGCGGTGCCTCTCCCTCAGCAGGCACGCCCTCGTCGGCCTGGTTAGAAAATCATCTTTTGGCCTCACTGTGCCAGCCTAGTCAGCTCTCAGCTCCCTGAGTCAGGGAAAGGGGTGGAAAAGTGGACAGTCCAGCAGCGCATGTTCTAGAACCCTCTGCAGATGCAGCCAGGCCAGCGAGCACACGCAGGAGGCAGACGGACACCTTCTTGGGTGTTGAGTGGCTGCTCCTGCCTCAGGGCTGCAGATGCAGGCTCACAGCCCCCTGGTGAGTCCCGGAGTGGCTGCATCCAATCTCCAGATCCTCTGTCTTCCCATAAAGGAGACTGAACCCGTGGTGGTTTCTAGATCAAGATTTTTCTCTGAGTAACTCAGGGTTATTATAACATGCAACCTATGGTCACTTTGAAAAAGCTAATGAAAAAGCACTTGGATTTAACTTTGTGTCACTCAATTTTGGTATAAAACAACAACAACAGAAAACCAAGAACACCAAATTTACCGTAACCACAGTAAAATACGCATTTGAATATTCCGGTAGGAGGGCAGGCATCCCCCAGGTCCTGATAGATCCACTCCAGCAGTCAGGCCTGTGCTTGGGGACGCGTGGGCGGGTTGAGGATTGAGACGGTCTCTGATGATGCTAAAGAAGTGTTTCCTTTCTCTTTCCCCTTTCCCCCAACAGCTGCGGATAACCGTCTGGTCCTTGTGCACAAAATCCGTGTCTTACATCAAATACCCGAAAGCTTGTCTGCAGG +>ENSE00000734299 +GTCTGGTCTTTAGAGCAGCCCGAATGGCACTGCAAAATAGACGAGGGCTCAGCCGGGCTGGTGGCCTCGTGCTGGAGCCCGGACGGGCGCCACATTCTCAACACCACGGAATTCCAT +>ENSE00001931622 +GCTTCCTGTGTCCAGTACCGGTTAGTGGTCCGGGATGTGAACACCCTTCAGATCCTTCAGCTGTACACGTGCCTAGACCAGATCCAGCACATCGAGTGGTCGGCAGACTCGCTCTTCATCCTGTGCGCCATGTACAAGCGAGGGCTGGTGCAGGTGTGTGCTGCCGTGTCGCTTAGAATCTGGACACCTTCTGAGGGCCCCTGGGAAGGAGGGGTTTTGTTCTGTGCCTTTCTAGTTTGAAAAAAAAGTCCGTGCAGCTCAAAGCCAGTTTTCTTTTGAAATTATAACGTTCTCTAAAGTTTAAGAACATTTAAA +>ENSE00003566716 +GCTTCCTGTGTCCAGTACCGGTTAGTGGTCCGGGATGTGAACACCCTTCAGATCCTTCAGCTGTACACGTGCCTAGACCAGATCCAGCACATCGAGTGGTCGGCAGACTCGCTCTTCATCCTGTGCGCCATGTACAAGCGAGGGCTGGTGCAG +>ENSE00003677298 +GCTTCCTGTGTCCAGTACCGGTTAGTGGTCCGGGATGTGAACACCCTTCAGATCCTTCAGCTGTACACGTGCCTAGACCAGATCCAGCACATCGAGTGGTCGGCAGACTCGCTCTTCATCCTGTGCGCCATGTACAAGCGAGGGCTGGTGCAG +>ENSE00001870155 +GCGCCCAGGGGTCCCGCGGGTTTTCGGGCGCAGGGTGGCGCCCGCGGCAGGCGGCGGCCATGAACTTCTCCGAGGTATTCAAGCTCTCCAGCTTACTCTGCAAGTTCTCCCCGGACGGCAAGTACCTG +>ENSE00001477063 +GCTGCGCGCCCAGGGGTCCCGCGGGTTTTCGGGCGCAGGGTGGCGCCCGCGGCAGGCGGCGGCCATGAACTTCTCCGAGGTATTCAAGCTCTCCAGCTTACTCTGCAAGTTCTCCCCGGACGGCAAGTACCTG +>ENSE00001680820 +GGGTGGCGCCCGCGGCAGGCGGCGGCCATGAACTTCTCCGAGGTATTCAAGCTCTCCAGCTTACTCTGCAAGTTCTCCCCGGACGGCAAGTACCTG +>ENSE00001748742 +GTTGCAGCCTGCTGCGCGCCCAGGGGTCCCGCGGGTTTTCGGGCGCAGGGTGGCGCCCGCGGCAGGCGGCGGCCATGAACTTCTCCGAGGTATTCAAGCTCTCCAGCTTACTCTGCAAGTTCTCCCCGGACGGCAAGTACCTG +>ENSE00001836154 +TGCGCGCCCAGGGGTCCCGCGGGTTTTCGGGCGCAGGGTGGCGCCCGCGGCAGGCGGCGGCCATGAACTTCTCCGAGGTATTCAAGCTCTCCAGCTTACTCTGCAAGTTCTCCCCGGACGGCAAGTACCTG +>ENSE00001858739 +TCCCCGATCGCTCTCCCCTCACCTCCCAGCTTCGGAGCTGCGAGCCCAG +>ENSE00001475277 +GATGCTTCTGGCTGGCACACCTGGCTTCCCCTCCATGCTCAGAACTGCTTCCTACTCTACATCCAGGCTCCTGAGCAGCCCCCAGCTTAAGCTTCAGCAGCTCCAGGGTAAATCCATCTCCGCCCAGAGCTGACTCCGGATCTGCCCCAGTGACAATAACAAGATAAATGCCTTCCATTCTCTTCGTACTTACAGGATGTAATCCACATATTTACACAGTGTTTCATTTGCGGTAATGTTTGTTTTGTTTCTTGTTCCTTCGTACCTATCTGGGAAGCCTGTGCAATTCAGATGTCCAGGCCCACTTCCAGAAGTTCTCATTCCCTGTGCTTGAGTCAATGGCCGCAGACCATACACCTGAGAGCAAGTTAATCTGCTCTAACAAAGATATCACATCTAAGAATGGTGGTTGGCAGGGGCTGGGGGGTGGGAAGAATGGGGAGTTGGTGCTTCATGGGTACAGAGATTCAGTTTTGCAAGAGGAAAAGAGCTCTGGAGATGGATGCTGCTGATGGCTACACCGCAATGTGAATGTGCATGATGCTTAAATATGGTTAAGATGGGCCGGGCGCGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCCGAGGCGGGCAGATCACGAGGTCAGGAGATCGAGACCATCTTGGCTAACACGGTGAAACCCCATCTCTACTATAAATACAAAAAATTAGCCGGGCGTGGGGGCGGGCACCTGTGGTCCCAGCTACTCGGGAGGCTGAGGCAGGAGAATGGCATGAACCTGGGAGGTGGAGCTTGCAGTGAGCCGAGATCACGCCACTGCACTCCAGGCTGGGCGACAGAGCGAGACTCCGTCTCAAAAAAAAAAAAAAAAAAAAAA +>ENSE00001475269 +GATGCTTCTGGCTGGCACACCTGGCTTCCCCTCCATGCTCAGAACTGCTTCCTACTCTACATCCAGGCTCCTGAGCAGCCCCCAGCTTAAGCTTCAGCAGCTCCAGGGTAAATCCATCTCCGCCCAGAGCTGACTCCGGATCTGCCCCAGTGACAATAACAAGATAAATGCCTTCCATTCTCTTCGTACTTACAGGATGTAATCCACATATTTACACAGTGTTTCATTTGCGGTAATGTTTGTTTTGTTTCTTGTTCCTTCGTACCTATCTGGGAAGCCTGTG +>ENSE00001890428 +GATGCTTCTGGCTGGCACACCTGGCTTCCCCTCCATGCTCAGAACTGCTTCCTACTCTACATCCAGGCTCCTGAGCAGCCCCCAGCTTAAGCTTCAGCAGCTCCAGGGTAAATCCATCTCCGCCCAGAGCTGACTCCGGATCTGCCCCAGTGACAATAACAAGATAAATGCCTTCCATTCTCTTCGTACTTACAGGATGTAATCCACATATTTACACAGTGTTTCATTTGCGG +>ENSE00001475263 +TGCCTTGCGACAGCTACCGCGAGGGCTACAGCGCCTGTGTGGCGCGCCTGGCCCGCGTGCTGCCCGCCTGCCGTGTCCTGGAGCCCGCCGTGAGCGCGCGCCTGCTGGAGCACCTGTGGCGGAGAGCGGCCAGCGCCACCCTGGACGGCGGGCGCGCTGGGGATTCCAGTGGCCCGTCTGCCCCCGCCCCAGCGCCCGCGTCTGCCCCAGAGCCCGCATCCGCTCCGGTGCCCTCGCCGCCCTCGCCTCCCTGCGGCCCTGGCCTCTGGCGGCCGTGGTAGCCCCTCGGCCGATCCACAGACCCTGCCGACTGCTTGGGACCTTGGGGCACTGGACAGGTTGAAGCTCTTGGTGGCGGCTGCTGTTCCCATCATTAGGGGCCAGCCCAGTACCCACACCCAGGCCGGAAGCCGGCTGTTTGTGACTGGCGTGGCAGACTGAAAGCCCTGGGGCTGGGGCTCGGCTCAGGGAATAAAAGGAGCGTCCCTGCTTCACCCCCAACTTGGCTGGAGAAGAAAGGACAAGAGGCAGCAGGGTGAAGAAGAAGCCCCCCATCCCAGCTGGTGGAGATAGTTCTGGAACTGGACCCCGCAGCTGCGTGGGCAGCCGACACACCCACCCCAGCACTGGCACCAGACCAGAGCCAGAGCCAGGACCTGGGCAAAGTGCAGCCGTGCACCCTGCCTGGTCACTGCTCTCCCAGCCCTGCCTGGGCCTACCTCCTGCCCAGCTCTGCTTGGGACCCTCTGGGCATGCAGCAGCAGTAGCCTAAGGGCTCTGGTCACTTCCAGGGCTCTACAGGGCAGCAGAGCAGAGCAAAAGGGTGCATATGCTGGGAGCTGTCACCTCCACTCCTAGGCTTTTCTGCCTAGAGCAGAATTATAGGGGCAGTATACATCCAGGGGTCTGTGCGGTGGGGCTGGGGGATTCCTTAAGTGACTTTGGGAAGGATTTGTTTTCCCGAGCATCAATTTCACACCTGGGCATTGCACCCCAGGCTATGCAGTCTTTCAGTGTGAGGAAGGGGCAGAACAAGAATGAGGCGGCCCCGTGGCCTCAAGGAAGCTTGTGGCTTTGGAGGATCTGACTCCAGCAGAGTCTGTGCCAATGTGGGGTGAGCAGGGCCCCTGCCATGGAGCAGCAGGAATTTGAGGGATGGAGCAGGTTAAAGAATGGGAAACATCTTCACTTGTTTTTTTTTCTTGCAAACTACTCCCTGCTACTCATTGAGACTGGTTACTGGAAGCAACTTGTTAAGATTTTTCTTTCTGGGCGGGCGCGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCCAAGGCGGGTGGATCACCTGAGGTCAGGAGTTCGAGACCAGCTTAGCCAATATGGTGAAACCCCGTCTCTACTAAAAATACAAAAATTAGCCGGGTGTGGTGGCATGTGCCAGCTACTCGGGAGGCTGAGGCAAGAGAATCACTTGAACCTCGGAGGCTGAAGTTGCAGTGAGCCAAGATTGAGCCATTGCTCTCCAGCCTGGGTGACACAGCAAGACTCTGTCTCAAAAAAAATTTTTTATTTCTTTCTTTTCCATGGAGGCCTAGAGTCCCTGTGAAGGCTAGGAAGGGGCTGCTGATCCCAGGAGTGCCCACGAGGAGTGGGGGGCACTGTTGGCCCATAATCAGGCAAACACCCATCATTTCATGGGGGATTCATGAAATCATAGTCAGGCAAACACCCGTCATTTCATGGCTAAGCATTTGCAGAAGGTGGAGGATTCTCCCCCGAGTCCCCAAATCAGCAGCCTGTGCTAGGGACCAGAGCACCGGGGGCAAGAAGACAGAACCAATGTGGGAGTGGGGATGGTCACTAAATCTGACTGTGCCACACAAGCCCATGATGACCTTGGCACTGGTTTGGGTGGCAGGATATGAAGGAAGCTGTAGGCATTATTGAAAAAATCATTGTTCAGCCAACAGGGTGAGGCTCCCAGCAAGGCCGTGCCATCTTCCCACCTCCCTGTGCCCAGAGGGTTAGACTGTAAGCTCCCGGAGGGCGAGGCTGGGGCTGAGCGTGCCTCCACGTCCCCAAGGCACAGGGTGCACAGTGGGTGCTCACTGAATATAGTGGACTAGTGAGCAGAGGATGAGAGGACTACCCTGTAATGAGCCTTGGACAGTCTGGCATTTGCCTTAACTCCCACTCCCATGCCCTGGGATCACTGTTGGATATTTACTCCATGAGGACAAATACTGGGGAGGTGTGGAGAGGAGGGAGGGCAGGTTCCTCTTACTTTCACCCATTGCTGAGAATGAGCGCCTGTTGGCACTGCCTTTGTGAGCCTCCGGGAGCAGGTAACCTGCGGCCCAAGCCCGCCTAGGACTCCACATCAGGCAGGCACAGGACTGGCCCCTTGTCCTCATAAAAACTCTCAGTACAGCTTAAACTCTGTAAGATCTAACCAGCCAGGAGGACCCTCGCTTCCTCTCCGCCATGCTTGCCACCTCTTGCTTCTGAGAGTCCATCTCAGTTCGCAGTTCTGTGACTTGCATTGACCTGGCTCCAATCAAGCTACAACTCAAGCAGTCACGGGGAGAAGGATTGTAGATGGGCCAGTGACTCACAGGGTCAGGCACTCGGGGGAGCCTGAGTCAGGAGGTCAGTGGGCCCTGGAAGGGAGGGGGCAAGCCTGGGTGGGTAAGGTTCTGGGCCCCAGGCAAGAAGGCAGAGTTTCTCCGCAGGGGTGTGTGCAAGAGCTAGCTGCGCAGAAGGTCTCCGCTGGCTCTCCAAGCCGGGCTTGTGAAATAGGAACGCCAACATCCTCCTCCACAGGCAGTGGCAGGCACCTCCTCCTCAGGTGCCCCCCAAGCCCTATCTGATGGGCAAAGGTGAACGCAGGGCGGTGGGCTTTTCCTGTGCAGAGGGAGACTGATTCAAAGGGTCATTTATGACCTTTCACAAGTCCCACATCCTGCCCAATGGCCAGGTCTTGGGATGCTGTTGCAAGATGGTTCTGTGACTCCATGTGACTGTCTGATGATTGCCCCAGCTGGGGAAAAGGCTCCCATGTCTCTTTCTCATAAAACCAGTGGGCAAGGCCGGGCGCAGTGGCTCACGTCTGTAATGCCAGCACTTCGGGAGACCAAGGTGGGCGGATCACCTGAGGTCAGGAGTTCAAGACCAGCCTGACCAACATGGTGAAACCCCGTCTCTACAAAAATATGGAAATTAGCTGGGCATGACGGCGGGTGCCTGTAACCCCAGCTACTTGGGAGGCTGAGGAGGGATAATCAGTTGAACCCAGGAGGTGGAGGTTGCAGTGAGCCGAGATCGCGCCACTGCACTCCAGCCTGGGTGACAGAGCAAGACTCCATCTCAAAAACAAACAAACAAAAAACTAGCGGGTGAAATGATTCAGTGACCTAAGGACAGCCAGAGCACTAAGCTGCTGGGAACCCATCTGTGCTGAAATGTAGATTTCCCAGGAAACTCAGGCTTGGGACAGGCGCCTACCTGCTCCTCGGGCACCAGGTGATTAGGAGAGGTCGAATCTCATTTCCACGTGAGTGAGGATAAAGACTGGGCTGCCAAGGAGGACTCCTCATAAACATTGACAAATTGCTCTGCCCCGCCTGTGATCCCAGACGACTCCTGCAGTCTGGGATCCTGAGTGTCCTGTGGGTTCATCTCGGATGGGCGCTGCATAAACAGCCTGCAGGGAACGTCTGGGAGAACCAGCTTCACAACAGATATAATAAGGAAGAAGTTTGAAATATTGCAAGAATTGCGAAAGTGTGACACACAGATACAAAGTGGGCACATGCTCGTGGGAAAATGTTGCCAATAGACTTGCTTGACTCTGGAGTTACCCCGAACCTTCAATTTGTTTAAAAAAAAAAAAAGGCAATATCTTGACGTGCAATAAAGTGAACTGCAATAAAA +>ENSE00001948071 +TGACTTGCATTGACCTGGCTCCAATCAAGCTACAACTCAAGCAGTCACGGGGAGAAGGATTGTAGATGGGCCAGTGACTCACAGGGTCAGGCACTCGGGGGAGCCTGAGTCAGGAG +>ENSE00001854189 +TGCCTTGCGACAGCTACCGCGAGGGCTACAGCGCCTGTGTGGCGCGCCTGGCCCGCGTGCTGCCCGCCTGCCGTGTCCTGGAGCCCGCCGTGAGCGCGCGCCTGCTGGAGCACCTGTGGCGGAGAGCGGCCAGCGCCACCCTGGACGGCGGGCGCGCTGGGGATTCCAGTGGCCCGTCTGCCCCCGCCCCAGCGCCCGCGTCTGCCCCAGAGCCCGCATCCGCTCCGGTGCCCTCGCCGCCCTCGCCTCCCTGCGGCCCTGGCCTCTGGCGGCCGTGGTAGCCCCTCGGCCGATCCACAGACCCTGCCGACTGCTTGGGACCTTGGGGCACTGGACAGGTTGAAGCTCTTGGTGGCGGCTGCTGTTCCCATCATTAGGGGCCAGCCCAGTACCCACACCCAGGCCGGAAGCCGGCTGTTTGTGACTGGCGTGGCAGACTGAAAGCCCTGGGGCTGGGGCTCGGCTCAGGGAATAAAAGGAGCGTCCCTGCTTCACCCCCAACTTGGCTGGAGAAGAAAGGACAAGAGGCAGCAGGGTGAAGAAGAAGCCCCCCATCCCAGCTGGTGGAGATAGTTCTGGAACTGGACCCCGCAGCTGCGTGGGCAGCCGACACACCCACCCCAGCACTGGCACCAGACCAGAGCCAGAGCCAGGACCTGGGCAAAGTGCAGCCGTGCACCCTGCCTGGTCACTGCTCTCCCAGCCCTGCCTGGGCCTACCTCCTGCCCAGCTCTGCTTGG +>ENSE00001914446 +AACTCCAACTGCTCGAAGCTAGAGAAGGCAGACGTCCTGGAAATGACCGTGCGCTTCCTGCAGGAGCTGCCTGCGTCCTCATGGCCCACGGCAGCGCCCCGTGAGTGAGCCCTCCCTGCCCTGCCGCGCGCTCTGCACCCCGCACCCGGCACCCTACCCCGCGCCTCACGCGGCTCTCCGCCCGCAGTGCCTTGCGACAGCTACCGCGAGGGCTACAGCGCCTGTGTGGCGCGCCTGGCCCGCGTGCTGCCCGCCTGCCGTGTCCTGGAGCCCGCCGTGAGCGCGCGCCTGCTGGAGCACCTGTGGCGGAGAGCGGCCAGCGCCACCCTGGACGGCGGGCGCGCTGGGGATTCCAGTGGCCCGTCTGCCCCCGCCCCAGCGCCCGCGTCTGCCCCAGAGCCCGCATCCGCTCCGGTGCCCTCGCCGCCCTCGCCTCCCTGCGGCCCTGGCCTCTGGCGGCCGTGGTAGCCCCTCGGCCGATCCACAGACCCT +>ENSE00000734533 +AACTCCAACTGCTCGAAGCTAGAGAAGGCAGACGTCCTGGAAATGACCGTGCGCTTCCTGCAGGAGCTGCCTGCGTCCTCATGGCCCACGGCAGCGCCCC +>ENSE00002817476 +AGCCTGAAGCCGCTGCTGGAGAAGCGCCGGCGCGCGCGCATCAACCAGAGCCTGAGCCAGCTTAAGGGGCTCATCCTGCCGCTGCTGGGCCGGGAG +>ENSE00001916716 +CCAGCCCGGGCCGCGCCCGGGACCTCATTTCGGACCTCGGTTTCCCTTTGCGTGGGGCTCGCAGCTGCCACCGCTTCCCCGCGGAGCATGGGGCTGCCTCGCCGGGCAGGGGACGCGGCGGAGCTGCGCAAG +>ENSE00001475267 +ACTCGTCTGGCACCAGCCCGGGCCGCGCCCGGGACCTCATTTCGGACCTCGGTTTCCCTTTGCGTGGGGCTCGCAGCTGCCACCGCTTCCCCGCGGAGCATGGGGCTGCCTCGCCGGGCAGGGGACGCGGCGGAGCTGCGCAAG +>ENSE00001475271 +CCCGGGCCGCGCCCGGGACCTCATTTCGGACCTCGGTTTCCCTTTGCGTGGGGCTCGCAGCTGCCACCGCTTCCCCGCGGAGCATGGGGCTGCCTCGCCGGGCAGGGGACGCGGCGGAGCTGCGCAAG +>ENSE00001835288 +TCGTCTGGCACCAGCCCGGGCCGCGCCCGGGACCTCATTTCGGACCTCGGTTTCCCTTTGCGTGGGGCTCGCAGCTGCCACCGCTTCCCCGCGGAGCATGGGGCTGCCTCGCCGGGCAGGGGACGCGGCGGAGCTGCGCAAG +>ENSE00001475281 +CTGCCACCGCTTCCCCGCGGAGCATGGGGCTGCCTCGCCGGGCAGGGGACGCGGCGGAGCTGCGCAAG +>ENSE00001150483 +CGCGGGGACACTCGTGCGACTGGGGCAAGGTGCCCAGGGGCTTCTCTCCTAATTTGCCTCACGTAACAGTTGAGACCCCAGAGGGCAGCAAAACTGGGTTCGAATTGGAGAGCCGTCCAGGCACAGACAAATTCATTCATCTGCCCAGTGCCCGCTAACTGCGGTTCCAGGCGCCGGCGACGCAATTCCAGAG +>ENSE00003790229 +GTGCTGGGGAGAGGCAGGACAGGCCTGTCCCCCGAGTCCCCTCCGGATGCCGTGGACCGGCCAGCTGTGAGTGTTTCTTTGGCAGTGTCTTAGCTGGTTGTTGTGAGCAATAGTAAGGAAGCAATCAGCAAGTATACTGCCCTAGAAGTGCTGCACGTTGTGGGGCCCAAGAGGGAAGATGAAGCGAGAGATGCCCAGACCAGTGGGAGACGCCAGGACTTCGGAAGCTCTTCTGCGCCACGGTGGGTGGTGAGGGCGGCTGGGAAAGTGAGCTCCAGGGCCCCAGGAGCAGCCTGCTCGTGGGTGCGGAAGGAAAAAGGCACAGGGGCTTGGTGTGGGCGGCTTTTGGCTGGGAGAAGTTTGCACGTAGGGAGAATAGTAGCCAGTGTTTGCAGAGCACTTACTATGCAGGAAGGCCTGTCCTAAGTATTGTAAGTGTATTACATCATGTACAAGTGTCTGTGATTAACCCCGTCTTGCAGAGAAGGAAACAAAAGTACAAACAGAAAATGTAACTAAGCATGCAATTAATAAAAAGGGACCAGGTTTTGAACGCGAGCAATCTGGCTCAAGAATCTGCGCCCAACCACCGGCTCCTGTTCTTAGAGATGAACGTGGAGTCCTGGAGACTGCTCAACATTGTGACTTGACTGTGAGCGTACGCGCTCCCTGTCCCCAGGAGACAGATTTCCAGTGCAATCATAGAAAGTGCCTGTGTGGGCTTCGGGAGATGTGTCTGCCTTGGGGAGAATTTTCCTTTTCAGCTAGAGCCAGGCCCAGGATGTTGACGTCAGTGAGACGCTGGTGACGTTCTCTGCTCCAGTGGCTGATGAGAAAAGTTCCTCCAAGCCAGCTCAGTTGAGAAGAATTAAGTTCTCTGGGTCCCACTGGCTTCACCTACAGATGCCAACTTTGAGGCCAGTGAACTGTGAGGCCAGCTGGGCTGATTGCCATGGCAACAGGAATTGGACCAAAGTCACCGGAGGATGGAGAGGGAAGACACAGTGGTGGCTTCCCCAGGTCTTGGACCACAAGGCACAGCCGTGGCCTCCAGGAACCCTGAGATAACCCGTTAGTGGGTCCTGCACTCCAACAGAGCTCATGCAATCAGCCTCTGGTCCTCACCCTCCTCCCATTGGTGTCGTTGTGCTCTCTAACATTGACATTGAGCAGTGAGTGCTCCAGATCTTGTTCCACTGATTTTTTCCACTGTTCTCCAGTCTAGCACTTTCTGAAATTCATCCAAGCCTAAGAGGTGACGCCAAACGTAAGTGTCTTACACCTCGGACCCCATGGACTAAGACAAGCCTCTGGGGTCCATGTGGCACCAAGGATGGGGCCTTCTAGTACCTTTCACACAGGCCAGGGACAGCACCTGCTGCGACCCCCACCCCCAGCCTCTGCTGCTTCTCCCGTTGCCCTTCCAGCCACTGCCCTGGGCACCTCCCCTGCTCCCGCCTCCCTGCCTGGGCCCATCTTTCTTTGCACCTCACCAATTGCGGGGCTTCCTAGTGCTGGAGGGGAAGGGAGCCTGCTTCCATTCTCACCACTCTGAAAGAAGACCCTGCAGAGAGGTTTTCTGGAATTTGGAGCCTAACCTTGGCCTTGACACAGTCCAGATGAGAAGGCCGTCCCCCAGTTAAGCCAGCCCTCCCTCCCTCTCAATGCTGGAGAGGAAACCAGGCAGCTGGTTGCTTCAGCAAACCCCCTCCCTATGGGAATTGTCCTTTTCTTCCTCAAATAGACTGGAGTGCAGAGGACTTGCTTCAGAGAGAGCCCCTTTGTAACGCACATTGCACGGGCCGTGCCCCATGCCCACTCTGCCACAAACTCCCCTCAGCTGCCCAGCCCCGTGGAGCCAGGCGTGGGCTGAAGTGGGGCCAATGAAATGCCTGGAATGCCAGCCGCAGTGACAGGCCAGCACTCAGATGCCTCTCGGGAGTTCTGACCGAAGCAGCACTGAGGACTGCTTCAGAGCAGAAGTCTACGCCATTTTCCCCAGTTCTAGGCAGAAGTAAAGAATGTCTCTACCTTCTCCCAACCAGCAATTGATTCAGAGTCCTGAGCTTTTAAATTAAAGGGACCCCTCTGTTGCTTTATGCAGTAGCCAGCTTATTCATTTGAGTTCAGGTGAAATCATTTTCAAGTAACCTCTTCCTATCCAGCTTTACTTTTAGTTATGCTGACATAAAAACAATAAAAATTGTCCTCCTCAGAGTTCACCTGTAAAAGTTCCTGGATAATTAGTAAGGAAACAGAAAGAGCAGATAGTTGTTGCTTCAGATAAAAGTGATGTCTGGGTTGGGCACGGTGGCGCATGCCTGTAATCCCAGCACTTGGGGAGGCCCAGGTGGATGGATCCCTTGAGCTCAGGAGTTTCAGACCAGCCTGGGCAACATCTCTACAAAAAATACAAAAATTAGCCAGGCATAGTGGCAGGACTGTAGTCCCAGCTACTCAGGAGGCTGAGGTCAGGGGATGGCTTGAGCCCAGGAGGCACAGATTGAAGTGAGCTGAGATTGCGCCACTGTATTCCAGCCTAGGTGACAGAGCCAGACCCTGTCTCAAATTAAAAAAAACTCTTTGTGGTCATTTAATTTACTTCTGCATTCTTTTTTTTTTTTTTTTGAAATGGGCAGTGGTACCATCTCAGCTCACTGCAACCTCTGCCTTGGGGGTTCAAGTGATTCTCCTGCCTCAGCCTCCCGAGTAGCTGGGATTACAGGCACCCGCCACCACGCCCAGCTAATTTTTGTATTTTTAGTAGAGACGGGGCTTTGCCATGTTGACCAGGCTGGACTCAAACTCCTGACCTCAGGTGATCCGCCCACCTCGGCCTCCCAAAGCACTGGGATTACAGGAATGAGCCACTGCACTCGGCCTACTTCTGCATTCCTTAGAGTACATCCTAGCTAGGATATATTCACTTGTCTTTAGAGCTAACAGCAGAAGAAAGGTACCTAGATGCTTATCTAGCTCTTTATCTTTCTAGAAATTCTAGAAGATGAGAGGGGCAGTGGTGGCTCCAAGGGAGTGATTTTAGGATGGACTGGGACAGAGAGGGGCTGCTTACACATACTCACACAGAGGCCATTAATTTAGGGAGTTCAAGGTCCAGGAGGTTGACGGCATCTAGGCCTGTGGCAGAGTGCACTCCTGCTTTGGGGAATGTATGGGCAGCTTCTTGCCTGTAGTTGGAGGGTTAGAGAGAGGGATCAATAATTTCATGGTTGGACTTGAGTTTGGAGCGAGTGGAGTTAGATACAAATTCTATGTTTTTGGAGAAAGTATTTGATCTTCTTGGCTGTGAGGCAAAGCGAGGTTTAAAAATATTTTTCACTTAAAAATATATATATATGCATGTATATTTAATACTGTCTATGGATTGTGCCAATATCTATTTCATGGTTTTGATATTGTGTAGTTATACAAGGAGTTACCACTGAACGAAACTGGGGGAAGGGTACACAGAATCTCTGTACTTTTTTTGTTGTTGTTGCAATTTCCTGTAAATCTATGATTATTTTAAAATAAAAAAGTTAAAGCATACGTATTTACATTTGATTAAATGCAGTGTGATATCCTGGGTTGGATTTTGGAACAAAACAAGGCATGAGTGAAAAAACTGGTAAAATCCAAAAAAGCCTTTAGTTAAAAGTAATACCAGTGTTAATTTCTTAGTTTTGACAAATGTGCCATGGCTGTGTAAGATGCAAATGTTAGAGGAAACTGGGCGAAGAATTTGAGGGAACTCTCTGTACTATTCTTTGCAGCTTTTCTGTAAATCTACAATTATTCCAAAATAAAAGTCTATTAAAAATGTAA +>ENSE00001500136 +GGCCAGCTGTGAGTGTTTCTTTGGCAGTGTCTTAGCTGGTTGTTGTGAGCAATAGTAAGGAAGCAATCAGCAAGTATACTGCCCTAGAAGTGCTGCACGTTGTGGGGCCC +>ENSE00003787977 +GACCCCTCCCCCGCACCGACGTGATTCGGATCGCGCGGTGCTGGCGCCGCCTTCATGCGCCCTGCCTGGCCCCCACCTGGTCCTCTTTCCTTTTCAGGTGGAGGAGATGCCGCTGTCCCGTCGGTCTGGGGACAGCCCAGCTCCCCGGATCCCGGGCTGGAGAGACGCGTCGCGGCCCCGGGGCCTGGTGGCACGAGCAGGAAGGAGGACCCGGCGGCGGGCTCTGCCTGGGCTTGCCTGGGCTTGTTCCGAGCCGGGCTGCTTCTCGGTGACCACGCAGATCGGGGGCATTTGGAGATTTTGCGGGAGTCCTGCAGCCAAGCTCCGGGGCAGGAGAGGCCTGGAAGCCTGCACTACCTGCTCGCCCCGTCCCAGCATGCACCCAG +>ENSE00001658885 +GTGGAGGAGATGCCGCTGTCCCGTCGGTCTGGGGACAGCCCAGCTCCCCGGATCCCGGGCTGGAGAGACGCGTCGCGGCCCCGGGGCCTGGTGGCACGAGCAGGAAGGAGGACCCGGCGGCGGGCTCTGCCTGGGCTTGCCTGGGCTTGTTCCGAGCCGGGCTGCTTCTCGGTGACCACGCAGATCGGGGGCATTTGGAGATTTTGCGGGAGTCCTGCAGCCAAGCTCCGGGGCAGGAGAGGCCTGGAAGCCTGCACTACCTGCTCGCCCCGTCCCAGCATGCACCCAG +>ENSE00001670416 +GAGGAATGAGTCCCCCGTTCTCACCCCGGGGAGCGGTTGCCTCGTGAGTCCAAGGAGAATCCGCCCTTTCGTTTTGCGCAGGTGGAGATCTCGCGGGCCCAGTTCGGAGTCCTGCAAACT diff --git a/pygtftk/data/mini_real_10M/expected_sequence_minus_exon_no_rv.fa b/pygtftk/data/mini_real_10M/expected_sequence_minus_exon_no_rv.fa new file mode 100644 index 00000000..e6b7ed1f --- /dev/null +++ b/pygtftk/data/mini_real_10M/expected_sequence_minus_exon_no_rv.fa @@ -0,0 +1,266 @@ +>ENSE00001611509 +AAAGGCTGAGTCCTCTGAGAATTTATTACTACGGATCACAGCAGCAACGGGCGGGAAGGGCGGCGCCAGACTCATTTGCCCCGCAGGTAGATCTTGGGGGTCTGCCAGCCTTCGGGGGCTTCCTTTAGCCCCGCCTTCAGCCAGATGCGCCTCAGGTCTTTCTCGAACTTGAT +>ENSE00001790281 +AGGCTGAGTCCTCTGAGAATTTATTACTACGGATCACAGCAGCAACGGGCGGGAAGGGCGGCGCCAGACTCATTTGCCCCGCAGGTAGATCTTGGGGGTCTGCCAGCCTTCGGGGGCTTCCTTTAGCCCCGCCTTCAGCCAGATGCGCCTCAGGTCTTTCTCGAACTTGAT +>ENSE00001842703 +GAGTCCTCTGAGAATTTATTACTACGGATCACAGCAGCAACGGGCGGGAAGGGCGGCGCCAGACTCATTTGCCCCGCAGGTAGATCTTGGGGGTCTGCCAGCCTTCGGGGGCTTCCTTTAGCCCCGCCTTCAGCCAGATGCGCCTCAGGTCTTTCTCGAACTTGAT +>ENSE00001629775 +CTGCTTGCGTCTCAGGCGTCCCTCCTGGACCTTCCTCCGCAGGAACCGCGTCTTCTTCACCAGCTTCCGGTACTTGTGGTGGTTCATCTTCCGCCGGCGGATCTTCAGCACGTTTTTGCACTGAATTTGAGGCGCATCCGCGACGCCTTCATCCCCCTGCTCGGCCCCTTCCCCTATCTGGCTGGGCGGACACTGGTAGGATTGCGGTGGAGCCACAGTCCCTGCGGTCCCGGTATCCAGTCTGGGCAGGAAGCAGCGGGCCGTGAGCCAGCTCTCCAGGGGGCTGACGGACATCTTCCTGGGGACCAGCATCTCCTCCAGCTCCAGCTGGGCCCCCTTGCGAGGGAGAGAGGCCGCCCTACCTGGGCCGGCCGGCGATGTGCTGTAAAGGGGCCCGCAGACCCGGCTGCCCAGCACTCCAGAGACGGGCCAAGGCGGGCGGCCGC +>ENSE00001922199 +GGCAGGAAGCAGCGGGCCGTGAGCCAGCTCTCCAGGGGGCTGACGGACATCTTCCTGGGGACCAGCATCTCCTCCAGCTCCAGCTGGGCCCCCTTGCGAGGGAGAGAGGCCGCCCTACCTGGGCCGGCCGGCGATGTGCTGTAAAGGGGCCCGCAGACCCGGCTGCCCAGCACTCCAGAGACGGGCCAAGGCGGGCGGCCGCCTGCAGAAAACCAGACGCCACGGTCACCGCTCGCGAGACCACACAGGCCCGTCGGGTTGAGGAGCAGCAGGTTCGTCCCAGCGAGGATCCCCCGCACCTCATTCCTGGCCTGAACCCCTGAGGTTCCCTCTGTGAGCATCGGAAGCTTAGAGGGGAAAGAGTGTGTGTGTGGCCACCGGCCCTGCCCCAGCGGAGCTGCTGAGACCCGCACTCCTAACCAGGTGTGCATCCTCCCATCCGCCCCCGCGCGGCTTCCTACCTGCCCAAGGAACGGCCCTCAACAGCTGGGAAGTCAGGCGCCCCAGGAGCATGGTCTGTGGGCGGCGGCCACAGGTCCCAGGGGAG +>ENSE00001821535 +GCGGCCGCCTGCAGAAAACCAGACGCCACGGTCACCGCTCGCGAGACCACACAGGCCCGTCGGGTTGAGGAGCAGCAGGTTCGTCCCAGCGAGGATCCCCCGCACCTCATTCCTGGCCTGAACCCCTGAGGTTCCCTCTGTGAGCATCGGAAG +>ENSE00001789693 +CTGCCCAAGGAACGGCCCTCAACAGCTGGGAAGTCAGGCGCCCCAGGAGCATGGTCTGTGGGCGGCGGCCACAGGTCCCAGGGGAG +>ENSE00001896016 +CTGCCCAAGGAACGGCCCTCAACAGCTGGGAAGTCAGGCGCCCCAGGAGCATGGTCTGTGGGCGGCGGCCACAGGTCCCAGGGGAGCTGGAACACAAGTGCCCGTTCAGGTCAGGCGGCAGCGCCTTCAGTAGTCGCGGGCGGGCCGGGACTGGGGCGTCTGGTCCCGCCGCGACCCTCGCTTCCCTTCTCCCTCCGCCACCCCAACCCACAAGGAGGACTTTGCTTCCAACACAGCTCGCGCCCCGAGGCTCCCAAGCCCCCGACGCGGGCGGTGTCGCGCTCGGACGCACCGAAAGGTCCCAGAACGGGGAGGCCGGCCCCCTCCCCGGGTTCACCCCCGCGCGAATCGCGTTGCCTGGCGCCCGGACCCTCTCGGCTGGACCCCGGGCCCGCCTGCCGCAGCGCCCGGCGCCCTCAGGCCTCCCGCTGACCCTTCCCAAGCCCGACCTCGAC +>ENSE00001223521 +CTGCCCAAGGAACGGCCCTCAACAGCTGGGAAGTCAGGCGCCCCAGGAGCATGGTCTGTGGGCGGCGGCCACAGGTCCCAGGGGAGCTGGAACACAAGTGCCCGTTCAGGTCAGGCGGCAGCGCCTTCAGTAGTCGCGGGCGGGCCGGGACTGGGGCGTCTGGTCCCGCCGCGACCCTCGCTTCCCTTCTCCCTCCGCCACCCCAACCCACAAGGAGGACTTTGCTTCCAACACAGCTCGCGCCCCGAGGCTCCCAAGCCCCCGACGCGGGCGGTGTCGCGCTCGGACGCACCGAAAGGTCCCAGAACGGGGAGGCCGGCCCCCTCCCCGGGTTCACCCCCGCGCGAATCGCGTTGCCTGGCGCCCGGACCCTCTCGGCTGGACCCCGGGCCCGCCTGCCGCAGCGCCCGGCGCCCTCAGGCCTCCCGCTGACCCTTCCCAAGCCCGACCTCG +>ENSE00001921648 +CGAAAGGTCCCAGAACGGGGAGGCCGGCCCCCTCCCCGGGTTCACCCCCGCGCGAATCGCGTTGCCTGGCGCCCGGACCCTCTCGGCTGGACCCCGGGCCCGCCTGCCGCAGCGCCCGGCGCCCTCAGGCCTCCCGCTGACCCTTCCC +>ENSE00001479025 +CGAAAGGTCCCAGAACGGGGAGGCCGGCCCCCTCCCCGGGTTCACCCCCGCGCGAATCGCGTTGCCTGGCGCCCGGACCCTCTCGGCTGGACCCCGGGCCCGCCTGCCGCAGCGCCCGGCGCCCTCAGGCCTCCCGCTGACCCTTCCCAAGCCCGACCTCGACGCGGCTCAAATTGA +>ENSE00001479027 +CCTCTCGGCTGGACCCCGGGCCCGCCTGCCGCAGCGCCCGGCGCCCTCAGGCCTCCCGCTGACCCTTCCCAAGCCCGACCTCGACGCGGCTCAAA +>ENSE00001697866 +CTCGACGCGGCTCAAATTGACCGTTCTGCGGCCGCCCTCGGGCACTTCCGGTCCGTCCCCAAGTCGGCCCCGATCGGCAGCGGCCACCCGGCGGTTCCTACGCACAGCGCCCGCTGGCGTCCTCGCGGCCCCCGATTCTGCATTGGCTCAGGCCCCGCCGGGCCCGAAAGGCGACGGTTTCCGGTTAGTGGAATCACGGTCCCAGTCCTCGCGCGGTTCCTCAGCTCCGCCTGGTCCCTTACGGAGGCAAAAAACTACATTTCCCACAATCCCAGGGGGTGCGGGCCCTGGATATACCCGCAGGTCCAGAATCGTTTCCGGACCACCCAGGGGCCGGATTCC +>ENSE00001478064 +ACCACTTAAATACAAACTTTATTCTCTCTCCAAGAAGATGCAGACGTCACAGGTGGCCCTGAGCTCCCACCCGAGGCTTAGGCCCAAGGGGCCTCTTCCAGGCTGAGGGCCTGCTGGGGCTGGGCCAGGGGCTGAGGCTGAAAGCAGCAGCCTGCCTAGTGGGTGACGCCAGGGGCCGGTGTAACATGGCACCGAGGTTGGGGCCACAGCAATGTGTGGGACGGTGGGGTGGGCTGGGGCCCTTGGCTCCAAGCATTAGTTCTCCAAGCTCTGGTCCGTTCTCCTACCTCCTTCAAGGGGCACCAGGGCTACAAGGTGGTAGTTGAGTATTGGGGCCCGACTCCTGGGGCACTGGAGTGGTCTCTAGGCCCGAGGCCCCAAGGAGAGGGCTGGGTTTCTGGGAGAGTGCTGGTCCTTCCTCTCTGGGCTTGGCCATCTTGACAGCTTCATCGTAGGAGGGTGGAGGCTCCGGGGTGTACAGGCTGTAGGCAGGAGGAGCCATGGAGTCCAGGTCCAGCTCCCCAAAGGGCAGGGGCAACCGCATGCCCAGTGGGTACTGCACGGAGCTGTAGG +>ENSE00001754010 +CCACTTAAATACAAACTTTATTCTCTCTCCAAGAAGATGCAGACGTCACAGGTGGCCCTGAGCTCCCACCCGAGGCTTAGGCCCAAGGGGCCTCTTCCAGGCTGAGGGCCTGCTGGGGCTGGGCCAGGGGCTGAGGCTGAAAGCAGCAGCCTGCCTAGTGGGTGACGCCAGGGGCCGGTGTAACATGGCACCGAGGTTGGGGCCACAGCAATGTGTGGGACGGTGGGGTGGGCTGGGGCCCTTGGCTCCAAGCATTAGTTCTCCAAGCTCTGGTCCGTTCTCCTACCTCCTTCAAGGGGCACCAGGGCTACAAGGTGGTAGTTGAGTATTGGGGCCCGACTCCTGGGGCACTGGAGTGGTCTCTAGGCCCGAGGCCCCAAGGAGAGGGCTGGGTTTCTGGGAGAGTGCTGGTCCTTCCTCTCTGGGCTTGGCCATCTTGACAGCTTCATCGTAGGAGGGTGGAGGCTCCGGGGTGTACAGGCTGTAGGCAGGAGGAGCCATGGAGTCCAGGTCCAGCTCCCCAAAGGGCAGGGGCAACCGCATGCCCAGTGGGTACTGCACGGAGCTGTAGG +>ENSE00001478051 +TTAGTTCTCCAAGCTCTGGTCCGTTCTCCTACCTCCTTCAAGGGGCACCAGGGCTACAAGGTGGTAGTTGAGTATTGGGGCCCGACTCCTGGGGCACTGGAGTGGTCTCTAGGCCCGAGGCCCCAAGGAGAGGGCTGGGTTTCTGGGAGAGTGCTGGTCCTTCCTCTCTGGGCTTGGCCATCTTGACAGCTTCATCGTAGGAGGGTGGAGGCTCCGGGGTGTACAGG +>ENSE00001810932 +GGCACTGGAGTGGTCTCTAGGCCCGAGGCCCCAAGGAGAGGGCTGGGTTTCTGGGAGAGTGCTGGTCCTTCCTCTCTGGGCTTGGCCATCTTGACAGCTTCATCGTAGGAGGGTGGAGGCTCCGGGGTGTACAGGCTGTAGGCAGGAGGAGCCATGGAGTCCAGGTCCAGCTCCCCAAAGGGCAGGGGCAACCGCATGCCCAGTGGGTACTGCACGGAGCTGTAGG +>ENSE00003350147 +AGGTCCAGCTCCCCAAAGGGCAGGGGCAACCGCATGCCCAGTGGGTACTGCACGGAGCTGTAGG +>ENSE00003428438 +AGGTCACAGTGCTGTGTACAGGGCTGTCACTGTCCATAGGGATGACTGCCACGTCGCAGGGCTGCCGTGCTGGTGGCAGATGTGGCTGGGCCTGTGCCTGCTTCCGGAGGCAGCAGAACCGGACACAACCAGCTGTGACACCACACAGCAGAAGCAGGAGGACCGCCAGCAGGATGAGCCTAGGAGAGCAAGGCTCTACCACTGGACTGACCCTCGGCCACCGGGCACCTGCACCCTGGGGAATGTCGTGGCACAACCACCGAAGACAGGTTAACAGGATAAAAAGCAGACAATGTCTCTCCATGTCGGAGACCGCCGTGGCCAGAGCCTGGCCTCGGGCTGCTGGGCCTGCCCTGGCTATCTCTCCTGGGCTGGCCAGGGGTGGCCTTGGGCTCACTCCCAGGACTCGCTGTCCTCAGCGAGTGCCCCACTGCTGAGCGGGATCGTAGGGGACTCCCGCGGAGGCCAGGCGGGAGAGGTGGGAGGGAAGGTCCTGCTTGCTCCAGGTCAGTTCCCGCCAGCGGCCGGGACTGGGCGACAGCGGAGGCGGCCTGGTGAGGTAAGGGCCTGGCGGGCCTGGCCCCGGTGACCCCCGCCCCAGAACCGTCGGACGCACGGCTCCGCCGCGGCCTCCACTTACCCCACGTGCCACAGGCTGCTCCAGCGGGCCTGGGGCGGGCAC +>ENSE00003652520 +AGGTCACAGTGCTGTGTACAGGGCTGTCACTGTCCATAGGGATGACTGCCACGTCGCAGGGCTGCCGTGCTGGTGGCAGATGTGGCTGGGCCTGTGCCTGCTTCCGGAGGCAGCAGAACCGGACACAACCAGCTGTGACACCACACAGCAGAAGCAGGAGGACCGCCAGCAGGATGAGC +>ENSE00003675447 +AGGTCACAGTGCTGTGTACAGGGCTGTCACTGTCCATAGGGATGACTGCCACGTCGCAGGGCTGCCGTGCTGGTGGCAGATGTGGCTGGGCCTGTGCCTGCTTCCGGAGGCAGCAGAACCGGACACAACCAGCTGTGACACCACACAGCAGAAGCAGGAGGACCGCCAGCAGGATGAGC +>ENSE00001858191 +AGGTCACAGTGCTGTGTACAGGGCTGTCACTGTCCATAGGGATGACTGCCACGTCGCAGGGCTGCCGTGCTGGTGGCAGATGTGGCTGGGCCTGTGCCTGCTTCCGGAGGCAGCAGAACCGGACACAACCAGCTGTGACACCACACAGCAGAAGCAGGAGGACCGCCAGCAGGATGAGCCTAGGAGAGCAAGGCTCTACCACTGGACTGACCCTCGGCCACCGGGCACCTGCACCCTGGGGAATGTCGTGGCACAACCACCGAAGACAGGTTAACAGGATAAAAAGCAGACAATGTCTCTCCATGTCGGAGACCGCCGTGGCCAGAGCCTGGCCTCGGGCTGCTGGGCCTGCCCTGGCTATCTCTCCTGGGCTGGCCAGGGGTGGCCTTGGGCTCACTCCCAGGACTCGCTGTCCTCAGCGAGTGCCCCACTGCTGAGCGGGATCGTAGGGGACTCCCGCGGAGGCCAGGCGGGAGAGGTGGGAGGGAAGGTCCTGCTTGCTCCAGGTCAGTTCCCGCCAGCGGCCGGGACTGGGCGACAGCGGA +>ENSE00001682091 +TGTGACACCACACAGCAGAAGCAGGAGGACCGCCAGCAGGATGAGC +>ENSE00003599669 +CCCACGTGCCACAGGCTGCTCCAGCGGGCCTGGGGCGGGCAC +>ENSE00003634508 +CCCACGTGCCACAGGCTGCTCCAGCGGGCCTGGGGCGGGCAC +>ENSE00001937932 +CCCACGTGCCACAGGCTGCTCCAGCGGGCCTGGGGCGGGCACCTGTGGGGACGGCGGCACCTGGAGCAGGCGGGGCATGGGACGGCCGACCTCGCCACCCGTGCCTCCCCATAGGGCGGGGCCAGGCCCCGGCTCCCTCCCCCCCGACTTACTGGTCCGAGGGGTCGCAGCTGCCGTCCGCGAAGCCCAGCGCCAC +>ENSE00001767147 +TGGTCCGAGGGGTCGCAGCTGCCGTCCGCGAAGCCCAGCGCCACCTGTGGGGACAAGGGTGAGCCCGGGAGGGGCGTGGTCCGAGCAGGGACCCGCCCCGCGGTGGCCGAACCGAGAGAGAACGCCGCCCGACCCACCTGCGGCAGCGGCAGGAGCGGCAGGAGCGGCAGGAGCGGCAGCAGCAGCCGCAGTCCGCGGGCGGCCAGCGGCCCCCGGGCCATGCTC +>ENSE00001736550 +TGGTCCGAGGGGTCGCAGCTGCCGTCCGCGAAGCCCAGCGCCACCTGTGGGGACAAGGGTGAGCCCGGGAGGGGCGTGGTCCGAGCAGGGACCCGCCCCGCGGTGGCCGAACCGAGAGAGAACGCCGCCCGACCCACCTGCGGCAGCGGCAGGAGCGGCAGGAGCGGCAGGAGCGGCAGCAGCAGCCGCAGTCCGCGGGCGGCCAGCGGCCCCC +>ENSE00003473336 +TGGTCCGAGGGGTCGCAGCTGCCGTCCGCGAAGCCCAGCGCCAC +>ENSE00003561172 +TGGTCCGAGGGGTCGCAGCTGCCGTCCGCGAAGCCCAGCGCCAC +>ENSE00003343061 +CTGCGGCAGCGGCAGGAGCGGCAGGAGCGGCAGGAGCGGCAGCAGCAGCCGCAGTCCGCGGGCGGCCAGCGGCCCCCGGGCCATGCTC +>ENSE00003293243 +CTGCGGCAGCGGCAGGAGCGGCAGGAGCGGCAGGAGCGGCAGCAGCAGCCGCAGTCCGCGGGCGGCCAGCGGCCCCCGGGCCATGCTCT +>ENSE00001239803 +CTGCGGCAGCGGCAGGAGCGGCAGGAGCGGCAGGAGCGGCAGCAGCAGCCGCAGTCCGCGGGCGGCCAGCGGCCCCCGGGCCATGCTCTGAG +>ENSE00003475992 +AGGCAGATTGAAATGCTGACTTTCTCACTGTTTCATTTTGTGATTGAAGTGCGTGCAAAACACTCAATCTGGTAGGGATGATGCCCGCGCGGAGCTGACCCTTCTCCTATTGTTTTTCCAAGCTGGAGAAGAAGCAGGCGCTCCCTCCATTCCAGCCACAGATCACAGACGACTACGGTCTGGACAACTTTGACACACAGTTCACCAGCGAGCCCGTGCAGCTGACCCCAGACGATGAGTGAGTCCCACTGGGTGCGGGTCCCTGGAGCACCCCTCGGGCAGCCCCATGGCAGGCCGGCACCTTGGGCAGCTGGTGACCCAGCCTGCCCTTGAGTCCCACCCGCCTGGTGTCATCTCTCCAGTGGGCGTTGGGGGAGGATTCTTATGCGAACGTGACTCCGCTTCCCCCAAGGGAATGAACACACGGTCACCCCCCTCCCCCCTGCCACCTTTGCCCACAGGGATGCCATAAAGAGGATCGACCAGTCAGAGTTCGAAGGCTTTGAGTATATCAACCCATTATTGCTGTCCACCGAGGAGTCGGTGTGAGGCCGCGTGCGTCTCTGTCGTGGACACGCGTGATTGACCCTTTAACTGTATCCTTAACCACCGCATATGCATGCCAGGCTGGGCACGGCTCCGAGGGCGGCCAGGGACAGACGCTTGCGCCGAGACCGCAGAGGGAAGCGTCAGCGGGCGCTGCTGGGAGCAGAACAGTCCCTCACACCTGGGCCCGGGCAGGCCAGCTTCGTGCTGGAGGAACTTGCTGCTGTGCCTGCGTCGCGGCGGATCCGCGGGGACCCTGCCGAGGGGGCTGTCATGCGGTTTCCAAGGTGCACATTTTCCACGGAAACAGAACTCGATGCACTGACCTGCTCCGCCAGGAAAGTGAGCGTGTAGCGTCCTGAGGAATAAAATGTTCCGATGATGTGGAAGCTCCTCTGATGCCTTTTTTCCGTGAGTGGCGCCTGCCCCACATCTCAGACGCAACCCACACGTAGGGGGGCAGCTTAGGAGCCAGCGGGACACAGGTGGGGGCGGGAGTTGAAGTAC +>ENSE00001817609 +CAGATTGAAATGCTGACTTTCTCACTGTTTCATTTTGTGATTGAAGTGCGTGCAAAACACTCAATCTGGTAGGGATGATGCCCGCGCGGAGCTGACCCTTCTCCTATTGTTTTTCCAAGCTGGAGAAGAAGCAGGCGCTCCCTCCATTCCAGCCACAGATCACAGACGACTACGGTCTGGACAACTTTGACACACAGTTCACCAGCGAGCCCGTGCAGCTGACCCCAGACGATGAGTGAGTCCCACTGGGTGCGGGTCCCTGGAGCACCCCTCGGGCAGCCCCATGGCAGGCCGGCACCTTGGGCAGCTGGTGACCCAGCCTGCCCTTGAGTCCCACCCGCCTGGTGTCATCTCTCCAGTGGGCGTTGGGGGAGGATTCTTATGCGAACGTGACTCCGCTTCCCCCAAGGGAATGAACACACGGTCACCCCCCTCCCCCCTGCCACCTTTGCCCACAGGGATGCCATAAAGAGGATCGACCAGTCAGAGTTCGAAGGCTTTGAGTATATCAACCCATTATTGCTGTCCACCGAGGAGTCGGTGTGAGGCCGCGTGCGTCTCTGTCGTGGACACGCGTGATTGACCCTTTAACTGTATCCTTAACCACCGCATATGCATGCCAGGCTGGGCACGGCTCCGAGGGCGGCCAGGGACAGACGCTTGCGCCGAGACCGCAGAGGGAAGCGTCAGCGGGCGCTGCTGGGAGCAGAACAGTCCCTCACACCTGGGCCCGGGCAGGCCAGCTTCGTGCTGGAGGAACTTGCTGCTGTGCCTGCGTCGCGGCGGATCCGCGGGGACCCTGCCGAGGGGGCTGTCATGCGGTTTCCAAGGTGCACATTTTCCACGGAAACAGAACTCGATGCACTGACCTGCTCCGCCAGGAAAGTGAGCGTGTAGCGTCCTGAGGAATAAAATGTTCCGATGATGTGGAAGCTCCTCTGATGCCTTTTTTCCGTGAGTGGCGCCTGCCCCACATCTCAGACGCAACCCACACGTAGGGGGGCAGCTTAGGAGCCAGCGGGACACAGGTGGGGGCGGGAGTTGAAGTAC +>ENSE00003589214 +GACTTTCTCACTGTTTCATTTTGTGATTGAAGTGCGTGCAAAACACTCAATCTGGTAGGGATGATGCCCGCGCGGAGCTGACCCTTCTCCTATTGTTTTTCCAAGCTGGAGAAGAAGCAGGCGCTCCCTCCATTCCAGCCACAGATCACAGACGACTACGGTCTGGACAACTTTGACACACAGTTCACCAGCGAGCCCGTGCAGCTGACCCCAGACGATGAGTGAGTCCCACTGGGTGCGGGTCCCTGGAGCACCCCTCGGGCAGCCCCATGGCAGGCCGGCACCTTGGGCAGCTGGTGACCCAGCCTGCCCTTGAGTCCCACCCGCCTGGTGTCATCTCTCCAGTGGGCGTTGGGGGAGGATTCTTATGCGAACGTGACTCCGCTTCCCCCAAGGGAATGAACACACGGTCACCCCCCTCCCCCCTGCCACCTTTGCCCACAGGGATGCCATAAAGAGGATCGACCAGTCAGAGTTCGAAGGCTTTGAGTATATCAACCCATTATTGCTGTCCACCGAGGAGTCGGTGTGAGGCCGCGTGCGTCTCTGTCGTGGACACGCGTGATTGACCCTTTAACTGTATCCTTAACCACCGCATATGCATGCCAGGCTGGGCACGGCTCCGAGGGCGGCCAGGGACAGACGCTTGCGCCGAGACCGCAGAGGGAAGCGTCAGCGGGCGCTGCTGGGAGCAGAACAGTCCCTCACACCTGGGCCCGGGCAGGCCAGCTTCGTGCTGGAGGAACTTGCTGCTGTGCCTGCGTCGCGGCGGATCCGCGGGGACCCTGCCGAGGGGGCTGTCATGCGGTTTCCAAGGTGCACATTTTCCACGGAAACAGAACTCGATGCACTGACCTGCTCCGCCAGGAAAGTGAGCGTGTAGCGTCCTGAGGAATAAAATGTTCCGATGATGTGGAAGCTCCTCTGATGCCTTTTTTCCGTGAGTGGCGCCTGCCCCACATCTCAGACGCAACCCACACGTAGGGGGGCAGCTTAGGAGCCAGCGGGACACAGGTGGGGGCGGGAGTTGAAGTAC +>ENSE00001635485 +CAGTCCCTCACACCTGGGCCCGGGCAGGCCAGCTTCGTGCTGGAGGAACTTGCTGCTGTGCCTGCGTCGCGGCGGATCCGCGGGGACCCTGCCGAGGGGGCTGTCATGCGGTTTCCAAGGTGCACATTTTCCACGGAAACAGAACTCGATGCACTGACCTGCTCCGCCAGGAAAGTGAGCGTGTAGCGTCCTGAGGAATAAAATGTTCCGATGATGTGGAAGCTCCTCTGATGCCTTTTTTCCGTGAGTGGCGCCTGCCCCACATCTCAGACGCAACCCACACGTAGGGGGGCAGCTTAGGAGCCAGCGGGACACAGGTGGGGGCGGGAGTTGAAGTAC +>ENSE00003459358 +CCCTCAGGTGAAGGCACAGCTGTCCAGAGCTGAGGCTTCCTAGAGGCAGGGCTGCCAGCTGCCAGGTGTCAGGTGTGGCAGAGCCGTCTTCTGAGCTCCCTGGGAGAGGGGGTCGCGCCACCTCATGCCTCTGAGTGAGGCCTGGTGCACAGGTGTGGAAATTGCCACGCAGCCCTCTTGGCCAGGCGCAGAGACCCCAGGCCTCCATGACTCAGGGGCCGCTCCACCCCATTGTGCGGCTGGTGG +>ENSE00003626371 +CTAAATACTGCCGTGTTGCCAGTAGCGTGCCGGTTACCAGTTTGGCCGTTCTTGTACACAATATGTGAGTAATGCTGTGCTCATCAGAGGGGAGACTTTTATATTCAGTAATTTGTTTTATAAATTAAAGTGAAGGATGTATTGAAGTGTGGTTTGAAAAATCCTGATATTTGCTAATGGCTCCGGTCACGACGGTGTCTTTTGGAAGTGGTTCTCGAAAACTCTGGTGACTTGGGGGCTGCACAGTGGGCCTGCGTGGGCGTGGTGCGGGGCAACTGCCCATGGAGCCCGTGGCTGGCCGGCTCTCCTGTGGATGACACTCACCCTTGACTGCCAGGGTCATTCAAAGTCTTGCACATCCATGAAAGA +>ENSE00003526713 +CTAAATACTGCCGTGTTGCCAGTAGCGTGCCGGTTACCAGTTTGGCCGTTCTTGTACACAATATGTGAGTAATGCTGTGCTCATCAGAGGGGAGACTTTTATATTCAGTAATTTGTTTTATAAATTAAAGTGAAGGATGTATTGAAGTGTGGTTTGAAAAATCCTGATATTTGCTAATGGCTCCGGTCACGACGGTGTCTTTTGGAAGTGGTTCTCGAAAACTCTGGTGACTTGGGGGCTGCACAGTGGGCCTGCGTGGGCGTGGTGCGGGGCAACTGCCCATGGAGCCCGTGGCTGGCCGGCTCTCCTGTGGATGACACTCACCCTTGACTGCCAGGGTCATTCAAAGTCTTGCACATCCATGAAAGA +>ENSE00001862783 +GACGTTTCATCACAACACAGAGACAGACAGGAGCCCGCCCTGCTTTAATGCGCATGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGAGCGTGTCCGGGCGCCGCACTCTGCGCAGGGCTCTTGGATGGCGCTCACCACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGCCTGCAAGGGAGGGGCCACACTCACTCGGCCACCTCCGCGGCATGCTGGCCGCAGAGAGCACCGTCTGGACCTCCGGGCCCTCTCTGCTCCTGCCGCTGGAGAGGATCCGGCTGGTCAGAAACAAGGGACGGGGCCACCCCAGGGGCTCATGCACCCGGCAGACCACGGTAACCGCCAGTGGTGTTTCCACACCGTGCCCGTGAGGAGGCCACGCCAGGCCCCTGCGTCCGAGCTGGGGGTGGGGAAGCTGTGTCTCAACAAGCCTCTCTATGGGATTCTGGCGCCTGCTCAGCTTGAGAACGCGCTCATCGTGGAGCCCGGCAGACAGGCGGCCTGACCCGGAGAAAAGGCAGGACGGCGGGTGGCCTGCCAGGGAGAGCCGCCGCGGCTGCGTCTACAGGAGGCAGAAGAGTAAACATGGCTGGGCAGTGGATGTGCAGCTCACGTCAGAGAATTGGTGTTTCTGGCGAGGAGGGACCAAGCCTCACCACGGAGAAGGACGCCGTCACCGGCGTGCAGGCTGCCAACCTGCCACTCTGGGAGGCCCCACGCGGCCCCTGCACCTCTCAGGAGGGCGCTGGCGCTGGGATGGTGGCCGGCCAGGCAGGGGTGGCAGGAGAAAACCCATCCGAGTCCTGCAGGTCAGCGCCCTGGGCATCCAGTGGGGCCGGGAGGGGTGTCTGAGCGCAGCCACCTTCTATCCCCGGCCTCATGTGGCCCCATCAGCCCAACTGGAGCGGCTGGAAATGACCATCACCAGGCCTGGCCAAGGTGTGGCCCTGGAAGCCAGGACAGTTGACTTCCGGCCATGACTCCCGGAGAGTGCCGGAGCTGGCGTGCTCAGCAGAGCTGCCGGGGACGATGTCCCGGGGCTGAGTGGGCGGCTTCAGCCTAGACTTGGGCCTAGATCTTGCTGGAGGCCAAGTGGTCAGTGTCCCATCAGAGTGACCATCCCTCACACGCCACTGCTGGGGGACACACCCCCACTGAGCGGCCAAGTCCACAGGACACGTGTCCCTGTGTCCACCTGTCAGCCACACCGCCCCTCGCTCCCCTACAGCCTCTGCCCTCAGACCAGTCCACGGCGCGCCGTTTTACCCTTGGGCTTTGCTGTGTCCCTTCCTTTGGCTCCTGTGCCCCGTCTGTGTGGCCACTGCAACCCTCAAGTCCCCCTCTCCAGACCATAGCTGGACCCCCACTCCCGGGGCTGGCTCCAGCAGCCATCAGCTGCCTTCTCACTCTGGCAGAGCCCACCCAGTGCCTTCTGAAGCCCCCGAGGGTCACTCAGTCTGAGACTTTCCGGCTTCTGCCCATCCTGGGAACCAGCCCCTCCCTCCAGAAGCTTTCTCTAAGGTTGCCAGAAGGTGCTAAGATCTGAACCGAGGTCATCTTGTCCCGGGGTTTCCAGGCAGCGTCCCTTGTTTGGGGGCCCTCTGAGATGCCTTCAGACCCCCGCCTGTGGCGGAAGAGCTTTGTCCTGGCCTGATCTGCCCTGTCCGTGACGCTTCTGCTCAGTAGCTGAGCACGCCCTGTGGTGTGGACAGGCCAGCCCGGCTGCAGGACAGTGGGGGCTCAGTCCAGAAGCCTCTGGTGGCTTCTGCGTGTGGGCAGGGGAGCAGGGCTGCAGGGTGGGCTGGCACCTGGCAGCGTGAGGGGCCTCAGGGCTGTTAAAATCCCAACGACCGGCCGGGCGCGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCCGAGACGGGCGGATCACCTGAGATCAGTTCAAGACCAGCCTGACCAACATGGTGAAACCCTGTCTCTACTAAAAATACAAAAATTAGCCAGGTGTGGTGACGCCTGTAATCCCAGCTACTCAGGAGACTGAGGCAGGAGAATCGCTTGAACCCGGGAGGCAGATGTTGCAGTGAGCCGAGATCATGCCACTGCACTCCAGCCTGGGCGACAGAGCGAGACACCGTCTCAAAAAAAAAAAAAAATCCCAGTGACCAACCCAGGGCCTCGCCACATCAACAGAGACAAAACGCAGCTCTGGCTCTCAACATCCTCACCCCTCACCAGGTGCCCAGCTTCCCATCCACCCACGTGACCCGCAGGTGTCTGAAAATGCACAAAATGTCCAAATAGGACCACAAGAAGATCTTAAAGACACAAAGAACATTCTACATAGTTTGTCAAATCCAGCATTTGACGGTCCTCTGGGTGACCCGGAGAACACCAAGGCTGTGAGAAATGGGAGGCCTCCTGGCAGCTCCACTCCCCAGACCCGCCTCTGCCAGGGCTCCAGGCTCAGCAGGCGCCTGTGCGGGACAGGGCGACGGTTCAAGACCAAGTCCGGCTGTTAGACCAGACCCTCCAATCCAGGCGGCCTCCCTGCTGGGGTCCTGTGCGGTCAGGAGTCCCAGGGCATCCCAGGGTGGCTGTGCAAACCCTTGTTCCCAAAGATATGGGGCTTGTCCCCCAGCTAGCCTGCCCATGCGGTGGCCACAGCCTCGGGTGAGTTCCGGTTCCAAAGTACCGGCTCTCCCTTACGATCAAGTGTTCGAATGTGCTTGAAGCATTCCAGACACACCAAGGCCTGGACCTGACTTCATTGACGCCTACTTAGGAAAAATTGAGGCAGTCTGCCAAGCTTTCAGCAACTGCTTAAAAAGCTCAAAATGGCAAGTTTTTCCTCGTGAACGTCCTTGTCTTCAGAAGTCTTTTTTTAGACTATCTGGAAAAGCAGGCGATGCAAAGACAAAAGCCCCTCCCCGGGGGGCGGGGGGCAGCACCCTGACAGCAACAAGGATCTCAGAGCTTCAGCCAAGAGCATGGATTTCTCCCCAGGGCTCCCAACAGTACCCTCTGTCCGTGATTCAGGGTCTTACTCTGTCACCCAGGCTGGAGTGCAGTGGTGCAATCATACTTCACTACAGCCTCCAATTCCTGGCTCAAGGGAATCCTCCCACTTCAGCCTCCAGAGTAGCTAGGACCACAGGCACGCGCCACCACGCCCAGGCATGTAAAGATGGGATCTTGCCATGTTGCCCAGGCTGGTCTCAAACTCCTGGGCTCCAGCAACCCACCTGCCTCAGCCTCTCAAAGGGCTGGGATTACAGGCGTGAGCCACCGTGCCCGGCCTTTTCTTTTGTTGTTGTTGTTGTTGGCTGCCAACTTTGGACTCCGGTGCCTTCGCATTCCCGAGCTGTTTTTGCTTCTGGAAGACCAGGGGCATCAGGCATGACTGAAGGACCTGGTCTCCATAAGCTCTGAAACCTGCCGCCCATTAACTCAACCAAAAGTTACGAACCAGCATCATTCACACCACCCCAGCCCCAGGACCTGCTCCGGAGGCCAAGGGCCCAGAGGTCGCCAGACACAAGGCCAGGCACTGGGCAGTTTGGGTTATCTTGTTAGCAAAACTGGGTTCCATTCCCCTTTACTTAAAAAATACATAAAAATATACGTTGGGTTTCAAAAATAAGAAAAAGCATCTCCAGACAAAAAAGACGATCTTCATTTTTAAAACCCATGACGCACTCTCGGGAAGGTGTTCCTGTGCTCTGGGCCTGGGGACGCTGGTGCCACCAGATTCCAGGATGGCCAGGTGGACCCGGGGCCAGTGCTCCCAGCCTTCCTTCTGTGCTGTTCTGTGGGCCCCCAGCCTGCCCTGCCCACAGAGCACGGCAAGCAGGTGGACCCCAGACCCGTGACAGAGAGCCACCTGGACATGCCAGGCCACAGCACTGGGCCACCTTTCCAGTGTGAAACAGGGCTTTAAAAGCCAGCGCTGAGCTCGGCCACCTCTTGACCTTCTGAACGGCTGTGGTTTCCAAACACGGATGGATAACCGGGCCGGGCGCAGGGGTGGCCTACTCACCTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACAGACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGGGACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCCGGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAGACTTCAGTGGGCTCCGGGCCGCACCTGGGCTC +>ENSE00003569320 +TTTCATCACAACACAGAGACAGACAGGAGCCCGCCCTGCTTTAATGCGCATGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGAGCGTGTCCGGGCGCCGCACTCTGCGCAGGGCTCTTGGATGGCGCTCACCACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGC +>ENSE00003681657 +TTTCATCACAACACAGAGACAGACAGGAGCCCGCCCTGCTTTAATGCGCATGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGAGCGTGTCCGGGCGCCGCACTCTGCGCAGGGCTCTTGGATGGCGCTCACCACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGC +>ENSE00003483048 +TTTCATCACAACACAGAGACAGACAGGAGCCCGCCCTGCTTTAATGCGCATGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGAGCGTGTCCGGGCGCCGCACTCTGCGCAGGGCTCTTGGATGGCGCTCACCACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGC +>ENSE00001951400 +GACAGGAGCCCGCCCTGCTTTAATGCGCATGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGAGCGTGTCCGGGCGCCGCACTCTGCGCAGGGCTCTTGGATGGCGCTCACCACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGC +>ENSE00002033745 +GCCCTGCTTTAATGCGCATGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGAGCGTGTCCGGGCGCCGCACTCTGCGCAGGGCTCTTGGATGGCGCTCACCACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGC +>ENSE00003636009 +CACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGC +>ENSE00003529933 +CACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGC +>ENSE00001602311 +TAGGACCACAAGAAGATCTTAAAGACACAAAGAACATTCTACATAGTTTGTCAAATCCAGCATTTGACGGTCCTCTGGGTGACCCGGAGAACACCAAGGCTGTGAGAAATGGGAGGCCTCCTGGCAGCTCCACTCCCCAGACCCGCCTCTGCCAGGGCTCCAGGCTCAGCAGGCGCCTGTGCGGGACAGGGCGACGGTTCAAGACCAAGTCCGGCTGTTAGACCAGACCCTCCAATCCAGGCGGCCTCCCTGCTGGGGTCCTGTGCGGTCAGGAGTCCCAGGGCATCCCAGGGTGGCTGTGCAAACCCTTGTTCCCAAAGATATGGGGCTTGTCCCCCAGCTAGCCTGCCCATGCGGTGGCCACAGCCTCGGGTGAGTTCCGGTTCCAAAGTACCGGCTCTCCCTTACGATCAAGTGTTCGAATGTGCTTGAAGCATTCCAGACACACCAAGGCCTGGACCTGACTTCATTGACGCCTACTTAGGAAAAATTGAGGCAGTCTGCCAAGCTTTCAGCAACTGCTTAAAAAGCTCAAAATGGCAAGTTTTTCCTCGTGAACGTCCTTGTCTTCAGAAGTCTTTTTTTAGACTATCTGGAAAAGCAGGCGATGCAAAGACAAAAGCCCCTCCCCGGGGGGCGGGGGGCAGCACCCTGACAGCAACAAGGATCTCAGAGCTTCAGCCAAGAGCATGGATTTCTCCCCAGGGCTCCCAACAGTACCCTCTGTCCGTGATTCAGGGTCTTACTCTGTCACCCAGGCTGGAGTGCAGTGGTGCAATCATACTTCACTACAGCCTCCAATTCCTGGCTCAAGGGAATCCTCCCACTTCAGCCTCCAGAGTAGCTAGGACCACAGGCACGCGCCACCACGCCCAGGCATGTAAAGATGGGATCTTGCCATGTTGCCCAGGCTGGTCTCAAACTCCTGGGCTCCAGCAACCCACCTGCCTCAGCCTCTCAAAGGGCTGGGATTACAGGCGTGAGCCACCGTGCCCGGCCTTTTCTTTTGTTGTTGTTGTTGTTGGCTGCCAACTTTGGACTCCGGTGCCTTCGCATTCCCGAGCTGTTTTTGCTT +>ENSE00001720216 +TCTGTCACCCAGGCTGGAGTGCAGTGGTGCAATCATACTTCACTACAGCCTCCAATTCCTGGCTCAAGGGAATCCTCCCACTTCAGCCTCCAGAGTAGCTAGGACCACAGGCACGCGCCACCACGCCCAGGCATGTAAAGATGGGATCTTGCCATGTTGCCCAGGCTGGTCTCAAACTCCTGGGCTCCAGCAACCCACCTGCCTCAGCCTCTCAAAGGGCTGGGATTACAGGCGTGAGCCACCGTGCCCGGCCTTTTCTTTTGTTGTTGTTGTTGTTGGCTGCCAACTTTGGACTCCGGTGCCTTCGCATTCCCGAGCTGTTTTTGCTT +>ENSE00003630334 +CTGCCTCAGCCTCTCAAAGGGCTGGGATTACAGGCGTGAGCCACCGTGCCCGGCCTTTTCTTTTGTTGTTGTTGTTGTTGGCTGCCAACTTTGGACTCCGGTGCCTTCGCATTCCCGAGCTGTTTTTGCTT +>ENSE00003481862 +CTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACAGACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGGGACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCCGGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAGACTTCAGTGGGCTCCGGGCCGCACCTGGGCTC +>ENSE00003510741 +CTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACAGACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGGGACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCCGGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAGACTTCAGTGGGCTCCGGGCCGCACCTGGGCTC +>ENSE00003548540 +CTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACAGACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGGGACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCCGGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAGACTTCAGTGGGCTCCGGGCCGCACCTGGGCTC +>ENSE00003634783 +CTGTCCTGGGAAGGCGGGCAGTGAAGGCACCTCGTGATCCAGGATCAGCTCCGGGCTCACCGTGCGCAGTAGCTCGGCCCAGAGCCGCTCCCGCTCATCACCCCCCAGGAGAAACCAGGGGCGGCCGCCAGAAGGC +>ENSE00003467961 +CTGTCCTGGGAAGGCGGGCAGTGAAGGCACCTCGTGATCCAGGATCAGCTCCGGGCTCACCGTGCGCAGTAGCTCGGCCCAGAGCCGCTCCCGCTCATCACCCCCCAGGAGAAACCAGGGGCGGCCGCCAGAAGGC +>ENSE00001841545 +CTGTCCTGGGAAGGCGGGCAGTGAAGGCACCTCGTGATCCAGGATCAGCTCCGGGCTCACCGTGCGCAGTAGCTCGGCCCAGAGCCGCTCCCGCTCATCACCCCCCAGGAG +>ENSE00001816369 +CTGTCCTGGGAAGGCGGGCAGTGAAGGCACCTCGTGATCCAGGATCAGCTCCGGGCTCACCGTGCGCAGTAGCTCGGCCCAGAGCCGCTCCCGCTCATCACCCCCCAGGAGAAACCAGGGGCGGCCGCCAGAAGGCCTGGGGCAGACAGAGAGGGCAGACAGGGGGTACTCAGTAGCGGAAACGCTATGGTGGGGAGACCCGGGAGGGCCTGGGGC +>ENSE00003618179 +CCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCGCC +>ENSE00001545345 +CCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCGCCGCCTCCA +>ENSE00001822711 +CCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCGCCGCCTCCATCCAAGCCCGCGCCGGGCGGAAGTGA +>ENSE00002226200 +CCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCGCCGCCTCCATCCAAGCCCGCGCCGGGCGGAAGTGAG +>ENSE00001477870 +CCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCGCCGCCTCCATC +>ENSE00001816144 +CCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCGCCGCCTCCATCC +>ENSE00001720995 +CCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCG +>ENSE00002040955 +CTTGTCCTGCCTGTCCTCAAGTTATCAGCATGACACAGCGGTGCTGGTGATGGTGATGGTGGAGGTTTCAAAGTTGAACCTGATGAAAACGCTCCACTTCTTCGGAGCCATCTGCTGCTGTGGTGACGGAGTTTTGCTTTATTGGAAAATAATTTCTGGTTGGGACTGACACGTGCACAGTGGAAATGAGTTTTTTCTAAGCCAAAATTCATGTTTACAAAAGAACGTTTCAGCTGTGGGAGTTTGCATCCCAGGCAGAGCAGAAGGTGATCGAGTGGGTGGGGGCATCAGAGCCACCCATCTCCTACTCCCGCACCTGCAGACCGGTGGGCTAGGAGGCCCCTTACCCTCTGTGGCAAAAAAGGACACATTTATGGATGATGAATCAGGCCCCAGCCCACTGAGCTGGTTTCAGAAGCCAGGCTGGCCGTAGGTCAGGGAGCCAGGCCTCTCCAACTCCTTCCACCGCGGAAGAACAAGTGTCCCAGCCACTGGCATCCTCAGAGTCACCCAAATGTTCATCTCTGCCCAGCGCTGACACCCTGCAAATCAGGCTAAGACAGCGGTGACGGGCCCTGAGGCTGGCAGGCCTAAGCAGCCCGGTGGCCGTGCACCCTCCCAATTTCCAAATGAGACCTGTGGCCGACAGGCACCCTGGGCACATGCTGAAGGCACTGGGCTGCCTCCACCCCTTCCCATGTGGCTAAATGGCCCAGCACCCACACACGGTGCCCTGGCAGTGCTCACCTGCTGGCAAGGACAGCCAAAAGGCCCGGGCAGCCTTCTGACGCAGCCAGGAACTGGGCTGTGCTCCACCACACCTGCTGGCCCGTGGATGCCAGGCAGGCACGCCCACCCATAGCCAGATGTGGTGGCATTTATGGGATACGGGAGTGCCAGGCAGACAGGCTGTGAGAGACAGTTGCCTGGGAAACATCGCCAGATCTTTGGGGCAGCAGAGCAGGTGCTCGGGCCCACACATGGGGTGCAAGAGTAGGGGTGTGCCTTGGTGCCCTTGGGCACCGACAGCCTCCTCACAGCCTCAGTGGCGGGGTCATGGCACAGGCCTGCCCCTGACCCCAAGAACCAGAAAGCCAGGAGCAGCTGGGGAGGGCCCTGGCCCGGGAGAGACAGCGGTCCTGTTTCTGAACCCCATCCCAGCCATGGCCTGTGTCTGGGCCAGCATCCCCGACCAGACAGGGCCAGCCGCCCTCTCTCAAAGTCCCCAGCACCCCTTCAAGCAGTATCCGGTTCACACCCTCCCACAGCCTGTCCTCCATCCCCACGTGTCGGGCTCAGCTTCCGCACCACTCAGCCCCCACCCAGGGGCGGGCTTTTATCAGCCCCAGATCCTGCTCTGACGTCCCCCCGCCCGGAGAAGCTTCCCCAGCCCAGCCCAGCCCAGCCCAGCCCAGGCTTCTCTCTCCACCCCACTGCCCTGCTGGGAAATTGTGAGCTCAGATGCTGATTGGTCTACCCAGGAGGGCGGTCCTGTGTGCTCTGTTCCCTGGGAAGCCTCTCAGAGTGCGCGGCACCAAGGAGCCGGTCAGGGAGTGGAGACCTCTCAGGGCACCCCTCCTCTGGGGAAGGCAAGTCACAGAAACCAAGCTGGAGGAGCACTGTGGGTTGAGCAGCGTCTCCGAAGACTCATGTCCACCAGTACCTGAGAAAGTGGCCTCGCTCGGAAGCAAGGTCTGTGCCGATATAATCAAACCAGGATGAGGCGATACTGGGTTAGGGTTGGCCCTGAATGCAGTGTGAGCAGTGTTCTTGTAAGAAAAGGAAAATTGTCCGGGTGCAGTGTCTCACGCCTGCAATCCCAGCACTTTGGGAGGCCGAGGCGGGCAGATCACTTGAGGTCAGGAGTTCTAGACCAGCCTGGCCAACATAGTGAAACCCCG +>ENSE00003615416 +CTTGTCCTGCCTGTCCTCAAGTTATCAGCATGACACAGCGGTGCTGGTGATGGTGATGGTGGAGGTTTCAAAGTTGAACCTGATGAAAACGCTCCACTTCTTCGGAGCCATCTGCTGCTGTGGTGACGGAGTTTTG +>ENSE00002044438 +TGGTGGAGGTTTCAAAGTTGAACCTGATGAAAACGCTCCACTTCTTCGGAGCCATCTGCTGCTGTGGTGACGGAGTTTTG +>ENSE00001853635 +CTGCTGGCAAGGACAGCCAAAAGGCCCGGGCAGCCTTCTGACGCAGCCAGGAACTGGGCTGTGCTCCACCACACCTGCTGGCCCGTGGATGCCAGGCAGGCACGCCCACCCATAGCCAGATGTGGTGGCATTTATGGGATACGGGAGTGCCAGGCAGACAGGCTGTGAGAGACAGTTGCCTGGGAAACATCGCCAGATCTTTGGGGCAGCAGAGCAGGTGCTCGGGCCCACACATGGGGTGCAAGAGTAGGGGTGTGCCTTGGTGCCCTTGGGCACCGACAGCCTCCTCACAGCCTCAGTGGCGGGGTCATGGCACAGGCCTGCCCCTGACCCCAAGAACCAGAAAGCCAGGAGCAGCTGGGGAGGGCCCTGGCCCGGGAGAGACAGCGGTCCTGTTTCTGAACCCCATCCCAGCCATGGCCTGTGTCTGGGCCAGCATCCCCGACCAGACAGGGCCAGCCGCCCTCTCTCAAAGTCCCCAGCACCCCTTCAAGCAGTATCCGGTTCACACCCTCCCACAGCCTGTCCTCCATCCCCACGTGTCGGGCTCAGCTTCCGCACCACTCAGCCCCCACCCAGGGGCGGGCTTTTATCAGCCCCAGATCCTGCTCTGACGTCCCCCCGCCCGGAGAAGCTTCCCCAGCCCAGCCCAGCCCAGCCCAGCCCAGGCTTCTCTCTCCACCCCACTGCCCTGCTGGGAAATTGTGAGCTCAGATGCTGATTGGTCTACCCAGGAGGGCGGTCCTGTGTGCTCTGTTCCCTGGGAAGCCTCTCAGAGTGCGCGGCACCAAGGAGCCGGTCAGGGAGTGGAGACCTCTCAGGGCACCCCTCCTCTGGGGAAGGCAAGTCACAGAAACCAAGCTGGAGGAGCACTGTGGGTTGAGCAGCGTCTCCGAAGACTCATGTCCACCAGTACCTGAGAAAGTGGCCTCGCTCGGAAGCAAGGTCTGTGCCGATATAATCAAACCAGGATGAGGCGATACTGGGTTAGGGTTGGCCCTGAATGCAGTGTGAGCAGTGTTCTTGTAAGAAAAGGAAAATTGTCCGGGTGCAGTGTCTCACGCCTGCAATCCCAGCACTTTGGGAGGCCGAGGCGGGCAGATCACTTGAGGTCAGGAGTTCTAGACCAGCCTGGCCAACATAGTGAAACCCCGTCTCTACTAAAAAACACAAAAATTAGCTGGGTGTGGTGGTGGGCGCCTGTAGTCTCAGCTACTCGGGAGGCTGAGGCAGGAGAATCGCTTGAACCCAGAAGGCAGAGGTTGCAGTGAGCCAAGATTGTGCCATTTTACTCCAGCCTGGGCAACAGAGCAAGACTCCGTCTCAAAAAAAAAAGAGAGAGAGAAAGAAAAGGAAAATTGGCCAGGTGCTGTGGCTCATGCCTGTAATTTCAGCACTTTGGGAGGCCGAGGCAGGTGGATCATGTGAGGTCAGGAGTTCGAGACCAGCCTGAAAGACATCGTGAAACCCCATCTCTACTAAAGATACAAAATTAGCTGGGTGTGGTGGTGGGCACCTGTAATCCCAGCTACTTAGGAGGCTGAGGCAGGAGAATCGCTTGAACCCAGGAGGCGGAGGTTGCGATAGGCCGAGATCGTGCTGTTGCACTCCAGCCTGGGCGACAAGAGCAAAACTCTATCTCAAAAAAAAAAAAAAAAAGGTAAGGAAAATTTGGACACAGAGACACAGGAAGGAGGCTTTGGGGTTGGGGGTGGAGCAGCTGCACGCCAGGGAATGCCGGGGGCCCGGGGCTGGAAGGGGCAGGCAGCAGCCACCCAGAGCCTTTAGGCGGAGCTCCACCCTCCCAACCACTGATTTTGGACACCAGCTGCCTGAACTGTGAGAATATACATGTCACTCGTTTTAGGCTCCCAGTGTGTGGTCATTTTTTCACAGCAGCCCCAGGAGACACGCAGCAGGCTCCCGGCTTTCCAAGCCGCCACGCACCAAGTTCAGCTTGAAAACGCTGAGCCCAGCTGGGTGCGGGGAGCCCTCGGTCTCCTGTCCACCACACCCGGAGCTGAGGAAGAGGCTCCCCCATGGGCCAAGAGCTGGAAGGGGGCCCTTGGAGGATCCCCCAAGGTCCTCCAAGTGGGCCAGGAAACCTCTGCAGGTGGAGAGGGTGGCTGGGACCCCCTCGGGAGTCCCCAGGGAAGGTCTGGCTTCTCGGCTCTGTAGAATCAGCTTTGTCCCCAGTTCAGCACGTTTTTATGGGAAATCTGCTGGCTGGGGACAGCCCTTGATGTCCTGAGATGAGATGCTGCCTGGTCCCTGCACCTTCCAGGACCCAGCTCACCTGTGGCGCACAGGTTTCCACTTGTCATAGGAAACTGTGCTTGGTGCATCCCCTGTGCAGCCGGCTGTGAACTGTGGGCTCCAACCCTGCTTGGTTTGCTTCAACTTTCTGAGTGACGTGCAGACCTTCACAGAGGAGCCGTGGGGTGGCTCCATCCAACGCCTCCCTCGCTGCCC +>ENSE00001859055 +CTGTGGCGCACAGGTTTCCACTTGTCATAGGAAACTGTGCTTGGTGCATCCCCTGTGCAGCCGGCTGTGAACTGTGGGCTCCAACCCTGCTTGGTTTGCTTCAACTTTCTGAGTGACGTGCAGACCTTCACAGAGGAGCCGTGGGGTGGCTCCATCCAACGCCTCCCTCGCTGCCC +>ENSE00002034769 +CGGTGCAGGCCACCCTGCTGCTCCAGCTCAGTCCAGCACAGGTGTTCTCGCTCTGGGGTTGGCCTGGCGCTGACCTGTGCACCTGACAGGGAAGGTAGGCAGCTCTGGAGCTGGCTGGTGCCCCTCACCTGGGGTGGAGCTGGGGCAGGTCCCACATTTCTCAGAAGGACTCCAGGATGCAGCTGCGTCTGGGGCCTGAGCGGAGGGAAGATATCAGGCTGGGGCCGGCTGCTGGGCCTGTCCTCTCTGAGTTGCCTCAAATCCCCTGTTCCTTGAGCGGTCCTGGAGCCTGGCCTCAGGCCTCAGGGCACCACACTACTTGCCTCCAGGGACCAGCCTGTTCACCCCACACCCAGCCCTGTGACAGAGGTGCTGTCGCGTGGCCCCACTTACAGATGGGTCAACTGAGGCCCGGGGCATCTGTCCACTTGTCATGACAGTGAGCGG +>ENSE00001916683 +CGGTGCAGGCCACCCTGCTGCTCCAGCTCAGTCCAGCACAGGTGTTCTCGCTCTGGGGTTGGCCTGGCGCTGACCTGTGCACCTGACAGGGAAGGTAGGCAGCTCTGGAGCTGGCTGGTGCCCCTCACCTGGGGTGGAGCTGGGGCAGGTCCCACATTTCTCAGAAGGACTCCAGGATGCAGCTGCGTCTGGGGC +>ENSE00001937728 +CTGGGGTGGAGCTGGGGCAGGTCCCACATTTCTCAGAAGGACTCCAGGATGCAGCTGCGTCTGGGGC +>ENSE00001845014 +CTTTTGGAGGGAGTGGCCCAGCTCTCCCGGCCTTTGCCACCCGGCGTCCTGTCCCAGTTTATCTGTGTCCAGTCCGATTGATGGGCTCATGGATTGGAAAGCTGTGACAGACGCCCTGGG +>ENSE00001908868 +CGTGGGGTGGGTGTGATTCTGAGACTAAGGCTCTGGGGGCCGGGCGTGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCCGAGGCGGGCGGATCACGAGGTCAGGAGATCGAGACCATCCTGGCTAACACGGTGAAACCCTGTCTCTA +>ENSE00001934415 +TGGAAACTCCCTGTCTTGGGGCCGCGCACACCATGCCTGGCAGGAGCTGGAGATGCAGCAGAGCAGACGCGGCTGCAGGAGCAGCCGTGTTTCCTACAGTGGAGAAGGGGACCCTGGCAGGAGCACTGCCCAGCCAGGCACGTGGTGCTCAACCCTGTGGGCACTGACCCCACAAAAG +>ENSE00001714381 +TGCTGGGATTACAGGCGTGAGCCACTGCGCCAAGAGCAAGCTTCTGATGTAGGGGCTGCGGGGGGCTTCCCAGGCCAGGCAGGTTGCTGTCTCAGCGCCAGCGTGTAGCCTCCTCCCAGGATCCGGAGCAGGAGGGTGGCTGTCTTTTGCGTTCAATCCGCTGGGCTGCTGTGGGGTTCCCGCAGAGCTGCTCCAAGGGGCCGAGAGAAGGAAGGACGCTGCCCCCAAGGACAGACGGGCAAGCTGGAGTCAGGAGAGGCGCAGCCGTGGCCCACAGGCCTTGGATCT +>ENSE00001821386 +CGAGAGAAGGAAGGACGCTGCCCCCAAGGACAGACGGGCAAGCTGGAGTCAGGAGAGGCGCAGCCGTGGCCCACAGGCCTTGGATCT +>ENSE00001724829 +CTCCAAGGCCTGGGCGGCAGGAAAGG +>ENSE00001927358 +CTCCAAGGCCTGGGCGGCAGGAAAGGGAGAGATGACGTCATTGCCGCCTGGAATCTGCTGTTTGGAGGCGTCGCCATGGAGACCGGAAGGCTCAGGGTGGGTAAAAATAGCAAACCCAAAAGGGTGTAAGTTCCAAGAACGCGAGTCTCTGAAAAGCGAGGCATCCATGTTC +>ENSE00001755234 +TAGTTGTATAAATCAGCAAGTATTTATTTTAAATAATAAAACTACAGTTTTATACCATACATATTTACAAAAATGCTTTGCTATAGAAAAATAGAATCAATCACTGAATCCAGACCACCACAGTGGAGAACCTCCTGGTGAAGCTGTGTTTTTTCCCACACTGGAAACACAGAGTAGCCCTGTTTCTGCACACGTTAGTGCACCGCTGCTACGTGTGGCCGCCCAGCTGTCTGCAGGCTGTGCCGACCACTGCCTCTGTCTCCAGGAAGCAGAGGCAGAAGTGATCCTTGCTGAGGAGGGCCATCGAGTCTCCGCTTAAATGCCAGCACAGAGAGAGCACTGCAAAGTCGCCTAGAGAGAGACAGGTGGCCAGAGGATTACAGCAGGGGAGGCCCAGATTCTGGGGGATGGGCACCCCCTTGTCCTGCAGGCCAGCACAGTGCCTGGAGTGACCCACATAGGCAGAGCCAGGGTGGAGCCCCAGAGCTGCCTCAAGTCAGGGAGAGGCTGCTTCTAGCCCATAAAGCTGAGGGCAGCGGGTCCCCTGTGTGTCCGTCTTGAGGTTTACGCAAAGACTCTGAGGGCAGTTTCCCTGGAGTGCTGCCGGAGACAGCAGCTGGGCTTCAACAGTTCAGCCCGTGTGATGCCAGACTGCACACAGCAAGGCTGCCACGTCCGTGGCCTCGGGGATGTGCTTACCTTCCCCAGGCACCTGCACCGACATGCAGCCCGCTGGGGACCACAGGTAGAGCCTGCTGCCTCCCGTGCAGATGGCCAGCCGCGGCTGCTGCGGGTCCCACTGAAATGCGCGCACTGGGGACAGCTGCTCGAGCACCGCGAACAGCCTCAGCTTCTGAATGTCCCAGACCCAGACGGCATTGGGAATGTTGT +>ENSE00001697450 +TAGTTGTATAAATCAGCAAGTATTTATTTTAAATAATAAAACTACAGTTTTATACCATACATATTTACAAAAATGCTTTGCTATAGAAAAATAGAATCAATCACTGAATCCAGACCACCACAGTGGAGAACCTCCTGGTGAAGCTGTGTTTTTTCCCACACTGGAAACACAGAGTAGCCCTGTTTCTGCACACGTTAGTGCACCGCTGCTACGTGTGGCCGCCCAGCTGTCTGCAGGCTGTGCCGACCACTGCCTCTGTCTCCAGGAAGCAGAGGCAGAAGTGATCCTTGCTGAGGAGGGCCATCGAGTCTCCGCTTAAATGCCAGCACAGAGAGAGCACTGCAAAGTCGC +>ENSE00001797222 +CTTCCCCAGGCACCTGCACCGACATGCAGCCCGCTGGGGACCACAGGTAGAGCCTGCTGCCTCCCGTGCAGATGGCCAGCCGCGGCTGCTGCGGGTCCCACTGAAATGCGCGCACTGGGGACAGCTGCTCGAGCACCGCGAACAGCCTCAGCTTCTGAATGTCCCAGACCCAGACGGCATTGGGAATGTTGT +>ENSE00001862304 +TTTTTTTTTTTTTTTTAGCCCTTTACAAATGGAGAAACCCTTAACAAAAGGCGGGCTGCAGTGTGCCCAGCCCTGCTTTCTACTCAGCAGAGTGGAGCAAGTGAGCAGGGTGGAGGCCTCCTGACTCATGCGCGGACCTGCGGCTGCTGCAGGACAAAGGCCCAGCGCCTCCAAGGAGCTTCTGTGAGCACCTCGGCTACTGCAGAAACGTGAAAGGAGGTGACGTGTCGGAAACCCCCAACTTCATTTTCTTTTCCAGTCGCTTCTACACCTGGGGCCACAGGACACAGTAAAGGGTGAGACAGCACCTGCGTCAGCACAACTGACCGTTCCTTGTCGCCAGGAAGTAGCTGTCAGGACTAAATGCCAGCATTCCTATGCCGATTTTCGGGTTTGCTCTGTCGGTAACAGGTTTCAGTGTCTGTAAGGAGACTGGGACAGAGGCGATCTCATCTAGAACACCAACAGGAAGAACACGCCATTGTCACCCTTTCGGGAAGTACGCACGCGGCTGAGAGGCTGCTGTGCCTGCATCGGGCATCGCGAACCCAGCTCCTCTGTTCAAAGGGGAGGAAAGTGCGGCCCAAGGGCAGGAAGAGCTAAGCAAAGCCTGGCAGCCGCAGCGAGGGGCCTGCCCGCAAGTGCCCCGGATGAGAGTGGCACCATCACCTGCCAGGCCCGACTAGGTGGGGGGTGGACCCCACGTGCCAGGGGCTGACTGGAGAGGGACATGGACAGGTCCTAGCTGCAATCTCAGCAGCTCCAACTCCTCAGCACTTTTCTGTCGACTACCAGCATCTGAGTTCACAATCCCTTCCACCTCAGCGTCAGTACCCTTAGACTTTCCGGCTGTGGAAGAACCATCATCACAGCAGAAGCAGGGGCTGTGGAACAAGGACGCCCCTGGGCTCCTGGGGAGCGCCTCCTGTGTGCCAGGCTGCACCTGTCCTGACCCCCATCCTGAGCACACACCGAGCCCCGGGGTGGGCCCGTCGGCACTTGGGGCACCGCTTCCTCTACCTGCAACCTTCAGATGCCCTCATGCCCCTGTGGGATGGGTGCTTTTACTATGCCCATTTCAGCGATGAGGAAACAGACACATAGGAAATGCCCAGAGTCAAGAGGCTGCATCAGAACCGGGCCTCAAGCCGGAGACAGCGCTCGGGAGCACCGCCGGGTTCCAGACCCACTCTGAGCGCCACCCACGGAAAAGTGTTTCTTTGAAAAACATCATTCTCGGAGCTCCGGAAAAACATCCCCTCGGAGCTCCCGCTGTCAGATCCGGGTCTCCAGGGCTCATATTCAGTAACAGAAGCCGCACCTTCACGGCCCACTGCGCAATTCAGACCCTAGTCAACCTCCAGCCAACAGGCTGAGGGGCACACTGGCTGGAAGCATGGAAGGGAAAAAAAGTTTTTTTTTTTAAACATAAGGAACATCCGAAGTTTATCTGGACAACGAGGAATCTTGCATTAAAAAAGGAAAACAAATGACATCACATGTGCTACTTACATTTACTCTCTGAGCTCGGGAGAGGGCCGGCCCCGGCCCGGGGCGGCGGGAAGGAGAGGCAGCCCAGTCCCAGCTGTGGGCTCTTCTCGGCCTCCTTATACACCACCTGAAAGACACAAGGTGGCCACGCCCGGCTCAGGACAGGGACCCGGAAGCCAAGGATGGACGTGGCAAATGCCCATGACAGCGCATGGTCAACAGGTGTGCCTGCCATGACAGCTGGTCCTGCTGCCACCGGGAGAGACGGAAGCACGAACCCCGCAGTCCCGAGAGCTGAGATCACCCAGCCACCCTCTCTCGTGTCCTGCTGAGGAGCCCACCCTTTGAGACACAGGCAGCAAATGTGTGCCCTGTGATTACAGACGGGAGACCACTGCAGCCACCATCATCCAGCAAGGGAGTGGGCTCAGCCTTCCCTCCGTGATAAGAGGATACAGAGAACACTTGCACCAACACAGCAGAGGCCCCGGGAGCAGCAGACACAGACCCGAGGTGGGGGCATCTGTGCCCGAGAGCCTGGCAAGCAAAGGACAGCGGCCCAGGCTCAGTGGAAGGCGGGCAGCCCCTACGCCCCTGAAGAGCCCCAGGTAAGGGAGTCACCTGGCCTGGTTCATGCCTTTAAAGCATGCTCTGCTGCTGTGTGGCGAAGGGATTTGGAGAATGCAGGAATCACAGGCAAACCTTCAGGACCTGTGTGGCCAGCCCTGCTCGGGCTCACCTGTCCAGACACCCTGGCCTCCAGCCACACAAGCCACTGGCCACGTCAGGAGGCCCCTCTGCCTGAAACACCCTTTCTGCCCAGACACCGCGCAGCTCCTCCTCCTGGTCTTCACTTAAACACCCCTCCAGGATGCATCCCCGGCAGTGGCTGATCTGGCATGCGCAGCCCCAGCCACTCACTGGCCTCTTCATCGAATCCAAGCCGCCTTTCACTCAGCTCTGTCGGTTACAGGTCAACACCAGGAGGGCAGCATTTGTCTCTGGCTCCCAGCGCAGTGCCCGCTGCACACATGGATGCGTGGCCCACTCCTCGGGGCCTTTGCATTTCCTGTTCCCTTGGCCTGGAACGCTCCCTCCCCGAGTCCCTGATCACTGGTGCAGCATCTGTGCCTGCGATCCCTCGCTGGTGGCCACTCCCTGCCACCCCGTGGAGACACCCAGCTCTCCAGCCCCTTCCCTGTCTCTCCAGCCGCACTCTGCAAGTGCAGGGGTCTGTCTCTTCTTCTCTGGCTGCGGCCCAGAGCACAGTGCCTGGCACGACAGCAGATGCCCAGTGTTTGGGGGCAGGAGACCCTGGCCACTCTGTACAGCACAGGGATCTGCATCCAGACAGACCACAAAGGAGAAAACTGGACTGGGGTGGCAGCGGCAGAGGACAGGCCAGGGCAAGGCCCACTTCAGACCCTTTGGGCAGCGTGGAGGAGGAAGAACAAAGGCCAGGGCAGGGCCAGACGCGTGAAATGTCACAGTAGCAAGTTTACGGTGATGGAAGTGCCCGGTTAAATAATAAACCACAATCAAGAAAGCAAAGTGAAGGAGCAGTTTCCCACCGCCCTCCCCAACAGCCTGCTCAGGCAGAAACACGTGTTCCAGACTTACTATCTTGGGATCATTAATGGCTGCAGGATGCCCAAACTCCGTGATCATTTTCCAAGTCACGTGATTAAGGATGCGCACCTGAGGAAGGAAACCATGCACAGGTGAGGCAGGGCCCGGCCCGCTGGGCGGTCGGACTTCCTGAGTGCCCTGCACTGGTTCCCACCTTTCCATCATAGCTCCCAACTGCCAGGAACTGACTGCTGGGGCTCCAGGCCACAGACTTGATGCCCAGGGACCACTCGTAAGCGCTGTACGTGGACAACAACCGGCCATCCAATGAGTACAGCAGAATCTTGTACTGCAGATGAGACATTTCAGTTAATAATGAATACACCCCCGTCGCCAGGAACACACCACAGACGCGGGTGCTGCAGAGTGACATTGGTGCAGATAGCACAAAGCTGGCAGGACTGTCCGCGTGGCCGTGGAAAAGCTGGAACTGCCAGCTAGTACTGAGATAGTCACGGAGAGGCAGTGAGAGCATGAGGAAAAAGGGGAAATTGGGAGGTCAACCTAATGGCTCGCTGATAAAAGTTCAACTCGGCCGGGCACTGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCCGAAGCTGGCAGATCACTTGAACACAGAAGTTCAAGAGCAGTCTGGGCAACACGGTGAAACCCCATCTCTACAAAGAATACAAAAATTAGCCGGGCGTGGTGGTGCATGCTTGTGGTCCCAGCTACTTGGGAGGCTGAGGTAGGAGGATCACTTGAGTCCAGGAGGTCGAGGCTGCAGTGGGCCGTGATCACACCACTGCACTCCAGCCTGGGTGACAGAGCAAGACCCTGTCTTTTAAAACAAAGCTCAACTTGTTATCTGAAATAAGATAAAGCAAACTATATTGCAGCATTCAGAAAGCATGAAATTCCGGGAAAAGCTCTCGAAAGCAAACATGTCACCTGGTCATCTTCATACCTCCAAGCAGGTGTCCCACACTGCCAGCACACAGCCGTTTGGGGCCCACTCAATCCCTGTGAGATCCTGGGTGTCCGTATCAAAATGCTTCCAAAGGAAGGGGGGGAAACATTAAATTTGGAAAATATTTTCGTAAATAAATAATTGCATTTATGACTGATGTTCTTAACGCACTTAATTTCCTTATATAGAAATTGACAAAATCTCAACAGCTCTATCCTGGAAATGCATGAAATCCCTGTAGAGCTGCTGCTGGGGCTGCACCGCCACAGATGCCAGCGTCAGTGCCTGGCCAGCCCCCAAGGGCGGCTTGGTCTCCCCGCGCCTGCACTCGTGTGCACACTCTCCCCCTCACCTTTCCTTGCCTGGCCAGCCCCCGAGGGCGGCTTGGTCTCCCCGCGCCTGCACTCGTGTGCACACTCTCCCCCTCACCTTTCCTTGCCTGGCCAGCCCCCGAAGGTGGCTTGGTCTCCCCGCACCTGCACTCATGTGCACACTCTCCCCCTCACCTTTCCTTGCCTGGCCAGGCTCACTCCTTTAGACCCAGCTCAGACAAGTCCCTTCCAGAGCACTGCCTGGATCCCGGGTTCTGCACTCTGACAGCATTCCAGAGGTTGCTCTACCTTAATGATGGATTGTGCTGGAATCGTGTTCATATGTCTGCTGTGGGGGCAGTGCCCTCTGTGCCTGGGCACCTGGCAGAGCGCCCTGCCTAATGCAGGCCCTCAGTCAAGGTGAACTTCCACGTCCCCCCAACTCCCGACGTGGCACACACATGCGCAAACACCATCACACAGGACAAGGAAAAGGGCTCAAATGTGACAGCATATTCACTTTTAAAACACCTGGGCACGCGTCCTTTTCACCAAGTCTCCTGAACACACAACCGGGTGCCACTGGAAGTGATTCGCAGCGCACCTGCCCTTTGTTAATACAACATCACCTTGCTCCATATCCTACCAAAGATCCCCTGGAATCTGGAAGGATCTACTTCACTCGATCCCTCCACAGTCAGCAGGACAACTTTATTCCAGTCTGGGGGACGCCTTACCCGCAGGAGCTGCCAATCACTGCAGACGAAGATGCTCACGTAATCTTTGCAGTCGCGCCGTTCTGCCAGCGCCATGTAGCGGCCGTCCCTGGTGAAGGTGATTC +>ENSE00003789737 +CGTTCCTTGTCGCCAGGAAGTAGCTGTCAGGACTAAATGCCAGCATTCCTATGCCGATTTTCGGGTTTGCTCTGTCGGTAACAGGTTTCAGTGTCTGTAAGGAGACTGGGACAGAGGCGATCTCAT +>ENSE00001852362 +GGGGCTGTGGAACAAGGACGCCCCTGGGCTCCTGGGGAGCGCCTCCTGTGTGCCAGGCTGCACCTGTCCTGACCCCCATCCTGAGCACACACCGAGCCCCGGGGTGGGCCCGTCGGCACTTGGGGCACCGCTTCCTCTACCTGCAACCTTCAGATGCCCTCATGCCCCTGTGGGATGGGTGCTTTTACTATGCCCATTTCAGCGATGAGGAAACAGACACATAGGAAATGCCCAGAGTCAAGAGGCTGCATCAGAACCGGGCCTCAAGCCGGAGACAGCGCTCGGGAGCACCGCCGGGTTCCAGACCCACTCTGAGCGCCACCCACGGAAAAGTGTTTCTTTGAAAAACATCATTCTCGGAGCTCCGGAAAAACATCCCCTCGGAGCTCCCGCTGTCAGATCCGGGTCTCCAGGGCTCATATTCAGTAACAGAAGCCGCACCTTCACGGCCCACTGCGCAATTCAGACCCTAGTCAACCTCCAGCCAACAGGCTGAGGGGCACACTGGCTGGAAGCATGGAAGGGAAAAAAAGTTTTTTTTTTTAAACATAAGGAACATCCGAAGTTTATCTGGACAACGAGGAATCTTGCATTAAAAAAGGAAAACAAATGACATCACATGTGCTACTTACATTTACTCTCTGAGCTCGGGAGAGGGCCGGCCCCGGCCCGGGGCGGCGGGAAGGAGAGGCAGCCCAGTCCCAGCTGTGGGCTCTTCTCGGCCTCCTTATACACCAC +>ENSE00001924010 +AAACATAAGGAACATCCGAAGTTTATCTGGACAACGAGGAATCTTGCATTAAAAAAGGAAAACAAATGACATCACATGTGCTACTTACATTTACTCTCTGAGCTCGGGAGAGGGCCGGCCCCGGCCCGGGGCGGCGGGAAGGAGAGGCAGCCCAGTCCCAGCTGTGGGCTCTTCTCGGCCTCCTTATACACCAC +>ENSE00001659258 +ATTTACTCTCTGAGCTCGGGAGAGGGCCGGCCCCGGCCCGGGGCGGCGGGAAGGAGAGGCAGCCCAGTCCCAGCTGTGGGCTCTTCTCGGCCTCCTTATACACCAC +>ENSE00001813324 +CAAGAAAGCAAAGTGAAGGAGCAGTTTCCCACCGCCCTCCCCAACAGCCTGCTCAGGCAGAAACACGTGTTCCAGACTTACTATCTTGGGATCATTAATGGCTGCAGGATGCCCAAACTCCGTGATCATTTTCCAAGTCACGTGATTAAGGATGCGCAC +>ENSE00003685083 +TATCTTGGGATCATTAATGGCTGCAGGATGCCCAAACTCCGTGATCATTTTCCAAGTCACGTGATTAAGGATGCGCAC +>ENSE00003653006 +TATCTTGGGATCATTAATGGCTGCAGGATGCCCAAACTCCGTGATCATTTTCCAAGTCACGTGATTAAGGATGCGCAC +>ENSE00001866903 +TGGCTGCAGGATGCCCAAACTCCGTGATCATTTTCCAAGTCACGTGATTAAGGATGCGCAC +>ENSE00003492457 +CTTTCCATCATAGCTCCCAACTGCCAGGAACTGACTGCTGGGGCTCCAGGCCACAGACTTGATGCCCAGGGACCACTCGTAAGCGCTGTACGTGGACAACAACCGGCCATCCAATGAGTACAGCAGAATCTTGTA +>ENSE00001896684 +CTTTCCATCATAGCTCCCAACTGCCAGGAACTGACTGCTGGGGCTCCAGGCCACAGACTTGATGCCCAGGGACCACTCGTAAGCGCTGTACGTGGACAACAACCGGCCATCCAATGAGTACAGCAGAATCTTGTACTGCAGATGAGACATTTCAGTTAATAATGAATACACCCCCGTCGCCAGGAACACACCACAGACGCGGGTGCTGCAGAGTGACATTGGTGCAGATAGCACAAAGCTGGCAGGACTGTCCGCGTGGCCGTGGAAAAGCTGG +>ENSE00003669982 +CTTTCCATCATAGCTCCCAACTGCCAGGAACTGACTGCTGGGGCTCCAGGCCACAGACTTGATGCCCAGGGACCACTCGTAAGCGCTGTACGTGGACAACAACCGGCCATCCAATGAGTACAGCAGAATCTTGTA +>ENSE00001839399 +CTTTCCATCATAGCTCCCAACTGCCAGGAACTGACTGCTGGGGCTCCAGGCCACAGACTTGATGCCCAGGGACCACTCGTAAGCGCTGTACGTGGACAACAACCGGCCATCCAATGAGTACAGCAGAATCTTGTACTGCAGATGAGACATTTCAGTTAATAATGAATACACCCCCGTCGCCAGGAACACACCACAGACGCGGGTGCTGCAGAGTGACATTGGTGCAGATAGCACAAAGCTGGCAGGACTGTCCGCGTGGCCGTGGAAAAGCTGGAACTGCCAGCTAGTACT +>ENSE00003387437 +AATGAGTACAGCAGAATCTTGTA +>ENSE00003480267 +CTCCAAGCAGGTGTCCCACACTGCCAGCACACAGCCGTTTGGGGCCCACTCAATCCCTGTGAGATCCTGGGTGTCCGTATCAAAATG +>ENSE00003485438 +CTCCAAGCAGGTGTCCCACACTGCCAGCACACAGCCGTTTGGGGCCCACTCAATCCCTGTGAGATCCTGGGTGTCCGTATCAAAATG +>ENSE00001857368 +CCGCAGGAGCTGCCAATCACTGCAGACGAAGATGCTCACGTAATCTTTGCAGTCGCGCCGTTC +>ENSE00000734306 +CCGCAGGAGCTGCCAATCACTGCAGACGAAGATGCTCACGTAATCTTTGCAGTCGCGCCGTTCTGCCAGCGCCATGTAGCGGCCGTCCCTGGTGAAGGTGATTC +>ENSE00000734303 +CCTGCAGACAAGCTTTCGGGTATTTGATGTAAGACACGGATTTTGTGCACAAGGACCAGACGGTTATCCGCAG +>ENSE00001854631 +CCTGCAGACAAGCTTTCGGGTATTTGATGTAAGACACGGATTTTGTGCACAAGGACCAGACGGTTATCCGCAGCTGTTGGGGGAAAGGGGAAAGAGAAAGGAAACACTTCTTTAGCATCATCAGAGACCGTCTCAATCCTCAACCCGCCCACGCGTCCCCAAGCACAGGCCTGACTGCTGGAGTGGATCTATCAGGACCTGGGGGATGCCTGCCCTCCTACCGGAATATTCAAATGCGTATTTTACTGTGGTTACGGTAAATTTGGTGTTCTTGGTTTTCTGTTGTTGTTGTTTTATACCAAAATTGAGTGACACAAAGTTAAATCCAAGTGCTTTTTCATTAGCTTTTTCAAAGTGACCATAGGTTGCATGTTATAATAACCCTGAGTTACTCAGAGAAAAATCTTGATCTAGAAACCACCACGGGTTCAGTCTCCTTTATGGGAAGACAGAGGATCTGGAGATTGGATGCAGCCACTCCGGGACTCACCAGGGGGCTGTGAGCCTGCATCTGCAGCCCTGAGGCAGGAGCAGCCACTCAACACCCAAGAAGGTGTCCGTCTGCCTCCTGCGTGTGCTCGCTGGCCTGGCTGCATCTGCAGAGGGTTCTAGAACATGCGCTGCTGGACTGTCCACTTTTCCACCCCTTTCCCTGACTCAGGGAGCTGAGAGCTGACTAGGCTGGCACAGTGAGGCCAAAAGATGATTTTCTAACCAGGCCGACGAGGGCGTGCCTGCTGAGGGAGAGGCACCGCAGTGGGTGGTCCAGCCCTCCCCGTGGCAGCGCCGCGGGACTTCCAGGGCTGCTGTGTCCCTCCACCTGCATTTCCCACTGAGACCCCGTGGAGCCTACCAGGGAATCATCTTGCTTCCCAC +>ENSE00000734299 +ATGGAATTCCGTGGTGTTGAGAATGTGGCGCCCGTCCGGGCTCCAGCACGAGGCCACCAGCCCGGCTGAGCCCTCGTCTATTTTGCAGTGCCATTCGGGCTGCTCTAAAGACCAGAC +>ENSE00001931622 +TTTAAATGTTCTTAAACTTTAGAGAACGTTATAATTTCAAAAGAAAACTGGCTTTGAGCTGCACGGACTTTTTTTTCAAACTAGAAAGGCACAGAACAAAACCCCTCCTTCCCAGGGGCCCTCAGAAGGTGTCCAGATTCTAAGCGACACGGCAGCACACACCTGCACCAGCCCTCGCTTGTACATGGCGCACAGGATGAAGAGCGAGTCTGCCGACCACTCGATGTGCTGGATCTGGTCTAGGCACGTGTACAGCTGAAGGATCTGAAGGGTGTTCACATCCCGGACCACTAACCGGTACTGGACACAGGAAGC +>ENSE00003566716 +CTGCACCAGCCCTCGCTTGTACATGGCGCACAGGATGAAGAGCGAGTCTGCCGACCACTCGATGTGCTGGATCTGGTCTAGGCACGTGTACAGCTGAAGGATCTGAAGGGTGTTCACATCCCGGACCACTAACCGGTACTGGACACAGGAAGC +>ENSE00003677298 +CTGCACCAGCCCTCGCTTGTACATGGCGCACAGGATGAAGAGCGAGTCTGCCGACCACTCGATGTGCTGGATCTGGTCTAGGCACGTGTACAGCTGAAGGATCTGAAGGGTGTTCACATCCCGGACCACTAACCGGTACTGGACACAGGAAGC +>ENSE00001870155 +CAGGTACTTGCCGTCCGGGGAGAACTTGCAGAGTAAGCTGGAGAGCTTGAATACCTCGGAGAAGTTCATGGCCGCCGCCTGCCGCGGGCGCCACCCTGCGCCCGAAAACCCGCGGGACCCCTGGGCGC +>ENSE00001477063 +CAGGTACTTGCCGTCCGGGGAGAACTTGCAGAGTAAGCTGGAGAGCTTGAATACCTCGGAGAAGTTCATGGCCGCCGCCTGCCGCGGGCGCCACCCTGCGCCCGAAAACCCGCGGGACCCCTGGGCGCGCAGC +>ENSE00001680820 +CAGGTACTTGCCGTCCGGGGAGAACTTGCAGAGTAAGCTGGAGAGCTTGAATACCTCGGAGAAGTTCATGGCCGCCGCCTGCCGCGGGCGCCACCC +>ENSE00001748742 +CAGGTACTTGCCGTCCGGGGAGAACTTGCAGAGTAAGCTGGAGAGCTTGAATACCTCGGAGAAGTTCATGGCCGCCGCCTGCCGCGGGCGCCACCCTGCGCCCGAAAACCCGCGGGACCCCTGGGCGCGCAGCAGGCTGCAAC +>ENSE00001836154 +CAGGTACTTGCCGTCCGGGGAGAACTTGCAGAGTAAGCTGGAGAGCTTGAATACCTCGGAGAAGTTCATGGCCGCCGCCTGCCGCGGGCGCCACCCTGCGCCCGAAAACCCGCGGGACCCCTGGGCGCGCA +>ENSE00001858739 +CTGGGCTCGCAGCTCCGAAGCTGGGAGGTGAGGGGAGAGCGATCGGGGA +>ENSE00001475277 +TTTTTTTTTTTTTTTTTTTTTTGAGACGGAGTCTCGCTCTGTCGCCCAGCCTGGAGTGCAGTGGCGTGATCTCGGCTCACTGCAAGCTCCACCTCCCAGGTTCATGCCATTCTCCTGCCTCAGCCTCCCGAGTAGCTGGGACCACAGGTGCCCGCCCCCACGCCCGGCTAATTTTTTGTATTTATAGTAGAGATGGGGTTTCACCGTGTTAGCCAAGATGGTCTCGATCTCCTGACCTCGTGATCTGCCCGCCTCGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACCGCGCCCGGCCCATCTTAACCATATTTAAGCATCATGCACATTCACATTGCGGTGTAGCCATCAGCAGCATCCATCTCCAGAGCTCTTTTCCTCTTGCAAAACTGAATCTCTGTACCCATGAAGCACCAACTCCCCATTCTTCCCACCCCCCAGCCCCTGCCAACCACCATTCTTAGATGTGATATCTTTGTTAGAGCAGATTAACTTGCTCTCAGGTGTATGGTCTGCGGCCATTGACTCAAGCACAGGGAATGAGAACTTCTGGAAGTGGGCCTGGACATCTGAATTGCACAGGCTTCCCAGATAGGTACGAAGGAACAAGAAACAAAACAAACATTACCGCAAATGAAACACTGTGTAAATATGTGGATTACATCCTGTAAGTACGAAGAGAATGGAAGGCATTTATCTTGTTATTGTCACTGGGGCAGATCCGGAGTCAGCTCTGGGCGGAGATGGATTTACCCTGGAGCTGCTGAAGCTTAAGCTGGGGGCTGCTCAGGAGCCTGGATGTAGAGTAGGAAGCAGTTCTGAGCATGGAGGGGAAGCCAGGTGTGCCAGCCAGAAGCATC +>ENSE00001475269 +CACAGGCTTCCCAGATAGGTACGAAGGAACAAGAAACAAAACAAACATTACCGCAAATGAAACACTGTGTAAATATGTGGATTACATCCTGTAAGTACGAAGAGAATGGAAGGCATTTATCTTGTTATTGTCACTGGGGCAGATCCGGAGTCAGCTCTGGGCGGAGATGGATTTACCCTGGAGCTGCTGAAGCTTAAGCTGGGGGCTGCTCAGGAGCCTGGATGTAGAGTAGGAAGCAGTTCTGAGCATGGAGGGGAAGCCAGGTGTGCCAGCCAGAAGCATC +>ENSE00001890428 +CCGCAAATGAAACACTGTGTAAATATGTGGATTACATCCTGTAAGTACGAAGAGAATGGAAGGCATTTATCTTGTTATTGTCACTGGGGCAGATCCGGAGTCAGCTCTGGGCGGAGATGGATTTACCCTGGAGCTGCTGAAGCTTAAGCTGGGGGCTGCTCAGGAGCCTGGATGTAGAGTAGGAAGCAGTTCTGAGCATGGAGGGGAAGCCAGGTGTGCCAGCCAGAAGCATC +>ENSE00001475263 +TTTTATTGCAGTTCACTTTATTGCACGTCAAGATATTGCCTTTTTTTTTTTTTAAACAAATTGAAGGTTCGGGGTAACTCCAGAGTCAAGCAAGTCTATTGGCAACATTTTCCCACGAGCATGTGCCCACTTTGTATCTGTGTGTCACACTTTCGCAATTCTTGCAATATTTCAAACTTCTTCCTTATTATATCTGTTGTGAAGCTGGTTCTCCCAGACGTTCCCTGCAGGCTGTTTATGCAGCGCCCATCCGAGATGAACCCACAGGACACTCAGGATCCCAGACTGCAGGAGTCGTCTGGGATCACAGGCGGGGCAGAGCAATTTGTCAATGTTTATGAGGAGTCCTCCTTGGCAGCCCAGTCTTTATCCTCACTCACGTGGAAATGAGATTCGACCTCTCCTAATCACCTGGTGCCCGAGGAGCAGGTAGGCGCCTGTCCCAAGCCTGAGTTTCCTGGGAAATCTACATTTCAGCACAGATGGGTTCCCAGCAGCTTAGTGCTCTGGCTGTCCTTAGGTCACTGAATCATTTCACCCGCTAGTTTTTTGTTTGTTTGTTTTTGAGATGGAGTCTTGCTCTGTCACCCAGGCTGGAGTGCAGTGGCGCGATCTCGGCTCACTGCAACCTCCACCTCCTGGGTTCAACTGATTATCCCTCCTCAGCCTCCCAAGTAGCTGGGGTTACAGGCACCCGCCGTCATGCCCAGCTAATTTCCATATTTTTGTAGAGACGGGGTTTCACCATGTTGGTCAGGCTGGTCTTGAACTCCTGACCTCAGGTGATCCGCCCACCTTGGTCTCCCGAAGTGCTGGCATTACAGACGTGAGCCACTGCGCCCGGCCTTGCCCACTGGTTTTATGAGAAAGAGACATGGGAGCCTTTTCCCCAGCTGGGGCAATCATCAGACAGTCACATGGAGTCACAGAACCATCTTGCAACAGCATCCCAAGACCTGGCCATTGGGCAGGATGTGGGACTTGTGAAAGGTCATAAATGACCCTTTGAATCAGTCTCCCTCTGCACAGGAAAAGCCCACCGCCCTGCGTTCACCTTTGCCCATCAGATAGGGCTTGGGGGGCACCTGAGGAGGAGGTGCCTGCCACTGCCTGTGGAGGAGGATGTTGGCGTTCCTATTTCACAAGCCCGGCTTGGAGAGCCAGCGGAGACCTTCTGCGCAGCTAGCTCTTGCACACACCCCTGCGGAGAAACTCTGCCTTCTTGCCTGGGGCCCAGAACCTTACCCACCCAGGCTTGCCCCCTCCCTTCCAGGGCCCACTGACCTCCTGACTCAGGCTCCCCCGAGTGCCTGACCCTGTGAGTCACTGGCCCATCTACAATCCTTCTCCCCGTGACTGCTTGAGTTGTAGCTTGATTGGAGCCAGGTCAATGCAAGTCACAGAACTGCGAACTGAGATGGACTCTCAGAAGCAAGAGGTGGCAAGCATGGCGGAGAGGAAGCGAGGGTCCTCCTGGCTGGTTAGATCTTACAGAGTTTAAGCTGTACTGAGAGTTTTTATGAGGACAAGGGGCCAGTCCTGTGCCTGCCTGATGTGGAGTCCTAGGCGGGCTTGGGCCGCAGGTTACCTGCTCCCGGAGGCTCACAAAGGCAGTGCCAACAGGCGCTCATTCTCAGCAATGGGTGAAAGTAAGAGGAACCTGCCCTCCCTCCTCTCCACACCTCCCCAGTATTTGTCCTCATGGAGTAAATATCCAACAGTGATCCCAGGGCATGGGAGTGGGAGTTAAGGCAAATGCCAGACTGTCCAAGGCTCATTACAGGGTAGTCCTCTCATCCTCTGCTCACTAGTCCACTATATTCAGTGAGCACCCACTGTGCACCCTGTGCCTTGGGGACGTGGAGGCACGCTCAGCCCCAGCCTCGCCCTCCGGGAGCTTACAGTCTAACCCTCTGGGCACAGGGAGGTGGGAAGATGGCACGGCCTTGCTGGGAGCCTCACCCTGTTGGCTGAACAATGATTTTTTCAATAATGCCTACAGCTTCCTTCATATCCTGCCACCCAAACCAGTGCCAAGGTCATCATGGGCTTGTGTGGCACAGTCAGATTTAGTGACCATCCCCACTCCCACATTGGTTCTGTCTTCTTGCCCCCGGTGCTCTGGTCCCTAGCACAGGCTGCTGATTTGGGGACTCGGGGGAGAATCCTCCACCTTCTGCAAATGCTTAGCCATGAAATGACGGGTGTTTGCCTGACTATGATTTCATGAATCCCCCATGAAATGATGGGTGTTTGCCTGATTATGGGCCAACAGTGCCCCCCACTCCTCGTGGGCACTCCTGGGATCAGCAGCCCCTTCCTAGCCTTCACAGGGACTCTAGGCCTCCATGGAAAAGAAAGAAATAAAAAATTTTTTTTGAGACAGAGTCTTGCTGTGTCACCCAGGCTGGAGAGCAATGGCTCAATCTTGGCTCACTGCAACTTCAGCCTCCGAGGTTCAAGTGATTCTCTTGCCTCAGCCTCCCGAGTAGCTGGCACATGCCACCACACCCGGCTAATTTTTGTATTTTTAGTAGAGACGGGGTTTCACCATATTGGCTAAGCTGGTCTCGAACTCCTGACCTCAGGTGATCCACCCGCCTTGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACCGCGCCCGCCCAGAAAGAAAAATCTTAACAAGTTGCTTCCAGTAACCAGTCTCAATGAGTAGCAGGGAGTAGTTTGCAAGAAAAAAAAACAAGTGAAGATGTTTCCCATTCTTTAACCTGCTCCATCCCTCAAATTCCTGCTGCTCCATGGCAGGGGCCCTGCTCACCCCACATTGGCACAGACTCTGCTGGAGTCAGATCCTCCAAAGCCACAAGCTTCCTTGAGGCCACGGGGCCGCCTCATTCTTGTTCTGCCCCTTCCTCACACTGAAAGACTGCATAGCCTGGGGTGCAATGCCCAGGTGTGAAATTGATGCTCGGGAAAACAAATCCTTCCCAAAGTCACTTAAGGAATCCCCCAGCCCCACCGCACAGACCCCTGGATGTATACTGCCCCTATAATTCTGCTCTAGGCAGAAAAGCCTAGGAGTGGAGGTGACAGCTCCCAGCATATGCACCCTTTTGCTCTGCTCTGCTGCCCTGTAGAGCCCTGGAAGTGACCAGAGCCCTTAGGCTACTGCTGCTGCATGCCCAGAGGGTCCCAAGCAGAGCTGGGCAGGAGGTAGGCCCAGGCAGGGCTGGGAGAGCAGTGACCAGGCAGGGTGCACGGCTGCACTTTGCCCAGGTCCTGGCTCTGGCTCTGGTCTGGTGCCAGTGCTGGGGTGGGTGTGTCGGCTGCCCACGCAGCTGCGGGGTCCAGTTCCAGAACTATCTCCACCAGCTGGGATGGGGGGCTTCTTCTTCACCCTGCTGCCTCTTGTCCTTTCTTCTCCAGCCAAGTTGGGGGTGAAGCAGGGACGCTCCTTTTATTCCCTGAGCCGAGCCCCAGCCCCAGGGCTTTCAGTCTGCCACGCCAGTCACAAACAGCCGGCTTCCGGCCTGGGTGTGGGTACTGGGCTGGCCCCTAATGATGGGAACAGCAGCCGCCACCAAGAGCTTCAACCTGTCCAGTGCCCCAAGGTCCCAAGCAGTCGGCAGGGTCTGTGGATCGGCCGAGGGGCTACCACGGCCGCCAGAGGCCAGGGCCGCAGGGAGGCGAGGGCGGCGAGGGCACCGGAGCGGATGCGGGCTCTGGGGCAGACGCGGGCGCTGGGGCGGGGGCAGACGGGCCACTGGAATCCCCAGCGCGCCCGCCGTCCAGGGTGGCGCTGGCCGCTCTCCGCCACAGGTGCTCCAGCAGGCGCGCGCTCACGGCGGGCTCCAGGACACGGCAGGCGGGCAGCACGCGGGCCAGGCGCGCCACACAGGCGCTGTAGCCCTCGCGGTAGCTGTCGCAAGGCA +>ENSE00001948071 +CTCCTGACTCAGGCTCCCCCGAGTGCCTGACCCTGTGAGTCACTGGCCCATCTACAATCCTTCTCCCCGTGACTGCTTGAGTTGTAGCTTGATTGGAGCCAGGTCAATGCAAGTCA +>ENSE00001854189 +CCAAGCAGAGCTGGGCAGGAGGTAGGCCCAGGCAGGGCTGGGAGAGCAGTGACCAGGCAGGGTGCACGGCTGCACTTTGCCCAGGTCCTGGCTCTGGCTCTGGTCTGGTGCCAGTGCTGGGGTGGGTGTGTCGGCTGCCCACGCAGCTGCGGGGTCCAGTTCCAGAACTATCTCCACCAGCTGGGATGGGGGGCTTCTTCTTCACCCTGCTGCCTCTTGTCCTTTCTTCTCCAGCCAAGTTGGGGGTGAAGCAGGGACGCTCCTTTTATTCCCTGAGCCGAGCCCCAGCCCCAGGGCTTTCAGTCTGCCACGCCAGTCACAAACAGCCGGCTTCCGGCCTGGGTGTGGGTACTGGGCTGGCCCCTAATGATGGGAACAGCAGCCGCCACCAAGAGCTTCAACCTGTCCAGTGCCCCAAGGTCCCAAGCAGTCGGCAGGGTCTGTGGATCGGCCGAGGGGCTACCACGGCCGCCAGAGGCCAGGGCCGCAGGGAGGCGAGGGCGGCGAGGGCACCGGAGCGGATGCGGGCTCTGGGGCAGACGCGGGCGCTGGGGCGGGGGCAGACGGGCCACTGGAATCCCCAGCGCGCCCGCCGTCCAGGGTGGCGCTGGCCGCTCTCCGCCACAGGTGCTCCAGCAGGCGCGCGCTCACGGCGGGCTCCAGGACACGGCAGGCGGGCAGCACGCGGGCCAGGCGCGCCACACAGGCGCTGTAGCCCTCGCGGTAGCTGTCGCAAGGCA +>ENSE00001914446 +AGGGTCTGTGGATCGGCCGAGGGGCTACCACGGCCGCCAGAGGCCAGGGCCGCAGGGAGGCGAGGGCGGCGAGGGCACCGGAGCGGATGCGGGCTCTGGGGCAGACGCGGGCGCTGGGGCGGGGGCAGACGGGCCACTGGAATCCCCAGCGCGCCCGCCGTCCAGGGTGGCGCTGGCCGCTCTCCGCCACAGGTGCTCCAGCAGGCGCGCGCTCACGGCGGGCTCCAGGACACGGCAGGCGGGCAGCACGCGGGCCAGGCGCGCCACACAGGCGCTGTAGCCCTCGCGGTAGCTGTCGCAAGGCACTGCGGGCGGAGAGCCGCGTGAGGCGCGGGGTAGGGTGCCGGGTGCGGGGTGCAGAGCGCGCGGCAGGGCAGGGAGGGCTCACTCACGGGGCGCTGCCGTGGGCCATGAGGACGCAGGCAGCTCCTGCAGGAAGCGCACGGTCATTTCCAGGACGTCTGCCTTCTCTAGCTTCGAGCAGTTGGAGTT +>ENSE00000734533 +GGGGCGCTGCCGTGGGCCATGAGGACGCAGGCAGCTCCTGCAGGAAGCGCACGGTCATTTCCAGGACGTCTGCCTTCTCTAGCTTCGAGCAGTTGGAGTT +>ENSE00002817476 +CTCCCGGCCCAGCAGCGGCAGGATGAGCCCCTTAAGCTGGCTCAGGCTCTGGTTGATGCGCGCGCGCCGGCGCTTCTCCAGCAGCGGCTTCAGGCT +>ENSE00001916716 +CTTGCGCAGCTCCGCCGCGTCCCCTGCCCGGCGAGGCAGCCCCATGCTCCGCGGGGAAGCGGTGGCAGCTGCGAGCCCCACGCAAAGGGAAACCGAGGTCCGAAATGAGGTCCCGGGCGCGGCCCGGGCTGG +>ENSE00001475267 +CTTGCGCAGCTCCGCCGCGTCCCCTGCCCGGCGAGGCAGCCCCATGCTCCGCGGGGAAGCGGTGGCAGCTGCGAGCCCCACGCAAAGGGAAACCGAGGTCCGAAATGAGGTCCCGGGCGCGGCCCGGGCTGGTGCCAGACGAGT +>ENSE00001475271 +CTTGCGCAGCTCCGCCGCGTCCCCTGCCCGGCGAGGCAGCCCCATGCTCCGCGGGGAAGCGGTGGCAGCTGCGAGCCCCACGCAAAGGGAAACCGAGGTCCGAAATGAGGTCCCGGGCGCGGCCCGGG +>ENSE00001835288 +CTTGCGCAGCTCCGCCGCGTCCCCTGCCCGGCGAGGCAGCCCCATGCTCCGCGGGGAAGCGGTGGCAGCTGCGAGCCCCACGCAAAGGGAAACCGAGGTCCGAAATGAGGTCCCGGGCGCGGCCCGGGCTGGTGCCAGACGA +>ENSE00001475281 +CTTGCGCAGCTCCGCCGCGTCCCCTGCCCGGCGAGGCAGCCCCATGCTCCGCGGGGAAGCGGTGGCAG +>ENSE00001150483 +CTCTGGAATTGCGTCGCCGGCGCCTGGAACCGCAGTTAGCGGGCACTGGGCAGATGAATGAATTTGTCTGTGCCTGGACGGCTCTCCAATTCGAACCCAGTTTTGCTGCCCTCTGGGGTCTCAACTGTTACGTGAGGCAAATTAGGAGAGAAGCCCCTGGGCACCTTGCCCCAGTCGCACGAGTGTCCCCGCG +>ENSE00003790229 +TTACATTTTTAATAGACTTTTATTTTGGAATAATTGTAGATTTACAGAAAAGCTGCAAAGAATAGTACAGAGAGTTCCCTCAAATTCTTCGCCCAGTTTCCTCTAACATTTGCATCTTACACAGCCATGGCACATTTGTCAAAACTAAGAAATTAACACTGGTATTACTTTTAACTAAAGGCTTTTTTGGATTTTACCAGTTTTTTCACTCATGCCTTGTTTTGTTCCAAAATCCAACCCAGGATATCACACTGCATTTAATCAAATGTAAATACGTATGCTTTAACTTTTTTATTTTAAAATAATCATAGATTTACAGGAAATTGCAACAACAACAAAAAAAGTACAGAGATTCTGTGTACCCTTCCCCCAGTTTCGTTCAGTGGTAACTCCTTGTATAACTACACAATATCAAAACCATGAAATAGATATTGGCACAATCCATAGACAGTATTAAATATACATGCATATATATATATTTTTAAGTGAAAAATATTTTTAAACCTCGCTTTGCCTCACAGCCAAGAAGATCAAATACTTTCTCCAAAAACATAGAATTTGTATCTAACTCCACTCGCTCCAAACTCAAGTCCAACCATGAAATTATTGATCCCTCTCTCTAACCCTCCAACTACAGGCAAGAAGCTGCCCATACATTCCCCAAAGCAGGAGTGCACTCTGCCACAGGCCTAGATGCCGTCAACCTCCTGGACCTTGAACTCCCTAAATTAATGGCCTCTGTGTGAGTATGTGTAAGCAGCCCCTCTCTGTCCCAGTCCATCCTAAAATCACTCCCTTGGAGCCACCACTGCCCCTCTCATCTTCTAGAATTTCTAGAAAGATAAAGAGCTAGATAAGCATCTAGGTACCTTTCTTCTGCTGTTAGCTCTAAAGACAAGTGAATATATCCTAGCTAGGATGTACTCTAAGGAATGCAGAAGTAGGCCGAGTGCAGTGGCTCATTCCTGTAATCCCAGTGCTTTGGGAGGCCGAGGTGGGCGGATCACCTGAGGTCAGGAGTTTGAGTCCAGCCTGGTCAACATGGCAAAGCCCCGTCTCTACTAAAAATACAAAAATTAGCTGGGCGTGGTGGCGGGTGCCTGTAATCCCAGCTACTCGGGAGGCTGAGGCAGGAGAATCACTTGAACCCCCAAGGCAGAGGTTGCAGTGAGCTGAGATGGTACCACTGCCCATTTCAAAAAAAAAAAAAAAAGAATGCAGAAGTAAATTAAATGACCACAAAGAGTTTTTTTTAATTTGAGACAGGGTCTGGCTCTGTCACCTAGGCTGGAATACAGTGGCGCAATCTCAGCTCACTTCAATCTGTGCCTCCTGGGCTCAAGCCATCCCCTGACCTCAGCCTCCTGAGTAGCTGGGACTACAGTCCTGCCACTATGCCTGGCTAATTTTTGTATTTTTTGTAGAGATGTTGCCCAGGCTGGTCTGAAACTCCTGAGCTCAAGGGATCCATCCACCTGGGCCTCCCCAAGTGCTGGGATTACAGGCATGCGCCACCGTGCCCAACCCAGACATCACTTTTATCTGAAGCAACAACTATCTGCTCTTTCTGTTTCCTTACTAATTATCCAGGAACTTTTACAGGTGAACTCTGAGGAGGACAATTTTTATTGTTTTTATGTCAGCATAACTAAAAGTAAAGCTGGATAGGAAGAGGTTACTTGAAAATGATTTCACCTGAACTCAAATGAATAAGCTGGCTACTGCATAAAGCAACAGAGGGGTCCCTTTAATTTAAAAGCTCAGGACTCTGAATCAATTGCTGGTTGGGAGAAGGTAGAGACATTCTTTACTTCTGCCTAGAACTGGGGAAAATGGCGTAGACTTCTGCTCTGAAGCAGTCCTCAGTGCTGCTTCGGTCAGAACTCCCGAGAGGCATCTGAGTGCTGGCCTGTCACTGCGGCTGGCATTCCAGGCATTTCATTGGCCCCACTTCAGCCCACGCCTGGCTCCACGGGGCTGGGCAGCTGAGGGGAGTTTGTGGCAGAGTGGGCATGGGGCACGGCCCGTGCAATGTGCGTTACAAAGGGGCTCTCTCTGAAGCAAGTCCTCTGCACTCCAGTCTATTTGAGGAAGAAAAGGACAATTCCCATAGGGAGGGGGTTTGCTGAAGCAACCAGCTGCCTGGTTTCCTCTCCAGCATTGAGAGGGAGGGAGGGCTGGCTTAACTGGGGGACGGCCTTCTCATCTGGACTGTGTCAAGGCCAAGGTTAGGCTCCAAATTCCAGAAAACCTCTCTGCAGGGTCTTCTTTCAGAGTGGTGAGAATGGAAGCAGGCTCCCTTCCCCTCCAGCACTAGGAAGCCCCGCAATTGGTGAGGTGCAAAGAAAGATGGGCCCAGGCAGGGAGGCGGGAGCAGGGGAGGTGCCCAGGGCAGTGGCTGGAAGGGCAACGGGAGAAGCAGCAGAGGCTGGGGGTGGGGGTCGCAGCAGGTGCTGTCCCTGGCCTGTGTGAAAGGTACTAGAAGGCCCCATCCTTGGTGCCACATGGACCCCAGAGGCTTGTCTTAGTCCATGGGGTCCGAGGTGTAAGACACTTACGTTTGGCGTCACCTCTTAGGCTTGGATGAATTTCAGAAAGTGCTAGACTGGAGAACAGTGGAAAAAATCAGTGGAACAAGATCTGGAGCACTCACTGCTCAATGTCAATGTTAGAGAGCACAACGACACCAATGGGAGGAGGGTGAGGACCAGAGGCTGATTGCATGAGCTCTGTTGGAGTGCAGGACCCACTAACGGGTTATCTCAGGGTTCCTGGAGGCCACGGCTGTGCCTTGTGGTCCAAGACCTGGGGAAGCCACCACTGTGTCTTCCCTCTCCATCCTCCGGTGACTTTGGTCCAATTCCTGTTGCCATGGCAATCAGCCCAGCTGGCCTCACAGTTCACTGGCCTCAAAGTTGGCATCTGTAGGTGAAGCCAGTGGGACCCAGAGAACTTAATTCTTCTCAACTGAGCTGGCTTGGAGGAACTTTTCTCATCAGCCACTGGAGCAGAGAACGTCACCAGCGTCTCACTGACGTCAACATCCTGGGCCTGGCTCTAGCTGAAAAGGAAAATTCTCCCCAAGGCAGACACATCTCCCGAAGCCCACACAGGCACTTTCTATGATTGCACTGGAAATCTGTCTCCTGGGGACAGGGAGCGCGTACGCTCACAGTCAAGTCACAATGTTGAGCAGTCTCCAGGACTCCACGTTCATCTCTAAGAACAGGAGCCGGTGGTTGGGCGCAGATTCTTGAGCCAGATTGCTCGCGTTCAAAACCTGGTCCCTTTTTATTAATTGCATGCTTAGTTACATTTTCTGTTTGTACTTTTGTTTCCTTCTCTGCAAGACGGGGTTAATCACAGACACTTGTACATGATGTAATACACTTACAATACTTAGGACAGGCCTTCCTGCATAGTAAGTGCTCTGCAAACACTGGCTACTATTCTCCCTACGTGCAAACTTCTCCCAGCCAAAAGCCGCCCACACCAAGCCCCTGTGCCTTTTTCCTTCCGCACCCACGAGCAGGCTGCTCCTGGGGCCCTGGAGCTCACTTTCCCAGCCGCCCTCACCACCCACCGTGGCGCAGAAGAGCTTCCGAAGTCCTGGCGTCTCCCACTGGTCTGGGCATCTCTCGCTTCATCTTCCCTCTTGGGCCCCACAACGTGCAGCACTTCTAGGGCAGTATACTTGCTGATTGCTTCCTTACTATTGCTCACAACAACCAGCTAAGACACTGCCAAAGAAACACTCACAGCTGGCCGGTCCACGGCATCCGGAGGGGACTCGGGGGACAGGCCTGTCCTGCCTCTCCCCAGCAC +>ENSE00001500136 +GGGCCCCACAACGTGCAGCACTTCTAGGGCAGTATACTTGCTGATTGCTTCCTTACTATTGCTCACAACAACCAGCTAAGACACTGCCAAAGAAACACTCACAGCTGGCC +>ENSE00003787977 +CTGGGTGCATGCTGGGACGGGGCGAGCAGGTAGTGCAGGCTTCCAGGCCTCTCCTGCCCCGGAGCTTGGCTGCAGGACTCCCGCAAAATCTCCAAATGCCCCCGATCTGCGTGGTCACCGAGAAGCAGCCCGGCTCGGAACAAGCCCAGGCAAGCCCAGGCAGAGCCCGCCGCCGGGTCCTCCTTCCTGCTCGTGCCACCAGGCCCCGGGGCCGCGACGCGTCTCTCCAGCCCGGGATCCGGGGAGCTGGGCTGTCCCCAGACCGACGGGACAGCGGCATCTCCTCCACCTGAAAAGGAAAGAGGACCAGGTGGGGGCCAGGCAGGGCGCATGAAGGCGGCGCCAGCACCGCGCGATCCGAATCACGTCGGTGCGGGGGAGGGGTC +>ENSE00001658885 +CTGGGTGCATGCTGGGACGGGGCGAGCAGGTAGTGCAGGCTTCCAGGCCTCTCCTGCCCCGGAGCTTGGCTGCAGGACTCCCGCAAAATCTCCAAATGCCCCCGATCTGCGTGGTCACCGAGAAGCAGCCCGGCTCGGAACAAGCCCAGGCAAGCCCAGGCAGAGCCCGCCGCCGGGTCCTCCTTCCTGCTCGTGCCACCAGGCCCCGGGGCCGCGACGCGTCTCTCCAGCCCGGGATCCGGGGAGCTGGGCTGTCCCCAGACCGACGGGACAGCGGCATCTCCTCCAC +>ENSE00001670416 +AGTTTGCAGGACTCCGAACTGGGCCCGCGAGATCTCCACCTGCGCAAAACGAAAGGGCGGATTCTCCTTGGACTCACGAGGCAACCGCTCCCCGGGGTGAGAACGGGGGACTCATTCCTC diff --git a/pygtftk/data/mini_real_10M/expected_sequence_minus_no_rv.fa b/pygtftk/data/mini_real_10M/expected_sequence_minus_no_rv.fa new file mode 100644 index 00000000..e9385727 --- /dev/null +++ b/pygtftk/data/mini_real_10M/expected_sequence_minus_no_rv.fa @@ -0,0 +1,92 @@ +>ENST00000338370 +AAAGGCTGAGTCCTCTGAGAATTTATTACTACGGATCACAGCAGCAACGGGCGGGAAGGGCGGCGCCAGACTCATTTGCCCCGCAGGTAGATCTTGGGGGTCTGCCAGCCTTCGGGGGCTTCCTTTAGCCCCGCCTTCAGCCAGATGCGCCTCAGGTCTTTCTCGAACTTGATCTGCTTGCGTCTCAGGCGTCCCTCCTGGACCTTCCTCCGCAGGAACCGCGTCTTCTTCACCAGCTTCCGGTACTTGTGGTGGTTCATCTTCCGCCGGCGGATCTTCAGCACGTTTTTGCACTGAATTTGAGGCGCATCCGCGACGCCTTCATCCCCCTGCTCGGCCCCTTCCCCTATCTGGCTGGGCGGACACTGGTAGGATTGCGGTGGAGCCACAGTCCCTGCGGTCCCGGTATCCAGTCTGGGCAGGAAGCAGCGGGCCGTGAGCCAGCTCTCCAGGGGGCTGACGGACATCTTCCTGGGGACCAGCATCTCCTCCAGCTCCAGCTGGGCCCCCTTGCGAGGGAGAGAGGCCGCCCTACCTGGGCCGGCCGGCGATGTGCTGTAAAGGGGCCCGCAGACCCGGCTGCCCAGCACTCCAGAGACGGGCCAAGGCGGGCGGCCGCCTGCCCAAGGAACGGCCCTCAACAGCTGGGAAGTCAGGCGCCCCAGGAGCATGGTCTGTGGGCGGCGGCCACAGGTCCCAGGGGAGCTGGAACACAAGTGCCCGTTCAGGTCAGGCGGCAGCGCCTTCAGTAGTCGCGGGCGGGCCGGGACTGGGGCGTCTGGTCCCGCCGCGACCCTCGCTTCCCTTCTCCCTCCGCCACCCCAACCCACAAGGAGGACTTTGCTTCCAACACAGCTCGCGCCCCGAGGCTCCCAAGCCCCCGACGCGGGCGGTGTCGCGCTCGGACGCACCGAAAGGTCCCAGAACGGGGAGGCCGGCCCCCTCCCCGGGTTCACCCCCGCGCGAATCGCGTTGCCTGGCGCCCGGACCCTCTCGGCTGGACCCCGGGCCCGCCTGCCGCAGCGCCCGGCGCCCTCAGGCCTCCCGCTGACCCTTCCCAAGCCCGACCTCG +>ENST00000338338 +AAAGGCTGAGTCCTCTGAGAATTTATTACTACGGATCACAGCAGCAACGGGCGGGAAGGGCGGCGCCAGACTCATTTGCCCCGCAGGTAGATCTTGGGGGTCTGCCAGCCTTCGGGGGCTTCCTTTAGCCCCGCCTTCAGCCAGATGCGCCTCAGGTCTTTCTCGAACTTGATCTGCTTGCGTCTCAGGCGTCCCTCCTGGACCTTCCTCCGCAGGAACCGCGTCTTCTTCACCAGCTTCCGGTACTTGTGGTGGTTCATCTTCCGCCGGCGGATCTTCAGCACGTTTTTGCACTGAATTTGAGGCGCATCCGCGACGCCTTCATCCCCCTGCTCGGCCCCTTCCCCTATCTGGCTGGGCGGACACTGGTAGGATTGCGGTGGAGCCACAGTCCCTGCGGTCCCGGTATCCAGTCTGGGCAGGAAGCAGCGGGCCGTGAGCCAGCTCTCCAGGGGGCTGACGGACATCTTCCTGGGGACCAGCATCTCCTCCAGCTCCAGCTGGGCCCCCTTGCGAGGGAGAGAGGCCGCCCTACCTGGGCCGGCCGGCGATGTGCTGTAAAGGGGCCCGCAGACCCGGCTGCCCAGCACTCCAGAGACGGGCCAAGGCGGGCGGCCGCCTGCCCAAGGAACGGCCCTCAACAGCTGGGAAGTCAGGCGCCCCAGGAGCATGGTCTGTGGGCGGCGGCCACAGGTCCCAGGGGAGCTCGACGCGGCTCAAATTGACCGTTCTGCGGCCGCCCTCGGGCACTTCCGGTCCGTCCCCAAGTCGGCCCCGATCGGCAGCGGCCACCCGGCGGTTCCTACGCACAGCGCCCGCTGGCGTCCTCGCGGCCCCCGATTCTGCATTGGCTCAGGCCCCGCCGGGCCCGAAAGGCGACGGTTTCCGGTTAGTGGAATCACGGTCCCAGTCCTCGCGCGGTTCCTCAGCTCCGCCTGGTCCCTTACGGAGGCAAAAAACTACATTTCCCACAATCCCAGGGGGTGCGGGCCCTGGATATACCCGCAGGTCCAGAATCGTTTCCGGACCACCCAGGGGCCGGATTCC +>ENST00000321751 +AGGCTGAGTCCTCTGAGAATTTATTACTACGGATCACAGCAGCAACGGGCGGGAAGGGCGGCGCCAGACTCATTTGCCCCGCAGGTAGATCTTGGGGGTCTGCCAGCCTTCGGGGGCTTCCTTTAGCCCCGCCTTCAGCCAGATGCGCCTCAGGTCTTTCTCGAACTTGATCTGCTTGCGTCTCAGGCGTCCCTCCTGGACCTTCCTCCGCAGGAACCGCGTCTTCTTCACCAGCTTCCGGTACTTGTGGTGGTTCATCTTCCGCCGGCGGATCTTCAGCACGTTTTTGCACTGAATTTGAGGCGCATCCGCGACGCCTTCATCCCCCTGCTCGGCCCCTTCCCCTATCTGGCTGGGCGGACACTGGTAGGATTGCGGTGGAGCCACAGTCCCTGCGGTCCCGGTATCCAGTCTGGGCAGGAAGCAGCGGGCCGTGAGCCAGCTCTCCAGGGGGCTGACGGACATCTTCCTGGGGACCAGCATCTCCTCCAGCTCCAGCTGGGCCCCCTTGCGAGGGAGAGAGGCCGCCCTACCTGGGCCGGCCGGCGATGTGCTGTAAAGGGGCCCGCAGACCCGGCTGCCCAGCACTCCAGAGACGGGCCAAGGCGGGCGGCCGCCTGCCCAAGGAACGGCCCTCAACAGCTGGGAAGTCAGGCGCCCCAGGAGCATGGTCTGTGGGCGGCGGCCACAGGTCCCAGGGGAGCCTCTCGGCTGGACCCCGGGCCCGCCTGCCGCAGCGCCCGGCGCCCTCAGGCCTCCCGCTGACCCTTCCCAAGCCCGACCTCGACGCGGCTCAAA +>ENST00000378853 +GAGTCCTCTGAGAATTTATTACTACGGATCACAGCAGCAACGGGCGGGAAGGGCGGCGCCAGACTCATTTGCCCCGCAGGTAGATCTTGGGGGTCTGCCAGCCTTCGGGGGCTTCCTTTAGCCCCGCCTTCAGCCAGATGCGCCTCAGGTCTTTCTCGAACTTGATCTGCTTGCGTCTCAGGCGTCCCTCCTGGACCTTCCTCCGCAGGAACCGCGTCTTCTTCACCAGCTTCCGGTACTTGTGGTGGTTCATCTTCCGCCGGCGGATCTTCAGCACGTTTTTGCACTGAATTTGAGGCGCATCCGCGACGCCTTCATCCCCCTGCTCGGCCCCTTCCCCTATCTGGCTGGGCGGACACTGGTAGGATTGCGGTGGAGCCACAGTCCCTGCGGTCCCGGTATCCAGTCTGGGCAGGAAGCAGCGGGCCGTGAGCCAGCTCTCCAGGGGGCTGACGGACATCTTCCTGGGGACCAGCATCTCCTCCAGCTCCAGCTGGGCCCCCTTGCGAGGGAGAGAGGCCGCCCTACCTGGGCCGGCCGGCGATGTGCTGTAAAGGGGCCCGCAGACCCGGCTGCCCAGCACTCCAGAGACGGGCCAAGGCGGGCGGCCGCCTGCCCAAGGAACGGCCCTCAACAGCTGGGAAGTCAGGCGCCCCAGGAGCATGGTCTGTGGGCGGCGGCCACAGGTCCCAGGGGAGCGAAAGGTCCCAGAACGGGGAGGCCGGCCCCCTCCCCGGGTTCACCCCCGCGCGAATCGCGTTGCCTGGCGCCCGGACCCTCTCGGCTGGACCCCGGGCCCGCCTGCCGCAGCGCCCGGCGCCCTCAGGCCTCCCGCTGACCCTTCCCAAGCCCGACCTCGACGCGGCTCAAATTGA +>ENST00000489799 +GGCAGGAAGCAGCGGGCCGTGAGCCAGCTCTCCAGGGGGCTGACGGACATCTTCCTGGGGACCAGCATCTCCTCCAGCTCCAGCTGGGCCCCCTTGCGAGGGAGAGAGGCCGCCCTACCTGGGCCGGCCGGCGATGTGCTGTAAAGGGGCCCGCAGACCCGGCTGCCCAGCACTCCAGAGACGGGCCAAGGCGGGCGGCCGCCTGCAGAAAACCAGACGCCACGGTCACCGCTCGCGAGACCACACAGGCCCGTCGGGTTGAGGAGCAGCAGGTTCGTCCCAGCGAGGATCCCCCGCACCTCATTCCTGGCCTGAACCCCTGAGGTTCCCTCTGTGAGCATCGGAAGCTTAGAGGGGAAAGAGTGTGTGTGTGGCCACCGGCCCTGCCCCAGCGGAGCTGCTGAGACCCGCACTCCTAACCAGGTGTGCATCCTCCCATCCGCCCCCGCGCGGCTTCCTACCTGCCCAAGGAACGGCCCTCAACAGCTGGGAAGTCAGGCGCCCCAGGAGCATGGTCTGTGGGCGGCGGCCACAGGTCCCAGGGGAGCGAAAGGTCCCAGAACGGGGAGGCCGGCCCCCTCCCCGGGTTCACCCCCGCGCGAATCGCGTTGCCTGGCGCCCGGACCCTCTCGGCTGGACCCCGGGCCCGCCTGCCGCAGCGCCCGGCGCCCTCAGGCCTCCCGCTGACCCTTCCC +>ENST00000496905 +GCGGCCGCCTGCAGAAAACCAGACGCCACGGTCACCGCTCGCGAGACCACACAGGCCCGTCGGGTTGAGGAGCAGCAGGTTCGTCCCAGCGAGGATCCCCCGCACCTCATTCCTGGCCTGAACCCCTGAGGTTCCCTCTGTGAGCATCGGAAGCTGCCCAAGGAACGGCCCTCAACAGCTGGGAAGTCAGGCGCCCCAGGAGCATGGTCTGTGGGCGGCGGCCACAGGTCCCAGGGGAGCTGGAACACAAGTGCCCGTTCAGGTCAGGCGGCAGCGCCTTCAGTAGTCGCGGGCGGGCCGGGACTGGGGCGTCTGGTCCCGCCGCGACCCTCGCTTCCCTTCTCCCTCCGCCACCCCAACCCACAAGGAGGACTTTGCTTCCAACACAGCTCGCGCCCCGAGGCTCCCAAGCCCCCGACGCGGGCGGTGTCGCGCTCGGACGCACCGAAAGGTCCCAGAACGGGGAGGCCGGCCCCCTCCCCGGGTTCACCCCCGCGCGAATCGCGTTGCCTGGCGCCCGGACCCTCTCGGCTGGACCCCGGGCCCGCCTGCCGCAGCGCCCGGCGCCCTCAGGCCTCCCGCTGACCCTTCCCAAGCCCGACCTCGAC +>ENST00000378602 +ACCACTTAAATACAAACTTTATTCTCTCTCCAAGAAGATGCAGACGTCACAGGTGGCCCTGAGCTCCCACCCGAGGCTTAGGCCCAAGGGGCCTCTTCCAGGCTGAGGGCCTGCTGGGGCTGGGCCAGGGGCTGAGGCTGAAAGCAGCAGCCTGCCTAGTGGGTGACGCCAGGGGCCGGTGTAACATGGCACCGAGGTTGGGGCCACAGCAATGTGTGGGACGGTGGGGTGGGCTGGGGCCCTTGGCTCCAAGCATTAGTTCTCCAAGCTCTGGTCCGTTCTCCTACCTCCTTCAAGGGGCACCAGGGCTACAAGGTGGTAGTTGAGTATTGGGGCCCGACTCCTGGGGCACTGGAGTGGTCTCTAGGCCCGAGGCCCCAAGGAGAGGGCTGGGTTTCTGGGAGAGTGCTGGTCCTTCCTCTCTGGGCTTGGCCATCTTGACAGCTTCATCGTAGGAGGGTGGAGGCTCCGGGGTGTACAGGCTGTAGGCAGGAGGAGCCATGGAGTCCAGGTCCAGCTCCCCAAAGGGCAGGGGCAACCGCATGCCCAGTGGGTACTGCACGGAGCTGTAGGAGGTCACAGTGCTGTGTACAGGGCTGTCACTGTCCATAGGGATGACTGCCACGTCGCAGGGCTGCCGTGCTGGTGGCAGATGTGGCTGGGCCTGTGCCTGCTTCCGGAGGCAGCAGAACCGGACACAACCAGCTGTGACACCACACAGCAGAAGCAGGAGGACCGCCAGCAGGATGAGCCTAGGAGAGCAAGGCTCTACCACTGGACTGACCCTCGGCCACCGGGCACCTGCACCCTGGGGAATGTCGTGGCACAACCACCGAAGACAGGTTAACAGGATAAAAAGCAGACAATGTCTCTCCATGTCGGAGACCGCCGTGGCCAGAGCCTGGCCTCGGGCTGCTGGGCCTGCCCTGGCTATCTCTCCTGGGCTGGCCAGGGGTGGCCTTGGGCTCACTCCCAGGACTCGCTGTCCTCAGCGAGTGCCCCACTGCTGAGCGGGATCGTAGGGGACTCCCGCGGAGGCCAGGCGGGAGAGGTGGGAGGGAAGGTCCTGCTTGCTCCAGGTCAGTTCCCGCCAGCGGCCGGGACTGGGCGACAGCGGA +>ENST00000310991 +CCACTTAAATACAAACTTTATTCTCTCTCCAAGAAGATGCAGACGTCACAGGTGGCCCTGAGCTCCCACCCGAGGCTTAGGCCCAAGGGGCCTCTTCCAGGCTGAGGGCCTGCTGGGGCTGGGCCAGGGGCTGAGGCTGAAAGCAGCAGCCTGCCTAGTGGGTGACGCCAGGGGCCGGTGTAACATGGCACCGAGGTTGGGGCCACAGCAATGTGTGGGACGGTGGGGTGGGCTGGGGCCCTTGGCTCCAAGCATTAGTTCTCCAAGCTCTGGTCCGTTCTCCTACCTCCTTCAAGGGGCACCAGGGCTACAAGGTGGTAGTTGAGTATTGGGGCCCGACTCCTGGGGCACTGGAGTGGTCTCTAGGCCCGAGGCCCCAAGGAGAGGGCTGGGTTTCTGGGAGAGTGCTGGTCCTTCCTCTCTGGGCTTGGCCATCTTGACAGCTTCATCGTAGGAGGGTGGAGGCTCCGGGGTGTACAGGCTGTAGGCAGGAGGAGCCATGGAGTCCAGGTCCAGCTCCCCAAAGGGCAGGGGCAACCGCATGCCCAGTGGGTACTGCACGGAGCTGTAGGAGGTCACAGTGCTGTGTACAGGGCTGTCACTGTCCATAGGGATGACTGCCACGTCGCAGGGCTGCCGTGCTGGTGGCAGATGTGGCTGGGCCTGTGCCTGCTTCCGGAGGCAGCAGAACCGGACACAACCAGCTGTGACACCACACAGCAGAAGCAGGAGGACCGCCAGCAGGATGAGCCCCACGTGCCACAGGCTGCTCCAGCGGGCCTGGGGCGGGCACTGGTCCGAGGGGTCGCAGCTGCCGTCCGCGAAGCCCAGCGCCACCTGCGGCAGCGGCAGGAGCGGCAGGAGCGGCAGGAGCGGCAGCAGCAGCCGCAGTCCGCGGGCGGCCAGCGGCCCCCGGGCCATGCTCTGAG +>ENST00000378598 +TTAGTTCTCCAAGCTCTGGTCCGTTCTCCTACCTCCTTCAAGGGGCACCAGGGCTACAAGGTGGTAGTTGAGTATTGGGGCCCGACTCCTGGGGCACTGGAGTGGTCTCTAGGCCCGAGGCCCCAAGGAGAGGGCTGGGTTTCTGGGAGAGTGCTGGTCCTTCCTCTCTGGGCTTGGCCATCTTGACAGCTTCATCGTAGGAGGGTGGAGGCTCCGGGGTGTACAGGCCCACGTGCCACAGGCTGCTCCAGCGGGCCTGGGGCGGGCACTGGTCCGAGGGGTCGCAGCTGCCGTCCGCGAAGCCCAGCGCCACCTGTGGGGACAAGGGTGAGCCCGGGAGGGGCGTGGTCCGAGCAGGGACCCGCCCCGCGGTGGCCGAACCGAGAGAGAACGCCGCCCGACCCACCTGCGGCAGCGGCAGGAGCGGCAGGAGCGGCAGGAGCGGCAGCAGCAGCCGCAGTCCGCGGGCGGCCAGCGGCCCCC +>ENST00000470931 +GGCACTGGAGTGGTCTCTAGGCCCGAGGCCCCAAGGAGAGGGCTGGGTTTCTGGGAGAGTGCTGGTCCTTCCTCTCTGGGCTTGGCCATCTTGACAGCTTCATCGTAGGAGGGTGGAGGCTCCGGGGTGTACAGGCTGTAGGCAGGAGGAGCCATGGAGTCCAGGTCCAGCTCCCCAAAGGGCAGGGGCAACCGCATGCCCAGTGGGTACTGCACGGAGCTGTAGGAGGTCACAGTGCTGTGTACAGGGCTGTCACTGTCCATAGGGATGACTGCCACGTCGCAGGGCTGCCGTGCTGGTGGCAGATGTGGCTGGGCCTGTGCCTGCTTCCGGAGGCAGCAGAACCGGACACAACCAGCTGTGACACCACACAGCAGAAGCAGGAGGACCGCCAGCAGGATGAGCCCCACGTGCCACAGGCTGCTCCAGCGGGCCTGGGGCGGGCACCTGTGGGGACGGCGGCACCTGGAGCAGGCGGGGCATGGGACGGCCGACCTCGCCACCCGTGCCTCCCCATAGGGCGGGGCCAGGCCCCGGCTCCCTCCCCCCCGACTTACTGGTCCGAGGGGTCGCAGCTGCCGTCCGCGAAGCCCAGCGCCACCTGCGGCAGCGGCAGGAGCGGCAGGAGCGGCAGGAGCGGCAGCAGCAGCCGCAGTCCGCGGGCGGCCAGCGGCCCCCGGGCCATGCTCT +>ENST00000602604 +AGGTCCAGCTCCCCAAAGGGCAGGGGCAACCGCATGCCCAGTGGGTACTGCACGGAGCTGTAGGAGGTCACAGTGCTGTGTACAGGGCTGTCACTGTCCATAGGGATGACTGCCACGTCGCAGGGCTGCCGTGCTGGTGGCAGATGTGGCTGGGCCTGTGCCTGCTTCCGGAGGCAGCAGAACCGGACACAACCAGCTGTGACACCACACAGCAGAAGCAGGAGGACCGCCAGCAGGATGAGCCTAGGAGAGCAAGGCTCTACCACTGGACTGACCCTCGGCCACCGGGCACCTGCACCCTGGGGAATGTCGTGGCACAACCACCGAAGACAGGTTAACAGGATAAAAAGCAGACAATGTCTCTCCATGTCGGAGACCGCCGTGGCCAGAGCCTGGCCTCGGGCTGCTGGGCCTGCCCTGGCTATCTCTCCTGGGCTGGCCAGGGGTGGCCTTGGGCTCACTCCCAGGACTCGCTGTCCTCAGCGAGTGCCCCACTGCTGAGCGGGATCGTAGGGGACTCCCGCGGAGGCCAGGCGGGAGAGGTGGGAGGGAAGGTCCTGCTTGCTCCAGGTCAGTTCCCGCCAGCGGCCGGGACTGGGCGACAGCGGAGGCGGCCTGGTGAGGTAAGGGCCTGGCGGGCCTGGCCCCGGTGACCCCCGCCCCAGAACCGTCGGACGCACGGCTCCGCCGCGGCCTCCACTTACCCCACGTGCCACAGGCTGCTCCAGCGGGCCTGGGGCGGGCACTGGTCCGAGGGGTCGCAGCTGCCGTCCGCGAAGCCCAGCGCCACCTGCGGCAGCGGCAGGAGCGGCAGGAGCGGCAGGAGCGGCAGCAGCAGCCGCAGTCCGCGGGCGGCCAGCGGCCCCCGGGCCATGCTC +>ENST00000416272 +TGTGACACCACACAGCAGAAGCAGGAGGACCGCCAGCAGGATGAGCCCCACGTGCCACAGGCTGCTCCAGCGGGCCTGGGGCGGGCACTGGTCCGAGGGGTCGCAGCTGCCGTCCGCGAAGCCCAGCGCCACCTGTGGGGACAAGGGTGAGCCCGGGAGGGGCGTGGTCCGAGCAGGGACCCGCCCCGCGGTGGCCGAACCGAGAGAGAACGCCGCCCGACCCACCTGCGGCAGCGGCAGGAGCGGCAGGAGCGGCAGGAGCGGCAGCAGCAGCCGCAGTCCGCGGGCGGCCAGCGGCCCCCGGGCCATGCTC +>ENST00000400919 +AGGCAGATTGAAATGCTGACTTTCTCACTGTTTCATTTTGTGATTGAAGTGCGTGCAAAACACTCAATCTGGTAGGGATGATGCCCGCGCGGAGCTGACCCTTCTCCTATTGTTTTTCCAAGCTGGAGAAGAAGCAGGCGCTCCCTCCATTCCAGCCACAGATCACAGACGACTACGGTCTGGACAACTTTGACACACAGTTCACCAGCGAGCCCGTGCAGCTGACCCCAGACGATGAGTGAGTCCCACTGGGTGCGGGTCCCTGGAGCACCCCTCGGGCAGCCCCATGGCAGGCCGGCACCTTGGGCAGCTGGTGACCCAGCCTGCCCTTGAGTCCCACCCGCCTGGTGTCATCTCTCCAGTGGGCGTTGGGGGAGGATTCTTATGCGAACGTGACTCCGCTTCCCCCAAGGGAATGAACACACGGTCACCCCCCTCCCCCCTGCCACCTTTGCCCACAGGGATGCCATAAAGAGGATCGACCAGTCAGAGTTCGAAGGCTTTGAGTATATCAACCCATTATTGCTGTCCACCGAGGAGTCGGTGTGAGGCCGCGTGCGTCTCTGTCGTGGACACGCGTGATTGACCCTTTAACTGTATCCTTAACCACCGCATATGCATGCCAGGCTGGGCACGGCTCCGAGGGCGGCCAGGGACAGACGCTTGCGCCGAGACCGCAGAGGGAAGCGTCAGCGGGCGCTGCTGGGAGCAGAACAGTCCCTCACACCTGGGCCCGGGCAGGCCAGCTTCGTGCTGGAGGAACTTGCTGCTGTGCCTGCGTCGCGGCGGATCCGCGGGGACCCTGCCGAGGGGGCTGTCATGCGGTTTCCAAGGTGCACATTTTCCACGGAAACAGAACTCGATGCACTGACCTGCTCCGCCAGGAAAGTGAGCGTGTAGCGTCCTGAGGAATAAAATGTTCCGATGATGTGGAAGCTCCTCTGATGCCTTTTTTCCGTGAGTGGCGCCTGCCCCACATCTCAGACGCAACCCACACGTAGGGGGGCAGCTTAGGAGCCAGCGGGACACAGGTGGGGGCGGGAGTTGAAGTACCTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACAGACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGGGACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCCGGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAGACTTCAGTGGGCTCCGGGCCGCACCTGGGCTCCCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCGCCGCCTCCATCCAAGCCCGCGCCGGGCGGAAGTGAG +>ENST00000469733 +CAGATTGAAATGCTGACTTTCTCACTGTTTCATTTTGTGATTGAAGTGCGTGCAAAACACTCAATCTGGTAGGGATGATGCCCGCGCGGAGCTGACCCTTCTCCTATTGTTTTTCCAAGCTGGAGAAGAAGCAGGCGCTCCCTCCATTCCAGCCACAGATCACAGACGACTACGGTCTGGACAACTTTGACACACAGTTCACCAGCGAGCCCGTGCAGCTGACCCCAGACGATGAGTGAGTCCCACTGGGTGCGGGTCCCTGGAGCACCCCTCGGGCAGCCCCATGGCAGGCCGGCACCTTGGGCAGCTGGTGACCCAGCCTGCCCTTGAGTCCCACCCGCCTGGTGTCATCTCTCCAGTGGGCGTTGGGGGAGGATTCTTATGCGAACGTGACTCCGCTTCCCCCAAGGGAATGAACACACGGTCACCCCCCTCCCCCCTGCCACCTTTGCCCACAGGGATGCCATAAAGAGGATCGACCAGTCAGAGTTCGAAGGCTTTGAGTATATCAACCCATTATTGCTGTCCACCGAGGAGTCGGTGTGAGGCCGCGTGCGTCTCTGTCGTGGACACGCGTGATTGACCCTTTAACTGTATCCTTAACCACCGCATATGCATGCCAGGCTGGGCACGGCTCCGAGGGCGGCCAGGGACAGACGCTTGCGCCGAGACCGCAGAGGGAAGCGTCAGCGGGCGCTGCTGGGAGCAGAACAGTCCCTCACACCTGGGCCCGGGCAGGCCAGCTTCGTGCTGGAGGAACTTGCTGCTGTGCCTGCGTCGCGGCGGATCCGCGGGGACCCTGCCGAGGGGGCTGTCATGCGGTTTCCAAGGTGCACATTTTCCACGGAAACAGAACTCGATGCACTGACCTGCTCCGCCAGGAAAGTGAGCGTGTAGCGTCCTGAGGAATAAAATGTTCCGATGATGTGGAAGCTCCTCTGATGCCTTTTTTCCGTGAGTGGCGCCTGCCCCACATCTCAGACGCAACCCACACGTAGGGGGGCAGCTTAGGAGCCAGCGGGACACAGGTGGGGGCGGGAGTTGAAGTACCTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACAGACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGGGACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCCGGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAGACTTCAGTGGGCTCCGGGCCGCACCTGGGCTCCTTGTCCTGCCTGTCCTCAAGTTATCAGCATGACACAGCGGTGCTGGTGATGGTGATGGTGGAGGTTTCAAAGTTGAACCTGATGAAAACGCTCCACTTCTTCGGAGCCATCTGCTGCTGTGGTGACGGAGTTTTGCTGTGGCGCACAGGTTTCCACTTGTCATAGGAAACTGTGCTTGGTGCATCCCCTGTGCAGCCGGCTGTGAACTGTGGGCTCCAACCCTGCTTGGTTTGCTTCAACTTTCTGAGTGACGTGCAGACCTTCACAGAGGAGCCGTGGGGTGGCTCCATCCAACGCCTCCCTCGCTGCCCCGGTGCAGGCCACCCTGCTGCTCCAGCTCAGTCCAGCACAGGTGTTCTCGCTCTGGGGTTGGCCTGGCGCTGACCTGTGCACCTGACAGGGAAGGTAGGCAGCTCTGGAGCTGGCTGGTGCCCCTCACCTGGGGTGGAGCTGGGGCAGGTCCCACATTTCTCAGAAGGACTCCAGGATGCAGCTGCGTCTGGGGCCTTTTGGAGGGAGTGGCCCAGCTCTCCCGGCCTTTGCCACCCGGCGTCCTGTCCCAGTTTATCTGTGTCCAGTCCGATTGATGGGCTCATGGATTGGAAAGCTGTGACAGACGCCCTGGGCGTGGGGTGGGTGTGATTCTGAGACTAAGGCTCTGGGGGCCGGGCGTGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCCGAGGCGGGCGGATCACGAGGTCAGGAGATCGAGACCATCCTGGCTAACACGGTGAAACCCTGTCTCTATGGAAACTCCCTGTCTTGGGGCCGCGCACACCATGCCTGGCAGGAGCTGGAGATGCAGCAGAGCAGACGCGGCTGCAGGAGCAGCCGTGTTTCCTACAGTGGAGAAGGGGACCCTGGCAGGAGCACTGCCCAGCCAGGCACGTGGTGCTCAACCCTGTGGGCACTGACCCCACAAAAG +>ENST00000414253 +GACTTTCTCACTGTTTCATTTTGTGATTGAAGTGCGTGCAAAACACTCAATCTGGTAGGGATGATGCCCGCGCGGAGCTGACCCTTCTCCTATTGTTTTTCCAAGCTGGAGAAGAAGCAGGCGCTCCCTCCATTCCAGCCACAGATCACAGACGACTACGGTCTGGACAACTTTGACACACAGTTCACCAGCGAGCCCGTGCAGCTGACCCCAGACGATGAGTGAGTCCCACTGGGTGCGGGTCCCTGGAGCACCCCTCGGGCAGCCCCATGGCAGGCCGGCACCTTGGGCAGCTGGTGACCCAGCCTGCCCTTGAGTCCCACCCGCCTGGTGTCATCTCTCCAGTGGGCGTTGGGGGAGGATTCTTATGCGAACGTGACTCCGCTTCCCCCAAGGGAATGAACACACGGTCACCCCCCTCCCCCCTGCCACCTTTGCCCACAGGGATGCCATAAAGAGGATCGACCAGTCAGAGTTCGAAGGCTTTGAGTATATCAACCCATTATTGCTGTCCACCGAGGAGTCGGTGTGAGGCCGCGTGCGTCTCTGTCGTGGACACGCGTGATTGACCCTTTAACTGTATCCTTAACCACCGCATATGCATGCCAGGCTGGGCACGGCTCCGAGGGCGGCCAGGGACAGACGCTTGCGCCGAGACCGCAGAGGGAAGCGTCAGCGGGCGCTGCTGGGAGCAGAACAGTCCCTCACACCTGGGCCCGGGCAGGCCAGCTTCGTGCTGGAGGAACTTGCTGCTGTGCCTGCGTCGCGGCGGATCCGCGGGGACCCTGCCGAGGGGGCTGTCATGCGGTTTCCAAGGTGCACATTTTCCACGGAAACAGAACTCGATGCACTGACCTGCTCCGCCAGGAAAGTGAGCGTGTAGCGTCCTGAGGAATAAAATGTTCCGATGATGTGGAAGCTCCTCTGATGCCTTTTTTCCGTGAGTGGCGCCTGCCCCACATCTCAGACGCAACCCACACGTAGGGGGGCAGCTTAGGAGCCAGCGGGACACAGGTGGGGGCGGGAGTTGAAGTACCCCTCAGGTGAAGGCACAGCTGTCCAGAGCTGAGGCTTCCTAGAGGCAGGGCTGCCAGCTGCCAGGTGTCAGGTGTGGCAGAGCCGTCTTCTGAGCTCCCTGGGAGAGGGGGTCGCGCCACCTCATGCCTCTGAGTGAGGCCTGGTGCACAGGTGTGGAAATTGCCACGCAGCCCTCTTGGCCAGGCGCAGAGACCCCAGGCCTCCATGACTCAGGGGCCGCTCCACCCCATTGTGCGGCTGGTGGCTAAATACTGCCGTGTTGCCAGTAGCGTGCCGGTTACCAGTTTGGCCGTTCTTGTACACAATATGTGAGTAATGCTGTGCTCATCAGAGGGGAGACTTTTATATTCAGTAATTTGTTTTATAAATTAAAGTGAAGGATGTATTGAAGTGTGGTTTGAAAAATCCTGATATTTGCTAATGGCTCCGGTCACGACGGTGTCTTTTGGAAGTGGTTCTCGAAAACTCTGGTGACTTGGGGGCTGCACAGTGGGCCTGCGTGGGCGTGGTGCGGGGCAACTGCCCATGGAGCCCGTGGCTGGCCGGCTCTCCTGTGGATGACACTCACCCTTGACTGCCAGGGTCATTCAAAGTCTTGCACATCCATGAAAGACACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGCCTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACAGACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGGGACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCCGGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAGACTTCAGTGGGCTCCGGGCCGCACCTGGGCTCCTGTCCTGGGAAGGCGGGCAGTGAAGGCACCTCGTGATCCAGGATCAGCTCCGGGCTCACCGTGCGCAGTAGCTCGGCCCAGAGCCGCTCCCGCTCATCACCCCCCAGGAGAAACCAGGGGCGGCCGCCAGAAGGCCCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCGCCGCCTCCATCCAAGCCCGCGCCGGGCGGAAGTGAG +>ENST00000428120 +GACTTTCTCACTGTTTCATTTTGTGATTGAAGTGCGTGCAAAACACTCAATCTGGTAGGGATGATGCCCGCGCGGAGCTGACCCTTCTCCTATTGTTTTTCCAAGCTGGAGAAGAAGCAGGCGCTCCCTCCATTCCAGCCACAGATCACAGACGACTACGGTCTGGACAACTTTGACACACAGTTCACCAGCGAGCCCGTGCAGCTGACCCCAGACGATGAGTGAGTCCCACTGGGTGCGGGTCCCTGGAGCACCCCTCGGGCAGCCCCATGGCAGGCCGGCACCTTGGGCAGCTGGTGACCCAGCCTGCCCTTGAGTCCCACCCGCCTGGTGTCATCTCTCCAGTGGGCGTTGGGGGAGGATTCTTATGCGAACGTGACTCCGCTTCCCCCAAGGGAATGAACACACGGTCACCCCCCTCCCCCCTGCCACCTTTGCCCACAGGGATGCCATAAAGAGGATCGACCAGTCAGAGTTCGAAGGCTTTGAGTATATCAACCCATTATTGCTGTCCACCGAGGAGTCGGTGTGAGGCCGCGTGCGTCTCTGTCGTGGACACGCGTGATTGACCCTTTAACTGTATCCTTAACCACCGCATATGCATGCCAGGCTGGGCACGGCTCCGAGGGCGGCCAGGGACAGACGCTTGCGCCGAGACCGCAGAGGGAAGCGTCAGCGGGCGCTGCTGGGAGCAGAACAGTCCCTCACACCTGGGCCCGGGCAGGCCAGCTTCGTGCTGGAGGAACTTGCTGCTGTGCCTGCGTCGCGGCGGATCCGCGGGGACCCTGCCGAGGGGGCTGTCATGCGGTTTCCAAGGTGCACATTTTCCACGGAAACAGAACTCGATGCACTGACCTGCTCCGCCAGGAAAGTGAGCGTGTAGCGTCCTGAGGAATAAAATGTTCCGATGATGTGGAAGCTCCTCTGATGCCTTTTTTCCGTGAGTGGCGCCTGCCCCACATCTCAGACGCAACCCACACGTAGGGGGGCAGCTTAGGAGCCAGCGGGACACAGGTGGGGGCGGGAGTTGAAGTACCCCTCAGGTGAAGGCACAGCTGTCCAGAGCTGAGGCTTCCTAGAGGCAGGGCTGCCAGCTGCCAGGTGTCAGGTGTGGCAGAGCCGTCTTCTGAGCTCCCTGGGAGAGGGGGTCGCGCCACCTCATGCCTCTGAGTGAGGCCTGGTGCACAGGTGTGGAAATTGCCACGCAGCCCTCTTGGCCAGGCGCAGAGACCCCAGGCCTCCATGACTCAGGGGCCGCTCCACCCCATTGTGCGGCTGGTGGCTAAATACTGCCGTGTTGCCAGTAGCGTGCCGGTTACCAGTTTGGCCGTTCTTGTACACAATATGTGAGTAATGCTGTGCTCATCAGAGGGGAGACTTTTATATTCAGTAATTTGTTTTATAAATTAAAGTGAAGGATGTATTGAAGTGTGGTTTGAAAAATCCTGATATTTGCTAATGGCTCCGGTCACGACGGTGTCTTTTGGAAGTGGTTCTCGAAAACTCTGGTGACTTGGGGGCTGCACAGTGGGCCTGCGTGGGCGTGGTGCGGGGCAACTGCCCATGGAGCCCGTGGCTGGCCGGCTCTCCTGTGGATGACACTCACCCTTGACTGCCAGGGTCATTCAAAGTCTTGCACATCCATGAAAGACACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGCCTGCCTCAGCCTCTCAAAGGGCTGGGATTACAGGCGTGAGCCACCGTGCCCGGCCTTTTCTTTTGTTGTTGTTGTTGTTGGCTGCCAACTTTGGACTCCGGTGCCTTCGCATTCCCGAGCTGTTTTTGCTTCTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACAGACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGGGACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCCGGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAGACTTCAGTGGGCTCCGGGCCGCACCTGGGCTCCTGTCCTGGGAAGGCGGGCAGTGAAGGCACCTCGTGATCCAGGATCAGCTCCGGGCTCACCGTGCGCAGTAGCTCGGCCCAGAGCCGCTCCCGCTCATCACCCCCCAGGAGAAACCAGGGGCGGCCGCCAGAAGGCCCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCGCC +>ENST00000400918 +CAGTCCCTCACACCTGGGCCCGGGCAGGCCAGCTTCGTGCTGGAGGAACTTGCTGCTGTGCCTGCGTCGCGGCGGATCCGCGGGGACCCTGCCGAGGGGGCTGTCATGCGGTTTCCAAGGTGCACATTTTCCACGGAAACAGAACTCGATGCACTGACCTGCTCCGCCAGGAAAGTGAGCGTGTAGCGTCCTGAGGAATAAAATGTTCCGATGATGTGGAAGCTCCTCTGATGCCTTTTTTCCGTGAGTGGCGCCTGCCCCACATCTCAGACGCAACCCACACGTAGGGGGGCAGCTTAGGAGCCAGCGGGACACAGGTGGGGGCGGGAGTTGAAGTACCTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACAGACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGGGACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCCGGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAGACTTCAGTGGGCTCCGGGCCGCACCTGGGCTCCTGTCCTGGGAAGGCGGGCAGTGAAGGCACCTCGTGATCCAGGATCAGCTCCGGGCTCACCGTGCGCAGTAGCTCGGCCCAGAGCCGCTCCCGCTCATCACCCCCCAGGAGAAACCAGGGGCGGCCGCCAGAAGGCCCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCGCCGCCTCCATCC +>ENST00000497675 +GACGTTTCATCACAACACAGAGACAGACAGGAGCCCGCCCTGCTTTAATGCGCATGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGAGCGTGTCCGGGCGCCGCACTCTGCGCAGGGCTCTTGGATGGCGCTCACCACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGCCTGCAAGGGAGGGGCCACACTCACTCGGCCACCTCCGCGGCATGCTGGCCGCAGAGAGCACCGTCTGGACCTCCGGGCCCTCTCTGCTCCTGCCGCTGGAGAGGATCCGGCTGGTCAGAAACAAGGGACGGGGCCACCCCAGGGGCTCATGCACCCGGCAGACCACGGTAACCGCCAGTGGTGTTTCCACACCGTGCCCGTGAGGAGGCCACGCCAGGCCCCTGCGTCCGAGCTGGGGGTGGGGAAGCTGTGTCTCAACAAGCCTCTCTATGGGATTCTGGCGCCTGCTCAGCTTGAGAACGCGCTCATCGTGGAGCCCGGCAGACAGGCGGCCTGACCCGGAGAAAAGGCAGGACGGCGGGTGGCCTGCCAGGGAGAGCCGCCGCGGCTGCGTCTACAGGAGGCAGAAGAGTAAACATGGCTGGGCAGTGGATGTGCAGCTCACGTCAGAGAATTGGTGTTTCTGGCGAGGAGGGACCAAGCCTCACCACGGAGAAGGACGCCGTCACCGGCGTGCAGGCTGCCAACCTGCCACTCTGGGAGGCCCCACGCGGCCCCTGCACCTCTCAGGAGGGCGCTGGCGCTGGGATGGTGGCCGGCCAGGCAGGGGTGGCAGGAGAAAACCCATCCGAGTCCTGCAGGTCAGCGCCCTGGGCATCCAGTGGGGCCGGGAGGGGTGTCTGAGCGCAGCCACCTTCTATCCCCGGCCTCATGTGGCCCCATCAGCCCAACTGGAGCGGCTGGAAATGACCATCACCAGGCCTGGCCAAGGTGTGGCCCTGGAAGCCAGGACAGTTGACTTCCGGCCATGACTCCCGGAGAGTGCCGGAGCTGGCGTGCTCAGCAGAGCTGCCGGGGACGATGTCCCGGGGCTGAGTGGGCGGCTTCAGCCTAGACTTGGGCCTAGATCTTGCTGGAGGCCAAGTGGTCAGTGTCCCATCAGAGTGACCATCCCTCACACGCCACTGCTGGGGGACACACCCCCACTGAGCGGCCAAGTCCACAGGACACGTGTCCCTGTGTCCACCTGTCAGCCACACCGCCCCTCGCTCCCCTACAGCCTCTGCCCTCAGACCAGTCCACGGCGCGCCGTTTTACCCTTGGGCTTTGCTGTGTCCCTTCCTTTGGCTCCTGTGCCCCGTCTGTGTGGCCACTGCAACCCTCAAGTCCCCCTCTCCAGACCATAGCTGGACCCCCACTCCCGGGGCTGGCTCCAGCAGCCATCAGCTGCCTTCTCACTCTGGCAGAGCCCACCCAGTGCCTTCTGAAGCCCCCGAGGGTCACTCAGTCTGAGACTTTCCGGCTTCTGCCCATCCTGGGAACCAGCCCCTCCCTCCAGAAGCTTTCTCTAAGGTTGCCAGAAGGTGCTAAGATCTGAACCGAGGTCATCTTGTCCCGGGGTTTCCAGGCAGCGTCCCTTGTTTGGGGGCCCTCTGAGATGCCTTCAGACCCCCGCCTGTGGCGGAAGAGCTTTGTCCTGGCCTGATCTGCCCTGTCCGTGACGCTTCTGCTCAGTAGCTGAGCACGCCCTGTGGTGTGGACAGGCCAGCCCGGCTGCAGGACAGTGGGGGCTCAGTCCAGAAGCCTCTGGTGGCTTCTGCGTGTGGGCAGGGGAGCAGGGCTGCAGGGTGGGCTGGCACCTGGCAGCGTGAGGGGCCTCAGGGCTGTTAAAATCCCAACGACCGGCCGGGCGCGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCCGAGACGGGCGGATCACCTGAGATCAGTTCAAGACCAGCCTGACCAACATGGTGAAACCCTGTCTCTACTAAAAATACAAAAATTAGCCAGGTGTGGTGACGCCTGTAATCCCAGCTACTCAGGAGACTGAGGCAGGAGAATCGCTTGAACCCGGGAGGCAGATGTTGCAGTGAGCCGAGATCATGCCACTGCACTCCAGCCTGGGCGACAGAGCGAGACACCGTCTCAAAAAAAAAAAAAAATCCCAGTGACCAACCCAGGGCCTCGCCACATCAACAGAGACAAAACGCAGCTCTGGCTCTCAACATCCTCACCCCTCACCAGGTGCCCAGCTTCCCATCCACCCACGTGACCCGCAGGTGTCTGAAAATGCACAAAATGTCCAAATAGGACCACAAGAAGATCTTAAAGACACAAAGAACATTCTACATAGTTTGTCAAATCCAGCATTTGACGGTCCTCTGGGTGACCCGGAGAACACCAAGGCTGTGAGAAATGGGAGGCCTCCTGGCAGCTCCACTCCCCAGACCCGCCTCTGCCAGGGCTCCAGGCTCAGCAGGCGCCTGTGCGGGACAGGGCGACGGTTCAAGACCAAGTCCGGCTGTTAGACCAGACCCTCCAATCCAGGCGGCCTCCCTGCTGGGGTCCTGTGCGGTCAGGAGTCCCAGGGCATCCCAGGGTGGCTGTGCAAACCCTTGTTCCCAAAGATATGGGGCTTGTCCCCCAGCTAGCCTGCCCATGCGGTGGCCACAGCCTCGGGTGAGTTCCGGTTCCAAAGTACCGGCTCTCCCTTACGATCAAGTGTTCGAATGTGCTTGAAGCATTCCAGACACACCAAGGCCTGGACCTGACTTCATTGACGCCTACTTAGGAAAAATTGAGGCAGTCTGCCAAGCTTTCAGCAACTGCTTAAAAAGCTCAAAATGGCAAGTTTTTCCTCGTGAACGTCCTTGTCTTCAGAAGTCTTTTTTTAGACTATCTGGAAAAGCAGGCGATGCAAAGACAAAAGCCCCTCCCCGGGGGGCGGGGGGCAGCACCCTGACAGCAACAAGGATCTCAGAGCTTCAGCCAAGAGCATGGATTTCTCCCCAGGGCTCCCAACAGTACCCTCTGTCCGTGATTCAGGGTCTTACTCTGTCACCCAGGCTGGAGTGCAGTGGTGCAATCATACTTCACTACAGCCTCCAATTCCTGGCTCAAGGGAATCCTCCCACTTCAGCCTCCAGAGTAGCTAGGACCACAGGCACGCGCCACCACGCCCAGGCATGTAAAGATGGGATCTTGCCATGTTGCCCAGGCTGGTCTCAAACTCCTGGGCTCCAGCAACCCACCTGCCTCAGCCTCTCAAAGGGCTGGGATTACAGGCGTGAGCCACCGTGCCCGGCCTTTTCTTTTGTTGTTGTTGTTGTTGGCTGCCAACTTTGGACTCCGGTGCCTTCGCATTCCCGAGCTGTTTTTGCTTCTGGAAGACCAGGGGCATCAGGCATGACTGAAGGACCTGGTCTCCATAAGCTCTGAAACCTGCCGCCCATTAACTCAACCAAAAGTTACGAACCAGCATCATTCACACCACCCCAGCCCCAGGACCTGCTCCGGAGGCCAAGGGCCCAGAGGTCGCCAGACACAAGGCCAGGCACTGGGCAGTTTGGGTTATCTTGTTAGCAAAACTGGGTTCCATTCCCCTTTACTTAAAAAATACATAAAAATATACGTTGGGTTTCAAAAATAAGAAAAAGCATCTCCAGACAAAAAAGACGATCTTCATTTTTAAAACCCATGACGCACTCTCGGGAAGGTGTTCCTGTGCTCTGGGCCTGGGGACGCTGGTGCCACCAGATTCCAGGATGGCCAGGTGGACCCGGGGCCAGTGCTCCCAGCCTTCCTTCTGTGCTGTTCTGTGGGCCCCCAGCCTGCCCTGCCCACAGAGCACGGCAAGCAGGTGGACCCCAGACCCGTGACAGAGAGCCACCTGGACATGCCAGGCCACAGCACTGGGCCACCTTTCCAGTGTGAAACAGGGCTTTAAAAGCCAGCGCTGAGCTCGGCCACCTCTTGACCTTCTGAACGGCTGTGGTTTCCAAACACGGATGGATAACCGGGCCGGGCGCAGGGGTGGCCTACTCACCTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACAGACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGGGACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCCGGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAGACTTCAGTGGGCTCCGGGCCGCACCTGGGCTCCTGTCCTGGGAAGGCGGGCAGTGAAGGCACCTCGTGATCCAGGATCAGCTCCGGGCTCACCGTGCGCAGTAGCTCGGCCCAGAGCCGCTCCCGCTCATCACCCCCCAGGAG +>ENST00000378546 +TTTCATCACAACACAGAGACAGACAGGAGCCCGCCCTGCTTTAATGCGCATGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGAGCGTGTCCGGGCGCCGCACTCTGCGCAGGGCTCTTGGATGGCGCTCACCACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGCCTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACAGACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGGGACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCCGGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAGACTTCAGTGGGCTCCGGGCCGCACCTGGGCTCCTGTCCTGGGAAGGCGGGCAGTGAAGGCACCTCGTGATCCAGGATCAGCTCCGGGCTCACCGTGCGCAGTAGCTCGGCCCAGAGCCGCTCCCGCTCATCACCCCCCAGGAGAAACCAGGGGCGGCCGCCAGAAGGCCCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCGCCGCCTCCATCCAAGCCCGCGCCGGGCGGAAGTGA +>ENST00000378543 +TTTCATCACAACACAGAGACAGACAGGAGCCCGCCCTGCTTTAATGCGCATGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGAGCGTGTCCGGGCGCCGCACTCTGCGCAGGGCTCTTGGATGGCGCTCACCACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGCCTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACAGACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGGGACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCCGGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAGACTTCAGTGGGCTCCGGGCCGCACCTGGGCTCCCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCGCCGCCTCCATC +>ENST00000401813 +TTTCATCACAACACAGAGACAGACAGGAGCCCGCCCTGCTTTAATGCGCATGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGAGCGTGTCCGGGCGCCGCACTCTGCGCAGGGCTCTTGGATGGCGCTCACCACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGCCTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACAGACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGGGACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCCGGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAGACTTCAGTGGGCTCCGGGCCGCACCTGGGCTCCTGTCCTGGGAAGGCGGGCAGTGAAGGCACCTCGTGATCCAGGATCAGCTCCGGGCTCACCGTGCGCAGTAGCTCGGCCCAGAGCCGCTCCCGCTCATCACCCCCCAGGAGAAACCAGGGGCGGCCGCCAGAAGGCCTTGTCCTGCCTGTCCTCAAGTTATCAGCATGACACAGCGGTGCTGGTGATGGTGATGGTGGAGGTTTCAAAGTTGAACCTGATGAAAACGCTCCACTTCTTCGGAGCCATCTGCTGCTGTGGTGACGGAGTTTTGCTTTATTGGAAAATAATTTCTGGTTGGGACTGACACGTGCACAGTGGAAATGAGTTTTTTCTAAGCCAAAATTCATGTTTACAAAAGAACGTTTCAGCTGTGGGAGTTTGCATCCCAGGCAGAGCAGAAGGTGATCGAGTGGGTGGGGGCATCAGAGCCACCCATCTCCTACTCCCGCACCTGCAGACCGGTGGGCTAGGAGGCCCCTTACCCTCTGTGGCAAAAAAGGACACATTTATGGATGATGAATCAGGCCCCAGCCCACTGAGCTGGTTTCAGAAGCCAGGCTGGCCGTAGGTCAGGGAGCCAGGCCTCTCCAACTCCTTCCACCGCGGAAGAACAAGTGTCCCAGCCACTGGCATCCTCAGAGTCACCCAAATGTTCATCTCTGCCCAGCGCTGACACCCTGCAAATCAGGCTAAGACAGCGGTGACGGGCCCTGAGGCTGGCAGGCCTAAGCAGCCCGGTGGCCGTGCACCCTCCCAATTTCCAAATGAGACCTGTGGCCGACAGGCACCCTGGGCACATGCTGAAGGCACTGGGCTGCCTCCACCCCTTCCCATGTGGCTAAATGGCCCAGCACCCACACACGGTGCCCTGGCAGTGCTCACCTGCTGGCAAGGACAGCCAAAAGGCCCGGGCAGCCTTCTGACGCAGCCAGGAACTGGGCTGTGCTCCACCACACCTGCTGGCCCGTGGATGCCAGGCAGGCACGCCCACCCATAGCCAGATGTGGTGGCATTTATGGGATACGGGAGTGCCAGGCAGACAGGCTGTGAGAGACAGTTGCCTGGGAAACATCGCCAGATCTTTGGGGCAGCAGAGCAGGTGCTCGGGCCCACACATGGGGTGCAAGAGTAGGGGTGTGCCTTGGTGCCCTTGGGCACCGACAGCCTCCTCACAGCCTCAGTGGCGGGGTCATGGCACAGGCCTGCCCCTGACCCCAAGAACCAGAAAGCCAGGAGCAGCTGGGGAGGGCCCTGGCCCGGGAGAGACAGCGGTCCTGTTTCTGAACCCCATCCCAGCCATGGCCTGTGTCTGGGCCAGCATCCCCGACCAGACAGGGCCAGCCGCCCTCTCTCAAAGTCCCCAGCACCCCTTCAAGCAGTATCCGGTTCACACCCTCCCACAGCCTGTCCTCCATCCCCACGTGTCGGGCTCAGCTTCCGCACCACTCAGCCCCCACCCAGGGGCGGGCTTTTATCAGCCCCAGATCCTGCTCTGACGTCCCCCCGCCCGGAGAAGCTTCCCCAGCCCAGCCCAGCCCAGCCCAGCCCAGGCTTCTCTCTCCACCCCACTGCCCTGCTGGGAAATTGTGAGCTCAGATGCTGATTGGTCTACCCAGGAGGGCGGTCCTGTGTGCTCTGTTCCCTGGGAAGCCTCTCAGAGTGCGCGGCACCAAGGAGCCGGTCAGGGAGTGGAGACCTCTCAGGGCACCCCTCCTCTGGGGAAGGCAAGTCACAGAAACCAAGCTGGAGGAGCACTGTGGGTTGAGCAGCGTCTCCGAAGACTCATGTCCACCAGTACCTGAGAAAGTGGCCTCGCTCGGAAGCAAGGTCTGTGCCGATATAATCAAACCAGGATGAGGCGATACTGGGTTAGGGTTGGCCCTGAATGCAGTGTGAGCAGTGTTCTTGTAAGAAAAGGAAAATTGTCCGGGTGCAGTGTCTCACGCCTGCAATCCCAGCACTTTGGGAGGCCGAGGCGGGCAGATCACTTGAGGTCAGGAGTTCTAGACCAGCCTGGCCAACATAGTGAAACCCCG +>ENST00000487186 +TTTCATCACAACACAGAGACAGACAGGAGCCCGCCCTGCTTTAATGCGCATGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGAGCGTGTCCGGGCGCCGCACTCTGCGCAGGGCTCTTGGATGGCGCTCACCACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGCCTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACAGACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGGGACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCCGGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAGACTTCAGTGGGCTCCGGGCCGCACCTGGGCTCCTGTCCTGGGAAGGCGGGCAGTGAAGGCACCTCGTGATCCAGGATCAGCTCCGGGCTCACCGTGCGCAGTAGCTCGGCCCAGAGCCGCTCCCGCTCATCACCCCCCAGGAGAAACCAGGGGCGGCCGCCAGAAGGCCTTGTCCTGCCTGTCCTCAAGTTATCAGCATGACACAGCGGTGCTGGTGATGGTGATGGTGGAGGTTTCAAAGTTGAACCTGATGAAAACGCTCCACTTCTTCGGAGCCATCTGCTGCTGTGGTGACGGAGTTTTGCTGCTGGCAAGGACAGCCAAAAGGCCCGGGCAGCCTTCTGACGCAGCCAGGAACTGGGCTGTGCTCCACCACACCTGCTGGCCCGTGGATGCCAGGCAGGCACGCCCACCCATAGCCAGATGTGGTGGCATTTATGGGATACGGGAGTGCCAGGCAGACAGGCTGTGAGAGACAGTTGCCTGGGAAACATCGCCAGATCTTTGGGGCAGCAGAGCAGGTGCTCGGGCCCACACATGGGGTGCAAGAGTAGGGGTGTGCCTTGGTGCCCTTGGGCACCGACAGCCTCCTCACAGCCTCAGTGGCGGGGTCATGGCACAGGCCTGCCCCTGACCCCAAGAACCAGAAAGCCAGGAGCAGCTGGGGAGGGCCCTGGCCCGGGAGAGACAGCGGTCCTGTTTCTGAACCCCATCCCAGCCATGGCCTGTGTCTGGGCCAGCATCCCCGACCAGACAGGGCCAGCCGCCCTCTCTCAAAGTCCCCAGCACCCCTTCAAGCAGTATCCGGTTCACACCCTCCCACAGCCTGTCCTCCATCCCCACGTGTCGGGCTCAGCTTCCGCACCACTCAGCCCCCACCCAGGGGCGGGCTTTTATCAGCCCCAGATCCTGCTCTGACGTCCCCCCGCCCGGAGAAGCTTCCCCAGCCCAGCCCAGCCCAGCCCAGCCCAGGCTTCTCTCTCCACCCCACTGCCCTGCTGGGAAATTGTGAGCTCAGATGCTGATTGGTCTACCCAGGAGGGCGGTCCTGTGTGCTCTGTTCCCTGGGAAGCCTCTCAGAGTGCGCGGCACCAAGGAGCCGGTCAGGGAGTGGAGACCTCTCAGGGCACCCCTCCTCTGGGGAAGGCAAGTCACAGAAACCAAGCTGGAGGAGCACTGTGGGTTGAGCAGCGTCTCCGAAGACTCATGTCCACCAGTACCTGAGAAAGTGGCCTCGCTCGGAAGCAAGGTCTGTGCCGATATAATCAAACCAGGATGAGGCGATACTGGGTTAGGGTTGGCCCTGAATGCAGTGTGAGCAGTGTTCTTGTAAGAAAAGGAAAATTGTCCGGGTGCAGTGTCTCACGCCTGCAATCCCAGCACTTTGGGAGGCCGAGGCGGGCAGATCACTTGAGGTCAGGAGTTCTAGACCAGCCTGGCCAACATAGTGAAACCCCGTCTCTACTAAAAAACACAAAAATTAGCTGGGTGTGGTGGTGGGCGCCTGTAGTCTCAGCTACTCGGGAGGCTGAGGCAGGAGAATCGCTTGAACCCAGAAGGCAGAGGTTGCAGTGAGCCAAGATTGTGCCATTTTACTCCAGCCTGGGCAACAGAGCAAGACTCCGTCTCAAAAAAAAAAGAGAGAGAGAAAGAAAAGGAAAATTGGCCAGGTGCTGTGGCTCATGCCTGTAATTTCAGCACTTTGGGAGGCCGAGGCAGGTGGATCATGTGAGGTCAGGAGTTCGAGACCAGCCTGAAAGACATCGTGAAACCCCATCTCTACTAAAGATACAAAATTAGCTGGGTGTGGTGGTGGGCACCTGTAATCCCAGCTACTTAGGAGGCTGAGGCAGGAGAATCGCTTGAACCCAGGAGGCGGAGGTTGCGATAGGCCGAGATCGTGCTGTTGCACTCCAGCCTGGGCGACAAGAGCAAAACTCTATCTCAAAAAAAAAAAAAAAAAGGTAAGGAAAATTTGGACACAGAGACACAGGAAGGAGGCTTTGGGGTTGGGGGTGGAGCAGCTGCACGCCAGGGAATGCCGGGGGCCCGGGGCTGGAAGGGGCAGGCAGCAGCCACCCAGAGCCTTTAGGCGGAGCTCCACCCTCCCAACCACTGATTTTGGACACCAGCTGCCTGAACTGTGAGAATATACATGTCACTCGTTTTAGGCTCCCAGTGTGTGGTCATTTTTTCACAGCAGCCCCAGGAGACACGCAGCAGGCTCCCGGCTTTCCAAGCCGCCACGCACCAAGTTCAGCTTGAAAACGCTGAGCCCAGCTGGGTGCGGGGAGCCCTCGGTCTCCTGTCCACCACACCCGGAGCTGAGGAAGAGGCTCCCCCATGGGCCAAGAGCTGGAAGGGGGCCCTTGGAGGATCCCCCAAGGTCCTCCAAGTGGGCCAGGAAACCTCTGCAGGTGGAGAGGGTGGCTGGGACCCCCTCGGGAGTCCCCAGGGAAGGTCTGGCTTCTCGGCTCTGTAGAATCAGCTTTGTCCCCAGTTCAGCACGTTTTTATGGGAAATCTGCTGGCTGGGGACAGCCCTTGATGTCCTGAGATGAGATGCTGCCTGGTCCCTGCACCTTCCAGGACCCAGCTCACCTGTGGCGCACAGGTTTCCACTTGTCATAGGAAACTGTGCTTGGTGCATCCCCTGTGCAGCCGGCTGTGAACTGTGGGCTCCAACCCTGCTTGGTTTGCTTCAACTTTCTGAGTGACGTGCAGACCTTCACAGAGGAGCCGTGGGGTGGCTCCATCCAACGCCTCCCTCGCTGCCCCTGGGGTGGAGCTGGGGCAGGTCCCACATTTCTCAGAAGGACTCCAGGATGCAGCTGCGTCTGGGGCCGAGAGAAGGAAGGACGCTGCCCCCAAGGACAGACGGGCAAGCTGGAGTCAGGAGAGGCGCAGCCGTGGCCCACAGGCCTTGGATCTCTCCAAGGCCTGGGCGGCAGGAAAGGGAGAGATGACGTCATTGCCGCCTGGAATCTGCTGTTTGGAGGCGTCGCCATGGAGACCGGAAGGCTCAGGGTGGGTAAAAATAGCAAACCCAAAAGGGTGTAAGTTCCAAGAACGCGAGTCTCTGAAAAGCGAGGCATCCATGTTC +>ENST00000476803 +GACAGGAGCCCGCCCTGCTTTAATGCGCATGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGAGCGTGTCCGGGCGCCGCACTCTGCGCAGGGCTCTTGGATGGCGCTCACCACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGCCTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACAGACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGGGACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCCGGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAGACTTCAGTGGGCTCCGGGCCGCACCTGGGCTCCTGTCCTGGGAAGGCGGGCAGTGAAGGCACCTCGTGATCCAGGATCAGCTCCGGGCTCACCGTGCGCAGTAGCTCGGCCCAGAGCCGCTCCCGCTCATCACCCCCCAGGAGAAACCAGGGGCGGCCGCCAGAAGGCCTGGGGCAGACAGAGAGGGCAGACAGGGGGTACTCAGTAGCGGAAACGCTATGGTGGGGAGACCCGGGAGGGCCTGGGGC +>ENST00000440825 +GCCCTGCTTTAATGCGCATGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGAGCGTGTCCGGGCGCCGCACTCTGCGCAGGGCTCTTGGATGGCGCTCACCACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGCTCTGTCACCCAGGCTGGAGTGCAGTGGTGCAATCATACTTCACTACAGCCTCCAATTCCTGGCTCAAGGGAATCCTCCCACTTCAGCCTCCAGAGTAGCTAGGACCACAGGCACGCGCCACCACGCCCAGGCATGTAAAGATGGGATCTTGCCATGTTGCCCAGGCTGGTCTCAAACTCCTGGGCTCCAGCAACCCACCTGCCTCAGCCTCTCAAAGGGCTGGGATTACAGGCGTGAGCCACCGTGCCCGGCCTTTTCTTTTGTTGTTGTTGTTGTTGGCTGCCAACTTTGGACTCCGGTGCCTTCGCATTCCCGAGCTGTTTTTGCTTCTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACAGACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGGGACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCCGGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAGACTTCAGTGGGCTCCGGGCCGCACCTGGGCTCCCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCG +>ENST00000420515 +TAGGACCACAAGAAGATCTTAAAGACACAAAGAACATTCTACATAGTTTGTCAAATCCAGCATTTGACGGTCCTCTGGGTGACCCGGAGAACACCAAGGCTGTGAGAAATGGGAGGCCTCCTGGCAGCTCCACTCCCCAGACCCGCCTCTGCCAGGGCTCCAGGCTCAGCAGGCGCCTGTGCGGGACAGGGCGACGGTTCAAGACCAAGTCCGGCTGTTAGACCAGACCCTCCAATCCAGGCGGCCTCCCTGCTGGGGTCCTGTGCGGTCAGGAGTCCCAGGGCATCCCAGGGTGGCTGTGCAAACCCTTGTTCCCAAAGATATGGGGCTTGTCCCCCAGCTAGCCTGCCCATGCGGTGGCCACAGCCTCGGGTGAGTTCCGGTTCCAAAGTACCGGCTCTCCCTTACGATCAAGTGTTCGAATGTGCTTGAAGCATTCCAGACACACCAAGGCCTGGACCTGACTTCATTGACGCCTACTTAGGAAAAATTGAGGCAGTCTGCCAAGCTTTCAGCAACTGCTTAAAAAGCTCAAAATGGCAAGTTTTTCCTCGTGAACGTCCTTGTCTTCAGAAGTCTTTTTTTAGACTATCTGGAAAAGCAGGCGATGCAAAGACAAAAGCCCCTCCCCGGGGGGCGGGGGGCAGCACCCTGACAGCAACAAGGATCTCAGAGCTTCAGCCAAGAGCATGGATTTCTCCCCAGGGCTCCCAACAGTACCCTCTGTCCGTGATTCAGGGTCTTACTCTGTCACCCAGGCTGGAGTGCAGTGGTGCAATCATACTTCACTACAGCCTCCAATTCCTGGCTCAAGGGAATCCTCCCACTTCAGCCTCCAGAGTAGCTAGGACCACAGGCACGCGCCACCACGCCCAGGCATGTAAAGATGGGATCTTGCCATGTTGCCCAGGCTGGTCTCAAACTCCTGGGCTCCAGCAACCCACCTGCCTCAGCCTCTCAAAGGGCTGGGATTACAGGCGTGAGCCACCGTGCCCGGCCTTTTCTTTTGTTGTTGTTGTTGTTGGCTGCCAACTTTGGACTCCGGTGCCTTCGCATTCCCGAGCTGTTTTTGCTTCTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACAGACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGGGACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCCGGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAGACTTCAGTGGGCTCCGGGCCGCACCTGGGCTCCTGTCCTGGGAAGGCGGGCAGTGAAGGCACCTCGTGATCCAGGATCAGCTCCGGGCTCACCGTGCGCAGTAGCTCGGCCCAGAGCCGCTCCCGCTCATCACCCCCCAGGAGAAACCAGGGGCGGCCGCCAGAAGGCCCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCGCCGCCTCCA +>ENST00000514625 +TGGTGGAGGTTTCAAAGTTGAACCTGATGAAAACGCTCCACTTCTTCGGAGCCATCTGCTGCTGTGGTGACGGAGTTTTGCTGTGGCGCACAGGTTTCCACTTGTCATAGGAAACTGTGCTTGGTGCATCCCCTGTGCAGCCGGCTGTGAACTGTGGGCTCCAACCCTGCTTGGTTTGCTTCAACTTTCTGAGTGACGTGCAGACCTTCACAGAGGAGCCGTGGGGTGGCTCCATCCAACGCCTCCCTCGCTGCCCCGGTGCAGGCCACCCTGCTGCTCCAGCTCAGTCCAGCACAGGTGTTCTCGCTCTGGGGTTGGCCTGGCGCTGACCTGTGCACCTGACAGGGAAGGTAGGCAGCTCTGGAGCTGGCTGGTGCCCCTCACCTGGGGTGGAGCTGGGGCAGGTCCCACATTTCTCAGAAGGACTCCAGGATGCAGCTGCGTCTGGGGCCTGAGCGGAGGGAAGATATCAGGCTGGGGCCGGCTGCTGGGCCTGTCCTCTCTGAGTTGCCTCAAATCCCCTGTTCCTTGAGCGGTCCTGGAGCCTGGCCTCAGGCCTCAGGGCACCACACTACTTGCCTCCAGGGACCAGCCTGTTCACCCCACACCCAGCCCTGTGACAGAGGTGCTGTCGCGTGGCCCCACTTACAGATGGGTCAACTGAGGCCCGGGGCATCTGTCCACTTGTCATGACAGTGAGCGG +>ENST00000420964 +TGCTGGGATTACAGGCGTGAGCCACTGCGCCAAGAGCAAGCTTCTGATGTAGGGGCTGCGGGGGGCTTCCCAGGCCAGGCAGGTTGCTGTCTCAGCGCCAGCGTGTAGCCTCCTCCCAGGATCCGGAGCAGGAGGGTGGCTGTCTTTTGCGTTCAATCCGCTGGGCTGCTGTGGGGTTCCCGCAGAGCTGCTCCAAGGGGCCGAGAGAAGGAAGGACGCTGCCCCCAAGGACAGACGGGCAAGCTGGAGTCAGGAGAGGCGCAGCCGTGGCCCACAGGCCTTGGATCTCTCCAAGGCCTGGGCGGCAGGAAAGG +>ENST00000378322 +TAGTTGTATAAATCAGCAAGTATTTATTTTAAATAATAAAACTACAGTTTTATACCATACATATTTACAAAAATGCTTTGCTATAGAAAAATAGAATCAATCACTGAATCCAGACCACCACAGTGGAGAACCTCCTGGTGAAGCTGTGTTTTTTCCCACACTGGAAACACAGAGTAGCCCTGTTTCTGCACACGTTAGTGCACCGCTGCTACGTGTGGCCGCCCAGCTGTCTGCAGGCTGTGCCGACCACTGCCTCTGTCTCCAGGAAGCAGAGGCAGAAGTGATCCTTGCTGAGGAGGGCCATCGAGTCTCCGCTTAAATGCCAGCACAGAGAGAGCACTGCAAAGTCGCCTAGAGAGAGACAGGTGGCCAGAGGATTACAGCAGGGGAGGCCCAGATTCTGGGGGATGGGCACCCCCTTGTCCTGCAGGCCAGCACAGTGCCTGGAGTGACCCACATAGGCAGAGCCAGGGTGGAGCCCCAGAGCTGCCTCAAGTCAGGGAGAGGCTGCTTCTAGCCCATAAAGCTGAGGGCAGCGGGTCCCCTGTGTGTCCGTCTTGAGGTTTACGCAAAGACTCTGAGGGCAGTTTCCCTGGAGTGCTGCCGGAGACAGCAGCTGGGCTTCAACAGTTCAGCCCGTGTGATGCCAGACTGCACACAGCAAGGCTGCCACGTCCGTGGCCTCGGGGATGTGCTTACCTTCCCCAGGCACCTGCACCGACATGCAGCCCGCTGGGGACCACAGGTAGAGCCTGCTGCCTCCCGTGCAGATGGCCAGCCGCGGCTGCTGCGGGTCCCACTGAAATGCGCGCACTGGGGACAGCTGCTCGAGCACCGCGAACAGCCTCAGCTTCTGAATGTCCCAGACCCAGACGGCATTGGGAATGTTGTCGTTCCTTGTCGCCAGGAAGTAGCTGTCAGGACTAAATGCCAGCATTCCTATGCCGATTTTCGGGTTTGCTCTGTCGGTAACAGGTTTCAGTGTCTGTAAGGAGACTGGGACAGAGGCGATCTCATATTTACTCTCTGAGCTCGGGAGAGGGCCGGCCCCGGCCCGGGGCGGCGGGAAGGAGAGGCAGCCCAGTCCCAGCTGTGGGCTCTTCTCGGCCTCCTTATACACCACTATCTTGGGATCATTAATGGCTGCAGGATGCCCAAACTCCGTGATCATTTTCCAAGTCACGTGATTAAGGATGCGCACCTTTCCATCATAGCTCCCAACTGCCAGGAACTGACTGCTGGGGCTCCAGGCCACAGACTTGATGCCCAGGGACCACTCGTAAGCGCTGTACGTGGACAACAACCGGCCATCCAATGAGTACAGCAGAATCTTGTACTCCAAGCAGGTGTCCCACACTGCCAGCACACAGCCGTTTGGGGCCCACTCAATCCCTGTGAGATCCTGGGTGTCCGTATCAAAATGCCGCAGGAGCTGCCAATCACTGCAGACGAAGATGCTCACGTAATCTTTGCAGTCGCGCCGTTCTGCCAGCGCCATGTAGCGGCCGTCCCTGGTGAAGGTGATTCCCTGCAGACAAGCTTTCGGGTATTTGATGTAAGACACGGATTTTGTGCACAAGGACCAGACGGTTATCCGCAGATGGAATTCCGTGGTGTTGAGAATGTGGCGCCCGTCCGGGCTCCAGCACGAGGCCACCAGCCCGGCTGAGCCCTCGTCTATTTTGCAGTGCCATTCGGGCTGCTCTAAAGACCAGACCTGCACCAGCCCTCGCTTGTACATGGCGCACAGGATGAAGAGCGAGTCTGCCGACCACTCGATGTGCTGGATCTGGTCTAGGCACGTGTACAGCTGAAGGATCTGAAGGGTGTTCACATCCCGGACCACTAACCGGTACTGGACACAGGAAGCCAGGTACTTGCCGTCCGGGGAGAACTTGCAGAGTAAGCTGGAGAGCTTGAATACCTCGGAGAAGTTCATGGCCGCCGCCTGCCGCGGGCGCCACCCTGCGCCCGAAAACCCGCGGGACCCCTGGGCGC +>ENST00000270708 +TAGTTGTATAAATCAGCAAGTATTTATTTTAAATAATAAAACTACAGTTTTATACCATACATATTTACAAAAATGCTTTGCTATAGAAAAATAGAATCAATCACTGAATCCAGACCACCACAGTGGAGAACCTCCTGGTGAAGCTGTGTTTTTTCCCACACTGGAAACACAGAGTAGCCCTGTTTCTGCACACGTTAGTGCACCGCTGCTACGTGTGGCCGCCCAGCTGTCTGCAGGCTGTGCCGACCACTGCCTCTGTCTCCAGGAAGCAGAGGCAGAAGTGATCCTTGCTGAGGAGGGCCATCGAGTCTCCGCTTAAATGCCAGCACAGAGAGAGCACTGCAAAGTCGCCTTCCCCAGGCACCTGCACCGACATGCAGCCCGCTGGGGACCACAGGTAGAGCCTGCTGCCTCCCGTGCAGATGGCCAGCCGCGGCTGCTGCGGGTCCCACTGAAATGCGCGCACTGGGGACAGCTGCTCGAGCACCGCGAACAGCCTCAGCTTCTGAATGTCCCAGACCCAGACGGCATTGGGAATGTTGTCGTTCCTTGTCGCCAGGAAGTAGCTGTCAGGACTAAATGCCAGCATTCCTATGCCGATTTTCGGGTTTGCTCTGTCGGTAACAGGTTTCAGTGTCTGTAAGGAGACTGGGACAGAGGCGATCTCATATTTACTCTCTGAGCTCGGGAGAGGGCCGGCCCCGGCCCGGGGCGGCGGGAAGGAGAGGCAGCCCAGTCCCAGCTGTGGGCTCTTCTCGGCCTCCTTATACACCACTATCTTGGGATCATTAATGGCTGCAGGATGCCCAAACTCCGTGATCATTTTCCAAGTCACGTGATTAAGGATGCGCACCTTTCCATCATAGCTCCCAACTGCCAGGAACTGACTGCTGGGGCTCCAGGCCACAGACTTGATGCCCAGGGACCACTCGTAAGCGCTGTACGTGGACAACAACCGGCCATCCAATGAGTACAGCAGAATCTTGTACTCCAAGCAGGTGTCCCACACTGCCAGCACACAGCCGTTTGGGGCCCACTCAATCCCTGTGAGATCCTGGGTGTCCGTATCAAAATGCCGCAGGAGCTGCCAATCACTGCAGACGAAGATGCTCACGTAATCTTTGCAGTCGCGCCGTTCTGCCAGCGCCATGTAGCGGCCGTCCCTGGTGAAGGTGATTCCCTGCAGACAAGCTTTCGGGTATTTGATGTAAGACACGGATTTTGTGCACAAGGACCAGACGGTTATCCGCAGATGGAATTCCGTGGTGTTGAGAATGTGGCGCCCGTCCGGGCTCCAGCACGAGGCCACCAGCCCGGCTGAGCCCTCGTCTATTTTGCAGTGCCATTCGGGCTGCTCTAAAGACCAGACCTGCACCAGCCCTCGCTTGTACATGGCGCACAGGATGAAGAGCGAGTCTGCCGACCACTCGATGTGCTGGATCTGGTCTAGGCACGTGTACAGCTGAAGGATCTGAAGGGTGTTCACATCCCGGACCACTAACCGGTACTGGACACAGGAAGCCAGGTACTTGCCGTCCGGGGAGAACTTGCAGAGTAAGCTGGAGAGCTTGAATACCTCGGAGAAGTTCATGGCCGCCGCCTGCCGCGGGCGCCACCCTGCGCCCGAAAACCCGCGGGACCCCTGGGCGCGCAGCAGGCTGCAAC +>ENST00000471223 +TTTTTTTTTTTTTTTTAGCCCTTTACAAATGGAGAAACCCTTAACAAAAGGCGGGCTGCAGTGTGCCCAGCCCTGCTTTCTACTCAGCAGAGTGGAGCAAGTGAGCAGGGTGGAGGCCTCCTGACTCATGCGCGGACCTGCGGCTGCTGCAGGACAAAGGCCCAGCGCCTCCAAGGAGCTTCTGTGAGCACCTCGGCTACTGCAGAAACGTGAAAGGAGGTGACGTGTCGGAAACCCCCAACTTCATTTTCTTTTCCAGTCGCTTCTACACCTGGGGCCACAGGACACAGTAAAGGGTGAGACAGCACCTGCGTCAGCACAACTGACCGTTCCTTGTCGCCAGGAAGTAGCTGTCAGGACTAAATGCCAGCATTCCTATGCCGATTTTCGGGTTTGCTCTGTCGGTAACAGGTTTCAGTGTCTGTAAGGAGACTGGGACAGAGGCGATCTCATCTAGAACACCAACAGGAAGAACACGCCATTGTCACCCTTTCGGGAAGTACGCACGCGGCTGAGAGGCTGCTGTGCCTGCATCGGGCATCGCGAACCCAGCTCCTCTGTTCAAAGGGGAGGAAAGTGCGGCCCAAGGGCAGGAAGAGCTAAGCAAAGCCTGGCAGCCGCAGCGAGGGGCCTGCCCGCAAGTGCCCCGGATGAGAGTGGCACCATCACCTGCCAGGCCCGACTAGGTGGGGGGTGGACCCCACGTGCCAGGGGCTGACTGGAGAGGGACATGGACAGGTCCTAGCTGCAATCTCAGCAGCTCCAACTCCTCAGCACTTTTCTGTCGACTACCAGCATCTGAGTTCACAATCCCTTCCACCTCAGCGTCAGTACCCTTAGACTTTCCGGCTGTGGAAGAACCATCATCACAGCAGAAGCAGGGGCTGTGGAACAAGGACGCCCCTGGGCTCCTGGGGAGCGCCTCCTGTGTGCCAGGCTGCACCTGTCCTGACCCCCATCCTGAGCACACACCGAGCCCCGGGGTGGGCCCGTCGGCACTTGGGGCACCGCTTCCTCTACCTGCAACCTTCAGATGCCCTCATGCCCCTGTGGGATGGGTGCTTTTACTATGCCCATTTCAGCGATGAGGAAACAGACACATAGGAAATGCCCAGAGTCAAGAGGCTGCATCAGAACCGGGCCTCAAGCCGGAGACAGCGCTCGGGAGCACCGCCGGGTTCCAGACCCACTCTGAGCGCCACCCACGGAAAAGTGTTTCTTTGAAAAACATCATTCTCGGAGCTCCGGAAAAACATCCCCTCGGAGCTCCCGCTGTCAGATCCGGGTCTCCAGGGCTCATATTCAGTAACAGAAGCCGCACCTTCACGGCCCACTGCGCAATTCAGACCCTAGTCAACCTCCAGCCAACAGGCTGAGGGGCACACTGGCTGGAAGCATGGAAGGGAAAAAAAGTTTTTTTTTTTAAACATAAGGAACATCCGAAGTTTATCTGGACAACGAGGAATCTTGCATTAAAAAAGGAAAACAAATGACATCACATGTGCTACTTACATTTACTCTCTGAGCTCGGGAGAGGGCCGGCCCCGGCCCGGGGCGGCGGGAAGGAGAGGCAGCCCAGTCCCAGCTGTGGGCTCTTCTCGGCCTCCTTATACACCACCTGAAAGACACAAGGTGGCCACGCCCGGCTCAGGACAGGGACCCGGAAGCCAAGGATGGACGTGGCAAATGCCCATGACAGCGCATGGTCAACAGGTGTGCCTGCCATGACAGCTGGTCCTGCTGCCACCGGGAGAGACGGAAGCACGAACCCCGCAGTCCCGAGAGCTGAGATCACCCAGCCACCCTCTCTCGTGTCCTGCTGAGGAGCCCACCCTTTGAGACACAGGCAGCAAATGTGTGCCCTGTGATTACAGACGGGAGACCACTGCAGCCACCATCATCCAGCAAGGGAGTGGGCTCAGCCTTCCCTCCGTGATAAGAGGATACAGAGAACACTTGCACCAACACAGCAGAGGCCCCGGGAGCAGCAGACACAGACCCGAGGTGGGGGCATCTGTGCCCGAGAGCCTGGCAAGCAAAGGACAGCGGCCCAGGCTCAGTGGAAGGCGGGCAGCCCCTACGCCCCTGAAGAGCCCCAGGTAAGGGAGTCACCTGGCCTGGTTCATGCCTTTAAAGCATGCTCTGCTGCTGTGTGGCGAAGGGATTTGGAGAATGCAGGAATCACAGGCAAACCTTCAGGACCTGTGTGGCCAGCCCTGCTCGGGCTCACCTGTCCAGACACCCTGGCCTCCAGCCACACAAGCCACTGGCCACGTCAGGAGGCCCCTCTGCCTGAAACACCCTTTCTGCCCAGACACCGCGCAGCTCCTCCTCCTGGTCTTCACTTAAACACCCCTCCAGGATGCATCCCCGGCAGTGGCTGATCTGGCATGCGCAGCCCCAGCCACTCACTGGCCTCTTCATCGAATCCAAGCCGCCTTTCACTCAGCTCTGTCGGTTACAGGTCAACACCAGGAGGGCAGCATTTGTCTCTGGCTCCCAGCGCAGTGCCCGCTGCACACATGGATGCGTGGCCCACTCCTCGGGGCCTTTGCATTTCCTGTTCCCTTGGCCTGGAACGCTCCCTCCCCGAGTCCCTGATCACTGGTGCAGCATCTGTGCCTGCGATCCCTCGCTGGTGGCCACTCCCTGCCACCCCGTGGAGACACCCAGCTCTCCAGCCCCTTCCCTGTCTCTCCAGCCGCACTCTGCAAGTGCAGGGGTCTGTCTCTTCTTCTCTGGCTGCGGCCCAGAGCACAGTGCCTGGCACGACAGCAGATGCCCAGTGTTTGGGGGCAGGAGACCCTGGCCACTCTGTACAGCACAGGGATCTGCATCCAGACAGACCACAAAGGAGAAAACTGGACTGGGGTGGCAGCGGCAGAGGACAGGCCAGGGCAAGGCCCACTTCAGACCCTTTGGGCAGCGTGGAGGAGGAAGAACAAAGGCCAGGGCAGGGCCAGACGCGTGAAATGTCACAGTAGCAAGTTTACGGTGATGGAAGTGCCCGGTTAAATAATAAACCACAATCAAGAAAGCAAAGTGAAGGAGCAGTTTCCCACCGCCCTCCCCAACAGCCTGCTCAGGCAGAAACACGTGTTCCAGACTTACTATCTTGGGATCATTAATGGCTGCAGGATGCCCAAACTCCGTGATCATTTTCCAAGTCACGTGATTAAGGATGCGCACCTGAGGAAGGAAACCATGCACAGGTGAGGCAGGGCCCGGCCCGCTGGGCGGTCGGACTTCCTGAGTGCCCTGCACTGGTTCCCACCTTTCCATCATAGCTCCCAACTGCCAGGAACTGACTGCTGGGGCTCCAGGCCACAGACTTGATGCCCAGGGACCACTCGTAAGCGCTGTACGTGGACAACAACCGGCCATCCAATGAGTACAGCAGAATCTTGTACTGCAGATGAGACATTTCAGTTAATAATGAATACACCCCCGTCGCCAGGAACACACCACAGACGCGGGTGCTGCAGAGTGACATTGGTGCAGATAGCACAAAGCTGGCAGGACTGTCCGCGTGGCCGTGGAAAAGCTGGAACTGCCAGCTAGTACTGAGATAGTCACGGAGAGGCAGTGAGAGCATGAGGAAAAAGGGGAAATTGGGAGGTCAACCTAATGGCTCGCTGATAAAAGTTCAACTCGGCCGGGCACTGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCCGAAGCTGGCAGATCACTTGAACACAGAAGTTCAAGAGCAGTCTGGGCAACACGGTGAAACCCCATCTCTACAAAGAATACAAAAATTAGCCGGGCGTGGTGGTGCATGCTTGTGGTCCCAGCTACTTGGGAGGCTGAGGTAGGAGGATCACTTGAGTCCAGGAGGTCGAGGCTGCAGTGGGCCGTGATCACACCACTGCACTCCAGCCTGGGTGACAGAGCAAGACCCTGTCTTTTAAAACAAAGCTCAACTTGTTATCTGAAATAAGATAAAGCAAACTATATTGCAGCATTCAGAAAGCATGAAATTCCGGGAAAAGCTCTCGAAAGCAAACATGTCACCTGGTCATCTTCATACCTCCAAGCAGGTGTCCCACACTGCCAGCACACAGCCGTTTGGGGCCCACTCAATCCCTGTGAGATCCTGGGTGTCCGTATCAAAATGCTTCCAAAGGAAGGGGGGGAAACATTAAATTTGGAAAATATTTTCGTAAATAAATAATTGCATTTATGACTGATGTTCTTAACGCACTTAATTTCCTTATATAGAAATTGACAAAATCTCAACAGCTCTATCCTGGAAATGCATGAAATCCCTGTAGAGCTGCTGCTGGGGCTGCACCGCCACAGATGCCAGCGTCAGTGCCTGGCCAGCCCCCAAGGGCGGCTTGGTCTCCCCGCGCCTGCACTCGTGTGCACACTCTCCCCCTCACCTTTCCTTGCCTGGCCAGCCCCCGAGGGCGGCTTGGTCTCCCCGCGCCTGCACTCGTGTGCACACTCTCCCCCTCACCTTTCCTTGCCTGGCCAGCCCCCGAAGGTGGCTTGGTCTCCCCGCACCTGCACTCATGTGCACACTCTCCCCCTCACCTTTCCTTGCCTGGCCAGGCTCACTCCTTTAGACCCAGCTCAGACAAGTCCCTTCCAGAGCACTGCCTGGATCCCGGGTTCTGCACTCTGACAGCATTCCAGAGGTTGCTCTACCTTAATGATGGATTGTGCTGGAATCGTGTTCATATGTCTGCTGTGGGGGCAGTGCCCTCTGTGCCTGGGCACCTGGCAGAGCGCCCTGCCTAATGCAGGCCCTCAGTCAAGGTGAACTTCCACGTCCCCCCAACTCCCGACGTGGCACACACATGCGCAAACACCATCACACAGGACAAGGAAAAGGGCTCAAATGTGACAGCATATTCACTTTTAAAACACCTGGGCACGCGTCCTTTTCACCAAGTCTCCTGAACACACAACCGGGTGCCACTGGAAGTGATTCGCAGCGCACCTGCCCTTTGTTAATACAACATCACCTTGCTCCATATCCTACCAAAGATCCCCTGGAATCTGGAAGGATCTACTTCACTCGATCCCTCCACAGTCAGCAGGACAACTTTATTCCAGTCTGGGGGACGCCTTACCCGCAGGAGCTGCCAATCACTGCAGACGAAGATGCTCACGTAATCTTTGCAGTCGCGCCGTTCTGCCAGCGCCATGTAGCGGCCGTCCCTGGTGAAGGTGATTCCCTGCAGACAAGCTTTCGGGTATTTGATGTAAGACACGGATTTTGTGCACAAGGACCAGACGGTTATCCGCAGCTGTTGGGGGAAAGGGGAAAGAGAAAGGAAACACTTCTTTAGCATCATCAGAGACCGTCTCAATCCTCAACCCGCCCACGCGTCCCCAAGCACAGGCCTGACTGCTGGAGTGGATCTATCAGGACCTGGGGGATGCCTGCCCTCCTACCGGAATATTCAAATGCGTATTTTACTGTGGTTACGGTAAATTTGGTGTTCTTGGTTTTCTGTTGTTGTTGTTTTATACCAAAATTGAGTGACACAAAGTTAAATCCAAGTGCTTTTTCATTAGCTTTTTCAAAGTGACCATAGGTTGCATGTTATAATAACCCTGAGTTACTCAGAGAAAAATCTTGATCTAGAAACCACCACGGGTTCAGTCTCCTTTATGGGAAGACAGAGGATCTGGAGATTGGATGCAGCCACTCCGGGACTCACCAGGGGGCTGTGAGCCTGCATCTGCAGCCCTGAGGCAGGAGCAGCCACTCAACACCCAAGAAGGTGTCCGTCTGCCTCCTGCGTGTGCTCGCTGGCCTGGCTGCATCTGCAGAGGGTTCTAGAACATGCGCTGCTGGACTGTCCACTTTTCCACCCCTTTCCCTGACTCAGGGAGCTGAGAGCTGACTAGGCTGGCACAGTGAGGCCAAAAGATGATTTTCTAACCAGGCCGACGAGGGCGTGCCTGCTGAGGGAGAGGCACCGCAGTGGGTGGTCCAGCCCTCCCCGTGGCAGCGCCGCGGGACTTCCAGGGCTGCTGTGTCCCTCCACCTGCATTTCCCACTGAGACCCCGTGGAGCCTACCAGGGAATCATCTTGCTTCCCAC +>ENST00000424367 +CGTTCCTTGTCGCCAGGAAGTAGCTGTCAGGACTAAATGCCAGCATTCCTATGCCGATTTTCGGGTTTGCTCTGTCGGTAACAGGTTTCAGTGTCTGTAAGGAGACTGGGACAGAGGCGATCTCATATTTACTCTCTGAGCTCGGGAGAGGGCCGGCCCCGGCCCGGGGCGGCGGGAAGGAGAGGCAGCCCAGTCCCAGCTGTGGGCTCTTCTCGGCCTCCTTATACACCACTATCTTGGGATCATTAATGGCTGCAGGATGCCCAAACTCCGTGATCATTTTCCAAGTCACGTGATTAAGGATGCGCACCTCCAAGCAGGTGTCCCACACTGCCAGCACACAGCCGTTTGGGGCCCACTCAATCCCTGTGAGATCCTGGGTGTCCGTATCAAAATGCCGCAGGAGCTGCCAATCACTGCAGACGAAGATGCTCACGTAATCTTTGCAGTCGCGCCGTTCTGCCAGCGCCATGTAGCGGCCGTCCCTGGTGAAGGTGATTCCCTGCAGACAAGCTTTCGGGTATTTGATGTAAGACACGGATTTTGTGCACAAGGACCAGACGGTTATCCGCAGATGGAATTCCGTGGTGTTGAGAATGTGGCGCCCGTCCGGGCTCCAGCACGAGGCCACCAGCCCGGCTGAGCCCTCGTCTATTTTGCAGTGCCATTCGGGCTGCTCTAAAGACCAGACCTGCACCAGCCCTCGCTTGTACATGGCGCACAGGATGAAGAGCGAGTCTGCCGACCACTCGATGTGCTGGATCTGGTCTAGGCACGTGTACAGCTGAAGGATCTGAAGGGTGTTCACATCCCGGACCACTAACCGGTACTGGACACAGGAAGCCAGGTACTTGCCGTCCGGGGAGAACTTGCAGAGTAAGCTGGAGAGCTTGAATACCTCGGAGAAGTTCATGGCCGCCGCCTGCCGCGGGCGCCACCC +>ENST00000497940 +GGGGCTGTGGAACAAGGACGCCCCTGGGCTCCTGGGGAGCGCCTCCTGTGTGCCAGGCTGCACCTGTCCTGACCCCCATCCTGAGCACACACCGAGCCCCGGGGTGGGCCCGTCGGCACTTGGGGCACCGCTTCCTCTACCTGCAACCTTCAGATGCCCTCATGCCCCTGTGGGATGGGTGCTTTTACTATGCCCATTTCAGCGATGAGGAAACAGACACATAGGAAATGCCCAGAGTCAAGAGGCTGCATCAGAACCGGGCCTCAAGCCGGAGACAGCGCTCGGGAGCACCGCCGGGTTCCAGACCCACTCTGAGCGCCACCCACGGAAAAGTGTTTCTTTGAAAAACATCATTCTCGGAGCTCCGGAAAAACATCCCCTCGGAGCTCCCGCTGTCAGATCCGGGTCTCCAGGGCTCATATTCAGTAACAGAAGCCGCACCTTCACGGCCCACTGCGCAATTCAGACCCTAGTCAACCTCCAGCCAACAGGCTGAGGGGCACACTGGCTGGAAGCATGGAAGGGAAAAAAAGTTTTTTTTTTTAAACATAAGGAACATCCGAAGTTTATCTGGACAACGAGGAATCTTGCATTAAAAAAGGAAAACAAATGACATCACATGTGCTACTTACATTTACTCTCTGAGCTCGGGAGAGGGCCGGCCCCGGCCCGGGGCGGCGGGAAGGAGAGGCAGCCCAGTCCCAGCTGTGGGCTCTTCTCGGCCTCCTTATACACCACTATCTTGGGATCATTAATGGCTGCAGGATGCCCAAACTCCGTGATCATTTTCCAAGTCACGTGATTAAGGATGCGCACCTTTCCATCATAGCTCCCAACTGCCAGGAACTGACTGCTGGGGCTCCAGGCCACAGACTTGATGCCCAGGGACCACTCGTAAGCGCTGTACGTGGACAACAACCGGCCATCCAATGAGTACAGCAGAATCTTGTACTCCAAGCAGGTGTCCCACACTGCCAGCACACAGCCGTTTGGGGCCCACTCAATCCCTGTGAGATCCTGGGTGTCCGTATCAAAATGCCGCAGGAGCTGCCAATCACTGCAGACGAAGATGCTCACGTAATCTTTGCAGTCGCGCCGTTC +>ENST00000469643 +AAACATAAGGAACATCCGAAGTTTATCTGGACAACGAGGAATCTTGCATTAAAAAAGGAAAACAAATGACATCACATGTGCTACTTACATTTACTCTCTGAGCTCGGGAGAGGGCCGGCCCCGGCCCGGGGCGGCGGGAAGGAGAGGCAGCCCAGTCCCAGCTGTGGGCTCTTCTCGGCCTCCTTATACACCACTATCTTGGGATCATTAATGGCTGCAGGATGCCCAAACTCCGTGATCATTTTCCAAGTCACGTGATTAAGGATGCGCACCTTTCCATCATAGCTCCCAACTGCCAGGAACTGACTGCTGGGGCTCCAGGCCACAGACTTGATGCCCAGGGACCACTCGTAAGCGCTGTACGTGGACAACAACCGGCCATCCAATGAGTACAGCAGAATCTTGTACTGCAGATGAGACATTTCAGTTAATAATGAATACACCCCCGTCGCCAGGAACACACCACAGACGCGGGTGCTGCAGAGTGACATTGGTGCAGATAGCACAAAGCTGGCAGGACTGTCCGCGTGGCCGTGGAAAAGCTGGAACTGCCAGCTAGTACT +>ENST00000494884 +CAAGAAAGCAAAGTGAAGGAGCAGTTTCCCACCGCCCTCCCCAACAGCCTGCTCAGGCAGAAACACGTGTTCCAGACTTACTATCTTGGGATCATTAATGGCTGCAGGATGCCCAAACTCCGTGATCATTTTCCAAGTCACGTGATTAAGGATGCGCACCTTTCCATCATAGCTCCCAACTGCCAGGAACTGACTGCTGGGGCTCCAGGCCACAGACTTGATGCCCAGGGACCACTCGTAAGCGCTGTACGTGGACAACAACCGGCCATCCAATGAGTACAGCAGAATCTTGTACTGCAGATGAGACATTTCAGTTAATAATGAATACACCCCCGTCGCCAGGAACACACCACAGACGCGGGTGCTGCAGAGTGACATTGGTGCAGATAGCACAAAGCTGGCAGGACTGTCCGCGTGGCCGTGGAAAAGCTGG +>ENST00000465916 +TGGCTGCAGGATGCCCAAACTCCGTGATCATTTTCCAAGTCACGTGATTAAGGATGCGCACCTTTCCATCATAGCTCCCAACTGCCAGGAACTGACTGCTGGGGCTCCAGGCCACAGACTTGATGCCCAGGGACCACTCGTAAGCGCTGTACGTGGACAACAACCGGCCATCCAATGAGTACAGCAGAATCTTGTACTCCAAGCAGGTGTCCCACACTGCCAGCACACAGCCGTTTGGGGCCCACTCAATCCCTGTGAGATCCTGGGTGTCCGTATCAAAATGCCGCAGGAGCTGCCAATCACTGCAGACGAAGATGCTCACGTAATCTTTGCAGTCGCGCCGTTCTGCCAGCGCCATGTAGCGGCCGTCCCTGGTGAAGGTGATTCCCTGCAGACAAGCTTTCGGGTATTTGATGTAAGACACGGATTTTGTGCACAAGGACCAGACGGTTATCCGCAGATGGAATTCCGTGGTGTTGAGAATGTGGCGCCCGTCCGGGCTCCAGCACGAGGCCACCAGCCCGGCTGAGCCCTCGTCTATTTTGCAGTGCCATTCGGGCTGCTCTAAAGACCAGACCTGCACCAGCCCTCGCTTGTACATGGCGCACAGGATGAAGAGCGAGTCTGCCGACCACTCGATGTGCTGGATCTGGTCTAGGCACGTGTACAGCTGAAGGATCTGAAGGGTGTTCACATCCCGGACCACTAACCGGTACTGGACACAGGAAGCCTGGGCTCGCAGCTCCGAAGCTGGGAGGTGAGGGGAGAGCGATCGGGGA +>ENST00000419924 +AATGAGTACAGCAGAATCTTGTACCGCAGGAGCTGCCAATCACTGCAGACGAAGATGCTCACGTAATCTTTGCAGTCGCGCCGTTCTGCCAGCGCCATGTAGCGGCCGTCCCTGGTGAAGGTGATTCCCTGCAGACAAGCTTTCGGGTATTTGATGTAAGACACGGATTTTGTGCACAAGGACCAGACGGTTATCCGCAGATGGAATTCCGTGGTGTTGAGAATGTGGCGCCCGTCCGGGCTCCAGCACGAGGCCACCAGCCCGGCTGAGCCCTCGTCTATTTTGCAGTGCCATTCGGGCTGCTCTAAAGACCAGACCTGCACCAGCCCTCGCTTGTACATGGCGCACAGGATGAAGAGCGAGTCTGCCGACCACTCGATGTGCTGGATCTGGTCTAGGCACGTGTACAGCTGAAGGATCTGAAGGGTGTTCACATCCCGGACCACTAACCGGTACTGGACACAGGAAGCCAGGTACTTGCCGTCCGGGGAGAACTTGCAGAGTAAGCTGGAGAGCTTGAATACCTCGGAGAAGTTCATGGCCGCCGCCTGCCGCGGGCGCCACCCTGCGCCCGAAAACCCGCGGGACCCCTGGGCGCGCAGC +>ENST00000479331 +TTTAAATGTTCTTAAACTTTAGAGAACGTTATAATTTCAAAAGAAAACTGGCTTTGAGCTGCACGGACTTTTTTTTCAAACTAGAAAGGCACAGAACAAAACCCCTCCTTCCCAGGGGCCCTCAGAAGGTGTCCAGATTCTAAGCGACACGGCAGCACACACCTGCACCAGCCCTCGCTTGTACATGGCGCACAGGATGAAGAGCGAGTCTGCCGACCACTCGATGTGCTGGATCTGGTCTAGGCACGTGTACAGCTGAAGGATCTGAAGGGTGTTCACATCCCGGACCACTAACCGGTACTGGACACAGGAAGCCAGGTACTTGCCGTCCGGGGAGAACTTGCAGAGTAAGCTGGAGAGCTTGAATACCTCGGAGAAGTTCATGGCCGCCGCCTGCCGCGGGCGCCACCCTGCGCCCGAAAACCCGCGGGACCCCTGGGCGCGCA +>ENST00000377837 +TTTTTTTTTTTTTTTTTTTTTTGAGACGGAGTCTCGCTCTGTCGCCCAGCCTGGAGTGCAGTGGCGTGATCTCGGCTCACTGCAAGCTCCACCTCCCAGGTTCATGCCATTCTCCTGCCTCAGCCTCCCGAGTAGCTGGGACCACAGGTGCCCGCCCCCACGCCCGGCTAATTTTTTGTATTTATAGTAGAGATGGGGTTTCACCGTGTTAGCCAAGATGGTCTCGATCTCCTGACCTCGTGATCTGCCCGCCTCGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACCGCGCCCGGCCCATCTTAACCATATTTAAGCATCATGCACATTCACATTGCGGTGTAGCCATCAGCAGCATCCATCTCCAGAGCTCTTTTCCTCTTGCAAAACTGAATCTCTGTACCCATGAAGCACCAACTCCCCATTCTTCCCACCCCCCAGCCCCTGCCAACCACCATTCTTAGATGTGATATCTTTGTTAGAGCAGATTAACTTGCTCTCAGGTGTATGGTCTGCGGCCATTGACTCAAGCACAGGGAATGAGAACTTCTGGAAGTGGGCCTGGACATCTGAATTGCACAGGCTTCCCAGATAGGTACGAAGGAACAAGAAACAAAACAAACATTACCGCAAATGAAACACTGTGTAAATATGTGGATTACATCCTGTAAGTACGAAGAGAATGGAAGGCATTTATCTTGTTATTGTCACTGGGGCAGATCCGGAGTCAGCTCTGGGCGGAGATGGATTTACCCTGGAGCTGCTGAAGCTTAAGCTGGGGGCTGCTCAGGAGCCTGGATGTAGAGTAGGAAGCAGTTCTGAGCATGGAGGGGAAGCCAGGTGTGCCAGCCAGAAGCATCCTCCCGGCCCAGCAGCGGCAGGATGAGCCCCTTAAGCTGGCTCAGGCTCTGGTTGATGCGCGCGCGCCGGCGCTTCTCCAGCAGCGGCTTCAGGCTCTTGCGCAGCTCCGCCGCGTCCCCTGCCCGGCGAGGCAGCCCCATGCTCCGCGGGGAAGCGGTGGCAGCTCTGGAATTGCGTCGCCGGCGCCTGGAACCGCAGTTAGCGGGCACTGGGCAGATGAATGAATTTGTCTGTGCCTGGACGGCTCTCCAATTCGAACCCAGTTTTGCTGCCCTCTGGGGTCTCAACTGTTACGTGAGGCAAATTAGGAGAGAAGCCCCTGGGCACCTTGCCCCAGTCGCACGAGTGTCCCCGCG +>ENST00000377836 +CACAGGCTTCCCAGATAGGTACGAAGGAACAAGAAACAAAACAAACATTACCGCAAATGAAACACTGTGTAAATATGTGGATTACATCCTGTAAGTACGAAGAGAATGGAAGGCATTTATCTTGTTATTGTCACTGGGGCAGATCCGGAGTCAGCTCTGGGCGGAGATGGATTTACCCTGGAGCTGCTGAAGCTTAAGCTGGGGGCTGCTCAGGAGCCTGGATGTAGAGTAGGAAGCAGTTCTGAGCATGGAGGGGAAGCCAGGTGTGCCAGCCAGAAGCATCCTCCCGGCCCAGCAGCGGCAGGATGAGCCCCTTAAGCTGGCTCAGGCTCTGGTTGATGCGCGCGCGCCGGCGCTTCTCCAGCAGCGGCTTCAGGCTCTTGCGCAGCTCCGCCGCGTCCCCTGCCCGGCGAGGCAGCCCCATGCTCCGCGGGGAAGCGGTGGCAGCTGCGAGCCCCACGCAAAGGGAAACCGAGGTCCGAAATGAGGTCCCGGGCGCGGCCCGGG +>ENST00000471190 +CCGCAAATGAAACACTGTGTAAATATGTGGATTACATCCTGTAAGTACGAAGAGAATGGAAGGCATTTATCTTGTTATTGTCACTGGGGCAGATCCGGAGTCAGCTCTGGGCGGAGATGGATTTACCCTGGAGCTGCTGAAGCTTAAGCTGGGGGCTGCTCAGGAGCCTGGATGTAGAGTAGGAAGCAGTTCTGAGCATGGAGGGGAAGCCAGGTGTGCCAGCCAGAAGCATCCTCCTGACTCAGGCTCCCCCGAGTGCCTGACCCTGTGAGTCACTGGCCCATCTACAATCCTTCTCCCCGTGACTGCTTGAGTTGTAGCTTGATTGGAGCCAGGTCAATGCAAGTCA +>ENST00000377834 +TTTTATTGCAGTTCACTTTATTGCACGTCAAGATATTGCCTTTTTTTTTTTTTAAACAAATTGAAGGTTCGGGGTAACTCCAGAGTCAAGCAAGTCTATTGGCAACATTTTCCCACGAGCATGTGCCCACTTTGTATCTGTGTGTCACACTTTCGCAATTCTTGCAATATTTCAAACTTCTTCCTTATTATATCTGTTGTGAAGCTGGTTCTCCCAGACGTTCCCTGCAGGCTGTTTATGCAGCGCCCATCCGAGATGAACCCACAGGACACTCAGGATCCCAGACTGCAGGAGTCGTCTGGGATCACAGGCGGGGCAGAGCAATTTGTCAATGTTTATGAGGAGTCCTCCTTGGCAGCCCAGTCTTTATCCTCACTCACGTGGAAATGAGATTCGACCTCTCCTAATCACCTGGTGCCCGAGGAGCAGGTAGGCGCCTGTCCCAAGCCTGAGTTTCCTGGGAAATCTACATTTCAGCACAGATGGGTTCCCAGCAGCTTAGTGCTCTGGCTGTCCTTAGGTCACTGAATCATTTCACCCGCTAGTTTTTTGTTTGTTTGTTTTTGAGATGGAGTCTTGCTCTGTCACCCAGGCTGGAGTGCAGTGGCGCGATCTCGGCTCACTGCAACCTCCACCTCCTGGGTTCAACTGATTATCCCTCCTCAGCCTCCCAAGTAGCTGGGGTTACAGGCACCCGCCGTCATGCCCAGCTAATTTCCATATTTTTGTAGAGACGGGGTTTCACCATGTTGGTCAGGCTGGTCTTGAACTCCTGACCTCAGGTGATCCGCCCACCTTGGTCTCCCGAAGTGCTGGCATTACAGACGTGAGCCACTGCGCCCGGCCTTGCCCACTGGTTTTATGAGAAAGAGACATGGGAGCCTTTTCCCCAGCTGGGGCAATCATCAGACAGTCACATGGAGTCACAGAACCATCTTGCAACAGCATCCCAAGACCTGGCCATTGGGCAGGATGTGGGACTTGTGAAAGGTCATAAATGACCCTTTGAATCAGTCTCCCTCTGCACAGGAAAAGCCCACCGCCCTGCGTTCACCTTTGCCCATCAGATAGGGCTTGGGGGGCACCTGAGGAGGAGGTGCCTGCCACTGCCTGTGGAGGAGGATGTTGGCGTTCCTATTTCACAAGCCCGGCTTGGAGAGCCAGCGGAGACCTTCTGCGCAGCTAGCTCTTGCACACACCCCTGCGGAGAAACTCTGCCTTCTTGCCTGGGGCCCAGAACCTTACCCACCCAGGCTTGCCCCCTCCCTTCCAGGGCCCACTGACCTCCTGACTCAGGCTCCCCCGAGTGCCTGACCCTGTGAGTCACTGGCCCATCTACAATCCTTCTCCCCGTGACTGCTTGAGTTGTAGCTTGATTGGAGCCAGGTCAATGCAAGTCACAGAACTGCGAACTGAGATGGACTCTCAGAAGCAAGAGGTGGCAAGCATGGCGGAGAGGAAGCGAGGGTCCTCCTGGCTGGTTAGATCTTACAGAGTTTAAGCTGTACTGAGAGTTTTTATGAGGACAAGGGGCCAGTCCTGTGCCTGCCTGATGTGGAGTCCTAGGCGGGCTTGGGCCGCAGGTTACCTGCTCCCGGAGGCTCACAAAGGCAGTGCCAACAGGCGCTCATTCTCAGCAATGGGTGAAAGTAAGAGGAACCTGCCCTCCCTCCTCTCCACACCTCCCCAGTATTTGTCCTCATGGAGTAAATATCCAACAGTGATCCCAGGGCATGGGAGTGGGAGTTAAGGCAAATGCCAGACTGTCCAAGGCTCATTACAGGGTAGTCCTCTCATCCTCTGCTCACTAGTCCACTATATTCAGTGAGCACCCACTGTGCACCCTGTGCCTTGGGGACGTGGAGGCACGCTCAGCCCCAGCCTCGCCCTCCGGGAGCTTACAGTCTAACCCTCTGGGCACAGGGAGGTGGGAAGATGGCACGGCCTTGCTGGGAGCCTCACCCTGTTGGCTGAACAATGATTTTTTCAATAATGCCTACAGCTTCCTTCATATCCTGCCACCCAAACCAGTGCCAAGGTCATCATGGGCTTGTGTGGCACAGTCAGATTTAGTGACCATCCCCACTCCCACATTGGTTCTGTCTTCTTGCCCCCGGTGCTCTGGTCCCTAGCACAGGCTGCTGATTTGGGGACTCGGGGGAGAATCCTCCACCTTCTGCAAATGCTTAGCCATGAAATGACGGGTGTTTGCCTGACTATGATTTCATGAATCCCCCATGAAATGATGGGTGTTTGCCTGATTATGGGCCAACAGTGCCCCCCACTCCTCGTGGGCACTCCTGGGATCAGCAGCCCCTTCCTAGCCTTCACAGGGACTCTAGGCCTCCATGGAAAAGAAAGAAATAAAAAATTTTTTTTGAGACAGAGTCTTGCTGTGTCACCCAGGCTGGAGAGCAATGGCTCAATCTTGGCTCACTGCAACTTCAGCCTCCGAGGTTCAAGTGATTCTCTTGCCTCAGCCTCCCGAGTAGCTGGCACATGCCACCACACCCGGCTAATTTTTGTATTTTTAGTAGAGACGGGGTTTCACCATATTGGCTAAGCTGGTCTCGAACTCCTGACCTCAGGTGATCCACCCGCCTTGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACCGCGCCCGCCCAGAAAGAAAAATCTTAACAAGTTGCTTCCAGTAACCAGTCTCAATGAGTAGCAGGGAGTAGTTTGCAAGAAAAAAAAACAAGTGAAGATGTTTCCCATTCTTTAACCTGCTCCATCCCTCAAATTCCTGCTGCTCCATGGCAGGGGCCCTGCTCACCCCACATTGGCACAGACTCTGCTGGAGTCAGATCCTCCAAAGCCACAAGCTTCCTTGAGGCCACGGGGCCGCCTCATTCTTGTTCTGCCCCTTCCTCACACTGAAAGACTGCATAGCCTGGGGTGCAATGCCCAGGTGTGAAATTGATGCTCGGGAAAACAAATCCTTCCCAAAGTCACTTAAGGAATCCCCCAGCCCCACCGCACAGACCCCTGGATGTATACTGCCCCTATAATTCTGCTCTAGGCAGAAAAGCCTAGGAGTGGAGGTGACAGCTCCCAGCATATGCACCCTTTTGCTCTGCTCTGCTGCCCTGTAGAGCCCTGGAAGTGACCAGAGCCCTTAGGCTACTGCTGCTGCATGCCCAGAGGGTCCCAAGCAGAGCTGGGCAGGAGGTAGGCCCAGGCAGGGCTGGGAGAGCAGTGACCAGGCAGGGTGCACGGCTGCACTTTGCCCAGGTCCTGGCTCTGGCTCTGGTCTGGTGCCAGTGCTGGGGTGGGTGTGTCGGCTGCCCACGCAGCTGCGGGGTCCAGTTCCAGAACTATCTCCACCAGCTGGGATGGGGGGCTTCTTCTTCACCCTGCTGCCTCTTGTCCTTTCTTCTCCAGCCAAGTTGGGGGTGAAGCAGGGACGCTCCTTTTATTCCCTGAGCCGAGCCCCAGCCCCAGGGCTTTCAGTCTGCCACGCCAGTCACAAACAGCCGGCTTCCGGCCTGGGTGTGGGTACTGGGCTGGCCCCTAATGATGGGAACAGCAGCCGCCACCAAGAGCTTCAACCTGTCCAGTGCCCCAAGGTCCCAAGCAGTCGGCAGGGTCTGTGGATCGGCCGAGGGGCTACCACGGCCGCCAGAGGCCAGGGCCGCAGGGAGGCGAGGGCGGCGAGGGCACCGGAGCGGATGCGGGCTCTGGGGCAGACGCGGGCGCTGGGGCGGGGGCAGACGGGCCACTGGAATCCCCAGCGCGCCCGCCGTCCAGGGTGGCGCTGGCCGCTCTCCGCCACAGGTGCTCCAGCAGGCGCGCGCTCACGGCGGGCTCCAGGACACGGCAGGCGGGCAGCACGCGGGCCAGGCGCGCCACACAGGCGCTGTAGCCCTCGCGGTAGCTGTCGCAAGGCAGGGGCGCTGCCGTGGGCCATGAGGACGCAGGCAGCTCCTGCAGGAAGCGCACGGTCATTTCCAGGACGTCTGCCTTCTCTAGCTTCGAGCAGTTGGAGTTCTCCCGGCCCAGCAGCGGCAGGATGAGCCCCTTAAGCTGGCTCAGGCTCTGGTTGATGCGCGCGCGCCGGCGCTTCTCCAGCAGCGGCTTCAGGCTCTTGCGCAGCTCCGCCGCGTCCCCTGCCCGGCGAGGCAGCCCCATGCTCCGCGGGGAAGCGGTGGCAGCTGCGAGCCCCACGCAAAGGGAAACCGAGGTCCGAAATGAGGTCCCGGGCGCGGCCCGGGCTGGTGCCAGACGAGT +>ENST00000487437 +CCAAGCAGAGCTGGGCAGGAGGTAGGCCCAGGCAGGGCTGGGAGAGCAGTGACCAGGCAGGGTGCACGGCTGCACTTTGCCCAGGTCCTGGCTCTGGCTCTGGTCTGGTGCCAGTGCTGGGGTGGGTGTGTCGGCTGCCCACGCAGCTGCGGGGTCCAGTTCCAGAACTATCTCCACCAGCTGGGATGGGGGGCTTCTTCTTCACCCTGCTGCCTCTTGTCCTTTCTTCTCCAGCCAAGTTGGGGGTGAAGCAGGGACGCTCCTTTTATTCCCTGAGCCGAGCCCCAGCCCCAGGGCTTTCAGTCTGCCACGCCAGTCACAAACAGCCGGCTTCCGGCCTGGGTGTGGGTACTGGGCTGGCCCCTAATGATGGGAACAGCAGCCGCCACCAAGAGCTTCAACCTGTCCAGTGCCCCAAGGTCCCAAGCAGTCGGCAGGGTCTGTGGATCGGCCGAGGGGCTACCACGGCCGCCAGAGGCCAGGGCCGCAGGGAGGCGAGGGCGGCGAGGGCACCGGAGCGGATGCGGGCTCTGGGGCAGACGCGGGCGCTGGGGCGGGGGCAGACGGGCCACTGGAATCCCCAGCGCGCCCGCCGTCCAGGGTGGCGCTGGCCGCTCTCCGCCACAGGTGCTCCAGCAGGCGCGCGCTCACGGCGGGCTCCAGGACACGGCAGGCGGGCAGCACGCGGGCCAGGCGCGCCACACAGGCGCTGTAGCCCTCGCGGTAGCTGTCGCAAGGCACTCCCGGCCCAGCAGCGGCAGGATGAGCCCCTTAAGCTGGCTCAGGCTCTGGTTGATGCGCGCGCGCCGGCGCTTCTCCAGCAGCGGCTTCAGGCTCTTGCGCAGCTCCGCCGCGTCCCCTGCCCGGCGAGGCAGCCCCATGCTCCGCGGGGAAGCGGTGGCAGCTGCGAGCCCCACGCAAAGGGAAACCGAGGTCCGAAATGAGGTCCCGGGCGCGGCCCGGGCTGG +>ENST00000489730 +AGGGTCTGTGGATCGGCCGAGGGGCTACCACGGCCGCCAGAGGCCAGGGCCGCAGGGAGGCGAGGGCGGCGAGGGCACCGGAGCGGATGCGGGCTCTGGGGCAGACGCGGGCGCTGGGGCGGGGGCAGACGGGCCACTGGAATCCCCAGCGCGCCCGCCGTCCAGGGTGGCGCTGGCCGCTCTCCGCCACAGGTGCTCCAGCAGGCGCGCGCTCACGGCGGGCTCCAGGACACGGCAGGCGGGCAGCACGCGGGCCAGGCGCGCCACACAGGCGCTGTAGCCCTCGCGGTAGCTGTCGCAAGGCACTGCGGGCGGAGAGCCGCGTGAGGCGCGGGGTAGGGTGCCGGGTGCGGGGTGCAGAGCGCGCGGCAGGGCAGGGAGGGCTCACTCACGGGGCGCTGCCGTGGGCCATGAGGACGCAGGCAGCTCCTGCAGGAAGCGCACGGTCATTTCCAGGACGTCTGCCTTCTCTAGCTTCGAGCAGTTGGAGTTCTCCCGGCCCAGCAGCGGCAGGATGAGCCCCTTAAGCTGGCTCAGGCTCTGGTTGATGCGCGCGCGCCGGCGCTTCTCCAGCAGCGGCTTCAGGCTCTTGCGCAGCTCCGCCGCGTCCCCTGCCCGGCGAGGCAGCCCCATGCTCCGCGGGGAAGCGGTGGCAGCTGCGAGCCCCACGCAAAGGGAAACCGAGGTCCGAAATGAGGTCCCGGGCGCGGCCCGGGCTGGTGCCAGACGA +>ENST00000635687 +TTACATTTTTAATAGACTTTTATTTTGGAATAATTGTAGATTTACAGAAAAGCTGCAAAGAATAGTACAGAGAGTTCCCTCAAATTCTTCGCCCAGTTTCCTCTAACATTTGCATCTTACACAGCCATGGCACATTTGTCAAAACTAAGAAATTAACACTGGTATTACTTTTAACTAAAGGCTTTTTTGGATTTTACCAGTTTTTTCACTCATGCCTTGTTTTGTTCCAAAATCCAACCCAGGATATCACACTGCATTTAATCAAATGTAAATACGTATGCTTTAACTTTTTTATTTTAAAATAATCATAGATTTACAGGAAATTGCAACAACAACAAAAAAAGTACAGAGATTCTGTGTACCCTTCCCCCAGTTTCGTTCAGTGGTAACTCCTTGTATAACTACACAATATCAAAACCATGAAATAGATATTGGCACAATCCATAGACAGTATTAAATATACATGCATATATATATATTTTTAAGTGAAAAATATTTTTAAACCTCGCTTTGCCTCACAGCCAAGAAGATCAAATACTTTCTCCAAAAACATAGAATTTGTATCTAACTCCACTCGCTCCAAACTCAAGTCCAACCATGAAATTATTGATCCCTCTCTCTAACCCTCCAACTACAGGCAAGAAGCTGCCCATACATTCCCCAAAGCAGGAGTGCACTCTGCCACAGGCCTAGATGCCGTCAACCTCCTGGACCTTGAACTCCCTAAATTAATGGCCTCTGTGTGAGTATGTGTAAGCAGCCCCTCTCTGTCCCAGTCCATCCTAAAATCACTCCCTTGGAGCCACCACTGCCCCTCTCATCTTCTAGAATTTCTAGAAAGATAAAGAGCTAGATAAGCATCTAGGTACCTTTCTTCTGCTGTTAGCTCTAAAGACAAGTGAATATATCCTAGCTAGGATGTACTCTAAGGAATGCAGAAGTAGGCCGAGTGCAGTGGCTCATTCCTGTAATCCCAGTGCTTTGGGAGGCCGAGGTGGGCGGATCACCTGAGGTCAGGAGTTTGAGTCCAGCCTGGTCAACATGGCAAAGCCCCGTCTCTACTAAAAATACAAAAATTAGCTGGGCGTGGTGGCGGGTGCCTGTAATCCCAGCTACTCGGGAGGCTGAGGCAGGAGAATCACTTGAACCCCCAAGGCAGAGGTTGCAGTGAGCTGAGATGGTACCACTGCCCATTTCAAAAAAAAAAAAAAAAGAATGCAGAAGTAAATTAAATGACCACAAAGAGTTTTTTTTAATTTGAGACAGGGTCTGGCTCTGTCACCTAGGCTGGAATACAGTGGCGCAATCTCAGCTCACTTCAATCTGTGCCTCCTGGGCTCAAGCCATCCCCTGACCTCAGCCTCCTGAGTAGCTGGGACTACAGTCCTGCCACTATGCCTGGCTAATTTTTGTATTTTTTGTAGAGATGTTGCCCAGGCTGGTCTGAAACTCCTGAGCTCAAGGGATCCATCCACCTGGGCCTCCCCAAGTGCTGGGATTACAGGCATGCGCCACCGTGCCCAACCCAGACATCACTTTTATCTGAAGCAACAACTATCTGCTCTTTCTGTTTCCTTACTAATTATCCAGGAACTTTTACAGGTGAACTCTGAGGAGGACAATTTTTATTGTTTTTATGTCAGCATAACTAAAAGTAAAGCTGGATAGGAAGAGGTTACTTGAAAATGATTTCACCTGAACTCAAATGAATAAGCTGGCTACTGCATAAAGCAACAGAGGGGTCCCTTTAATTTAAAAGCTCAGGACTCTGAATCAATTGCTGGTTGGGAGAAGGTAGAGACATTCTTTACTTCTGCCTAGAACTGGGGAAAATGGCGTAGACTTCTGCTCTGAAGCAGTCCTCAGTGCTGCTTCGGTCAGAACTCCCGAGAGGCATCTGAGTGCTGGCCTGTCACTGCGGCTGGCATTCCAGGCATTTCATTGGCCCCACTTCAGCCCACGCCTGGCTCCACGGGGCTGGGCAGCTGAGGGGAGTTTGTGGCAGAGTGGGCATGGGGCACGGCCCGTGCAATGTGCGTTACAAAGGGGCTCTCTCTGAAGCAAGTCCTCTGCACTCCAGTCTATTTGAGGAAGAAAAGGACAATTCCCATAGGGAGGGGGTTTGCTGAAGCAACCAGCTGCCTGGTTTCCTCTCCAGCATTGAGAGGGAGGGAGGGCTGGCTTAACTGGGGGACGGCCTTCTCATCTGGACTGTGTCAAGGCCAAGGTTAGGCTCCAAATTCCAGAAAACCTCTCTGCAGGGTCTTCTTTCAGAGTGGTGAGAATGGAAGCAGGCTCCCTTCCCCTCCAGCACTAGGAAGCCCCGCAATTGGTGAGGTGCAAAGAAAGATGGGCCCAGGCAGGGAGGCGGGAGCAGGGGAGGTGCCCAGGGCAGTGGCTGGAAGGGCAACGGGAGAAGCAGCAGAGGCTGGGGGTGGGGGTCGCAGCAGGTGCTGTCCCTGGCCTGTGTGAAAGGTACTAGAAGGCCCCATCCTTGGTGCCACATGGACCCCAGAGGCTTGTCTTAGTCCATGGGGTCCGAGGTGTAAGACACTTACGTTTGGCGTCACCTCTTAGGCTTGGATGAATTTCAGAAAGTGCTAGACTGGAGAACAGTGGAAAAAATCAGTGGAACAAGATCTGGAGCACTCACTGCTCAATGTCAATGTTAGAGAGCACAACGACACCAATGGGAGGAGGGTGAGGACCAGAGGCTGATTGCATGAGCTCTGTTGGAGTGCAGGACCCACTAACGGGTTATCTCAGGGTTCCTGGAGGCCACGGCTGTGCCTTGTGGTCCAAGACCTGGGGAAGCCACCACTGTGTCTTCCCTCTCCATCCTCCGGTGACTTTGGTCCAATTCCTGTTGCCATGGCAATCAGCCCAGCTGGCCTCACAGTTCACTGGCCTCAAAGTTGGCATCTGTAGGTGAAGCCAGTGGGACCCAGAGAACTTAATTCTTCTCAACTGAGCTGGCTTGGAGGAACTTTTCTCATCAGCCACTGGAGCAGAGAACGTCACCAGCGTCTCACTGACGTCAACATCCTGGGCCTGGCTCTAGCTGAAAAGGAAAATTCTCCCCAAGGCAGACACATCTCCCGAAGCCCACACAGGCACTTTCTATGATTGCACTGGAAATCTGTCTCCTGGGGACAGGGAGCGCGTACGCTCACAGTCAAGTCACAATGTTGAGCAGTCTCCAGGACTCCACGTTCATCTCTAAGAACAGGAGCCGGTGGTTGGGCGCAGATTCTTGAGCCAGATTGCTCGCGTTCAAAACCTGGTCCCTTTTTATTAATTGCATGCTTAGTTACATTTTCTGTTTGTACTTTTGTTTCCTTCTCTGCAAGACGGGGTTAATCACAGACACTTGTACATGATGTAATACACTTACAATACTTAGGACAGGCCTTCCTGCATAGTAAGTGCTCTGCAAACACTGGCTACTATTCTCCCTACGTGCAAACTTCTCCCAGCCAAAAGCCGCCCACACCAAGCCCCTGTGCCTTTTTCCTTCCGCACCCACGAGCAGGCTGCTCCTGGGGCCCTGGAGCTCACTTTCCCAGCCGCCCTCACCACCCACCGTGGCGCAGAAGAGCTTCCGAAGTCCTGGCGTCTCCCACTGGTCTGGGCATCTCTCGCTTCATCTTCCCTCTTGGGCCCCACAACGTGCAGCACTTCTAGGGCAGTATACTTGCTGATTGCTTCCTTACTATTGCTCACAACAACCAGCTAAGACACTGCCAAAGAAACACTCACAGCTGGCCGGTCCACGGCATCCGGAGGGGACTCGGGGGACAGGCCTGTCCTGCCTCTCCCCAGCACCTGGGTGCATGCTGGGACGGGGCGAGCAGGTAGTGCAGGCTTCCAGGCCTCTCCTGCCCCGGAGCTTGGCTGCAGGACTCCCGCAAAATCTCCAAATGCCCCCGATCTGCGTGGTCACCGAGAAGCAGCCCGGCTCGGAACAAGCCCAGGCAAGCCCAGGCAGAGCCCGCCGCCGGGTCCTCCTTCCTGCTCGTGCCACCAGGCCCCGGGGCCGCGACGCGTCTCTCCAGCCCGGGATCCGGGGAGCTGGGCTGTCCCCAGACCGACGGGACAGCGGCATCTCCTCCACCTGAAAAGGAAAGAGGACCAGGTGGGGGCCAGGCAGGGCGCATGAAGGCGGCGCCAGCACCGCGCGATCCGAATCACGTCGGTGCGGGGGAGGGGTC +>ENST00000385130 +GGGCCCCACAACGTGCAGCACTTCTAGGGCAGTATACTTGCTGATTGCTTCCTTACTATTGCTCACAACAACCAGCTAAGACACTGCCAAAGAAACACTCACAGCTGGCC +>ENST00000437157 +CTGGGTGCATGCTGGGACGGGGCGAGCAGGTAGTGCAGGCTTCCAGGCCTCTCCTGCCCCGGAGCTTGGCTGCAGGACTCCCGCAAAATCTCCAAATGCCCCCGATCTGCGTGGTCACCGAGAAGCAGCCCGGCTCGGAACAAGCCCAGGCAAGCCCAGGCAGAGCCCGCCGCCGGGTCCTCCTTCCTGCTCGTGCCACCAGGCCCCGGGGCCGCGACGCGTCTCTCCAGCCCGGGATCCGGGGAGCTGGGCTGTCCCCAGACCGACGGGACAGCGGCATCTCCTCCACAGTTTGCAGGACTCCGAACTGGGCCCGCGAGATCTCCACCTGCGCAAAACGAAAGGGCGGATTCTCCTTGGACTCACGAGGCAACCGCTCCCCGGGGTGAGAACGGGGGACTCATTCCTC diff --git a/pygtftk/data/mini_real_10M/expected_sequence_minus_rv.fa b/pygtftk/data/mini_real_10M/expected_sequence_minus_rv.fa new file mode 100644 index 00000000..dcfa7d0a --- /dev/null +++ b/pygtftk/data/mini_real_10M/expected_sequence_minus_rv.fa @@ -0,0 +1,92 @@ +>ENST00000338370 +CGAGGTCGGGCTTGGGAAGGGTCAGCGGGAGGCCTGAGGGCGCCGGGCGCTGCGGCAGGCGGGCCCGGGGTCCAGCCGAGAGGGTCCGGGCGCCAGGCAACGCGATTCGCGCGGGGGTGAACCCGGGGAGGGGGCCGGCCTCCCCGTTCTGGGACCTTTCGGTGCGTCCGAGCGCGACACCGCCCGCGTCGGGGGCTTGGGAGCCTCGGGGCGCGAGCTGTGTTGGAAGCAAAGTCCTCCTTGTGGGTTGGGGTGGCGGAGGGAGAAGGGAAGCGAGGGTCGCGGCGGGACCAGACGCCCCAGTCCCGGCCCGCCCGCGACTACTGAAGGCGCTGCCGCCTGACCTGAACGGGCACTTGTGTTCCAGCTCCCCTGGGACCTGTGGCCGCCGCCCACAGACCATGCTCCTGGGGCGCCTGACTTCCCAGCTGTTGAGGGCCGTTCCTTGGGCAGGCGGCCGCCCGCCTTGGCCCGTCTCTGGAGTGCTGGGCAGCCGGGTCTGCGGGCCCCTTTACAGCACATCGCCGGCCGGCCCAGGTAGGGCGGCCTCTCTCCCTCGCAAGGGGGCCCAGCTGGAGCTGGAGGAGATGCTGGTCCCCAGGAAGATGTCCGTCAGCCCCCTGGAGAGCTGGCTCACGGCCCGCTGCTTCCTGCCCAGACTGGATACCGGGACCGCAGGGACTGTGGCTCCACCGCAATCCTACCAGTGTCCGCCCAGCCAGATAGGGGAAGGGGCCGAGCAGGGGGATGAAGGCGTCGCGGATGCGCCTCAAATTCAGTGCAAAAACGTGCTGAAGATCCGCCGGCGGAAGATGAACCACCACAAGTACCGGAAGCTGGTGAAGAAGACGCGGTTCCTGCGGAGGAAGGTCCAGGAGGGACGCCTGAGACGCAAGCAGATCAAGTTCGAGAAAGACCTGAGGCGCATCTGGCTGAAGGCGGGGCTAAAGGAAGCCCCCGAAGGCTGGCAGACCCCCAAGATCTACCTGCGGGGCAAATGAGTCTGGCGCCGCCCTTCCCGCCCGTTGCTGCTGTGATCCGTAGTAATAAATTCTCAGAGGACTCAGCCTTT +>ENST00000338338 +GGAATCCGGCCCCTGGGTGGTCCGGAAACGATTCTGGACCTGCGGGTATATCCAGGGCCCGCACCCCCTGGGATTGTGGGAAATGTAGTTTTTTGCCTCCGTAAGGGACCAGGCGGAGCTGAGGAACCGCGCGAGGACTGGGACCGTGATTCCACTAACCGGAAACCGTCGCCTTTCGGGCCCGGCGGGGCCTGAGCCAATGCAGAATCGGGGGCCGCGAGGACGCCAGCGGGCGCTGTGCGTAGGAACCGCCGGGTGGCCGCTGCCGATCGGGGCCGACTTGGGGACGGACCGGAAGTGCCCGAGGGCGGCCGCAGAACGGTCAATTTGAGCCGCGTCGAGCTCCCCTGGGACCTGTGGCCGCCGCCCACAGACCATGCTCCTGGGGCGCCTGACTTCCCAGCTGTTGAGGGCCGTTCCTTGGGCAGGCGGCCGCCCGCCTTGGCCCGTCTCTGGAGTGCTGGGCAGCCGGGTCTGCGGGCCCCTTTACAGCACATCGCCGGCCGGCCCAGGTAGGGCGGCCTCTCTCCCTCGCAAGGGGGCCCAGCTGGAGCTGGAGGAGATGCTGGTCCCCAGGAAGATGTCCGTCAGCCCCCTGGAGAGCTGGCTCACGGCCCGCTGCTTCCTGCCCAGACTGGATACCGGGACCGCAGGGACTGTGGCTCCACCGCAATCCTACCAGTGTCCGCCCAGCCAGATAGGGGAAGGGGCCGAGCAGGGGGATGAAGGCGTCGCGGATGCGCCTCAAATTCAGTGCAAAAACGTGCTGAAGATCCGCCGGCGGAAGATGAACCACCACAAGTACCGGAAGCTGGTGAAGAAGACGCGGTTCCTGCGGAGGAAGGTCCAGGAGGGACGCCTGAGACGCAAGCAGATCAAGTTCGAGAAAGACCTGAGGCGCATCTGGCTGAAGGCGGGGCTAAAGGAAGCCCCCGAAGGCTGGCAGACCCCCAAGATCTACCTGCGGGGCAAATGAGTCTGGCGCCGCCCTTCCCGCCCGTTGCTGCTGTGATCCGTAGTAATAAATTCTCAGAGGACTCAGCCTTT +>ENST00000321751 +TTTGAGCCGCGTCGAGGTCGGGCTTGGGAAGGGTCAGCGGGAGGCCTGAGGGCGCCGGGCGCTGCGGCAGGCGGGCCCGGGGTCCAGCCGAGAGGCTCCCCTGGGACCTGTGGCCGCCGCCCACAGACCATGCTCCTGGGGCGCCTGACTTCCCAGCTGTTGAGGGCCGTTCCTTGGGCAGGCGGCCGCCCGCCTTGGCCCGTCTCTGGAGTGCTGGGCAGCCGGGTCTGCGGGCCCCTTTACAGCACATCGCCGGCCGGCCCAGGTAGGGCGGCCTCTCTCCCTCGCAAGGGGGCCCAGCTGGAGCTGGAGGAGATGCTGGTCCCCAGGAAGATGTCCGTCAGCCCCCTGGAGAGCTGGCTCACGGCCCGCTGCTTCCTGCCCAGACTGGATACCGGGACCGCAGGGACTGTGGCTCCACCGCAATCCTACCAGTGTCCGCCCAGCCAGATAGGGGAAGGGGCCGAGCAGGGGGATGAAGGCGTCGCGGATGCGCCTCAAATTCAGTGCAAAAACGTGCTGAAGATCCGCCGGCGGAAGATGAACCACCACAAGTACCGGAAGCTGGTGAAGAAGACGCGGTTCCTGCGGAGGAAGGTCCAGGAGGGACGCCTGAGACGCAAGCAGATCAAGTTCGAGAAAGACCTGAGGCGCATCTGGCTGAAGGCGGGGCTAAAGGAAGCCCCCGAAGGCTGGCAGACCCCCAAGATCTACCTGCGGGGCAAATGAGTCTGGCGCCGCCCTTCCCGCCCGTTGCTGCTGTGATCCGTAGTAATAAATTCTCAGAGGACTCAGCCT +>ENST00000378853 +TCAATTTGAGCCGCGTCGAGGTCGGGCTTGGGAAGGGTCAGCGGGAGGCCTGAGGGCGCCGGGCGCTGCGGCAGGCGGGCCCGGGGTCCAGCCGAGAGGGTCCGGGCGCCAGGCAACGCGATTCGCGCGGGGGTGAACCCGGGGAGGGGGCCGGCCTCCCCGTTCTGGGACCTTTCGCTCCCCTGGGACCTGTGGCCGCCGCCCACAGACCATGCTCCTGGGGCGCCTGACTTCCCAGCTGTTGAGGGCCGTTCCTTGGGCAGGCGGCCGCCCGCCTTGGCCCGTCTCTGGAGTGCTGGGCAGCCGGGTCTGCGGGCCCCTTTACAGCACATCGCCGGCCGGCCCAGGTAGGGCGGCCTCTCTCCCTCGCAAGGGGGCCCAGCTGGAGCTGGAGGAGATGCTGGTCCCCAGGAAGATGTCCGTCAGCCCCCTGGAGAGCTGGCTCACGGCCCGCTGCTTCCTGCCCAGACTGGATACCGGGACCGCAGGGACTGTGGCTCCACCGCAATCCTACCAGTGTCCGCCCAGCCAGATAGGGGAAGGGGCCGAGCAGGGGGATGAAGGCGTCGCGGATGCGCCTCAAATTCAGTGCAAAAACGTGCTGAAGATCCGCCGGCGGAAGATGAACCACCACAAGTACCGGAAGCTGGTGAAGAAGACGCGGTTCCTGCGGAGGAAGGTCCAGGAGGGACGCCTGAGACGCAAGCAGATCAAGTTCGAGAAAGACCTGAGGCGCATCTGGCTGAAGGCGGGGCTAAAGGAAGCCCCCGAAGGCTGGCAGACCCCCAAGATCTACCTGCGGGGCAAATGAGTCTGGCGCCGCCCTTCCCGCCCGTTGCTGCTGTGATCCGTAGTAATAAATTCTCAGAGGACTC +>ENST00000489799 +GGGAAGGGTCAGCGGGAGGCCTGAGGGCGCCGGGCGCTGCGGCAGGCGGGCCCGGGGTCCAGCCGAGAGGGTCCGGGCGCCAGGCAACGCGATTCGCGCGGGGGTGAACCCGGGGAGGGGGCCGGCCTCCCCGTTCTGGGACCTTTCGCTCCCCTGGGACCTGTGGCCGCCGCCCACAGACCATGCTCCTGGGGCGCCTGACTTCCCAGCTGTTGAGGGCCGTTCCTTGGGCAGGTAGGAAGCCGCGCGGGGGCGGATGGGAGGATGCACACCTGGTTAGGAGTGCGGGTCTCAGCAGCTCCGCTGGGGCAGGGCCGGTGGCCACACACACACTCTTTCCCCTCTAAGCTTCCGATGCTCACAGAGGGAACCTCAGGGGTTCAGGCCAGGAATGAGGTGCGGGGGATCCTCGCTGGGACGAACCTGCTGCTCCTCAACCCGACGGGCCTGTGTGGTCTCGCGAGCGGTGACCGTGGCGTCTGGTTTTCTGCAGGCGGCCGCCCGCCTTGGCCCGTCTCTGGAGTGCTGGGCAGCCGGGTCTGCGGGCCCCTTTACAGCACATCGCCGGCCGGCCCAGGTAGGGCGGCCTCTCTCCCTCGCAAGGGGGCCCAGCTGGAGCTGGAGGAGATGCTGGTCCCCAGGAAGATGTCCGTCAGCCCCCTGGAGAGCTGGCTCACGGCCCGCTGCTTCCTGCC +>ENST00000496905 +GTCGAGGTCGGGCTTGGGAAGGGTCAGCGGGAGGCCTGAGGGCGCCGGGCGCTGCGGCAGGCGGGCCCGGGGTCCAGCCGAGAGGGTCCGGGCGCCAGGCAACGCGATTCGCGCGGGGGTGAACCCGGGGAGGGGGCCGGCCTCCCCGTTCTGGGACCTTTCGGTGCGTCCGAGCGCGACACCGCCCGCGTCGGGGGCTTGGGAGCCTCGGGGCGCGAGCTGTGTTGGAAGCAAAGTCCTCCTTGTGGGTTGGGGTGGCGGAGGGAGAAGGGAAGCGAGGGTCGCGGCGGGACCAGACGCCCCAGTCCCGGCCCGCCCGCGACTACTGAAGGCGCTGCCGCCTGACCTGAACGGGCACTTGTGTTCCAGCTCCCCTGGGACCTGTGGCCGCCGCCCACAGACCATGCTCCTGGGGCGCCTGACTTCCCAGCTGTTGAGGGCCGTTCCTTGGGCAGCTTCCGATGCTCACAGAGGGAACCTCAGGGGTTCAGGCCAGGAATGAGGTGCGGGGGATCCTCGCTGGGACGAACCTGCTGCTCCTCAACCCGACGGGCCTGTGTGGTCTCGCGAGCGGTGACCGTGGCGTCTGGTTTTCTGCAGGCGGCCGC +>ENST00000378602 +TCCGCTGTCGCCCAGTCCCGGCCGCTGGCGGGAACTGACCTGGAGCAAGCAGGACCTTCCCTCCCACCTCTCCCGCCTGGCCTCCGCGGGAGTCCCCTACGATCCCGCTCAGCAGTGGGGCACTCGCTGAGGACAGCGAGTCCTGGGAGTGAGCCCAAGGCCACCCCTGGCCAGCCCAGGAGAGATAGCCAGGGCAGGCCCAGCAGCCCGAGGCCAGGCTCTGGCCACGGCGGTCTCCGACATGGAGAGACATTGTCTGCTTTTTATCCTGTTAACCTGTCTTCGGTGGTTGTGCCACGACATTCCCCAGGGTGCAGGTGCCCGGTGGCCGAGGGTCAGTCCAGTGGTAGAGCCTTGCTCTCCTAGGCTCATCCTGCTGGCGGTCCTCCTGCTTCTGCTGTGTGGTGTCACAGCTGGTTGTGTCCGGTTCTGCTGCCTCCGGAAGCAGGCACAGGCCCAGCCACATCTGCCACCAGCACGGCAGCCCTGCGACGTGGCAGTCATCCCTATGGACAGTGACAGCCCTGTACACAGCACTGTGACCTCCTACAGCTCCGTGCAGTACCCACTGGGCATGCGGTTGCCCCTGCCCTTTGGGGAGCTGGACCTGGACTCCATGGCTCCTCCTGCCTACAGCCTGTACACCCCGGAGCCTCCACCCTCCTACGATGAAGCTGTCAAGATGGCCAAGCCCAGAGAGGAAGGACCAGCACTCTCCCAGAAACCCAGCCCTCTCCTTGGGGCCTCGGGCCTAGAGACCACTCCAGTGCCCCAGGAGTCGGGCCCCAATACTCAACTACCACCTTGTAGCCCTGGTGCCCCTTGAAGGAGGTAGGAGAACGGACCAGAGCTTGGAGAACTAATGCTTGGAGCCAAGGGCCCCAGCCCACCCCACCGTCCCACACATTGCTGTGGCCCCAACCTCGGTGCCATGTTACACCGGCCCCTGGCGTCACCCACTAGGCAGGCTGCTGCTTTCAGCCTCAGCCCCTGGCCCAGCCCCAGCAGGCCCTCAGCCTGGAAGAGGCCCCTTGGGCCTAAGCCTCGGGTGGGAGCTCAGGGCCACCTGTGACGTCTGCATCTTCTTGGAGAGAGAATAAAGTTTGTATTTAAGTGGT +>ENST00000310991 +CTCAGAGCATGGCCCGGGGGCCGCTGGCCGCCCGCGGACTGCGGCTGCTGCTGCCGCTCCTGCCGCTCCTGCCGCTCCTGCCGCTGCCGCAGGTGGCGCTGGGCTTCGCGGACGGCAGCTGCGACCCCTCGGACCAGTGCCCGCCCCAGGCCCGCTGGAGCAGCCTGTGGCACGTGGGGCTCATCCTGCTGGCGGTCCTCCTGCTTCTGCTGTGTGGTGTCACAGCTGGTTGTGTCCGGTTCTGCTGCCTCCGGAAGCAGGCACAGGCCCAGCCACATCTGCCACCAGCACGGCAGCCCTGCGACGTGGCAGTCATCCCTATGGACAGTGACAGCCCTGTACACAGCACTGTGACCTCCTACAGCTCCGTGCAGTACCCACTGGGCATGCGGTTGCCCCTGCCCTTTGGGGAGCTGGACCTGGACTCCATGGCTCCTCCTGCCTACAGCCTGTACACCCCGGAGCCTCCACCCTCCTACGATGAAGCTGTCAAGATGGCCAAGCCCAGAGAGGAAGGACCAGCACTCTCCCAGAAACCCAGCCCTCTCCTTGGGGCCTCGGGCCTAGAGACCACTCCAGTGCCCCAGGAGTCGGGCCCCAATACTCAACTACCACCTTGTAGCCCTGGTGCCCCTTGAAGGAGGTAGGAGAACGGACCAGAGCTTGGAGAACTAATGCTTGGAGCCAAGGGCCCCAGCCCACCCCACCGTCCCACACATTGCTGTGGCCCCAACCTCGGTGCCATGTTACACCGGCCCCTGGCGTCACCCACTAGGCAGGCTGCTGCTTTCAGCCTCAGCCCCTGGCCCAGCCCCAGCAGGCCCTCAGCCTGGAAGAGGCCCCTTGGGCCTAAGCCTCGGGTGGGAGCTCAGGGCCACCTGTGACGTCTGCATCTTCTTGGAGAGAGAATAAAGTTTGTATTTAAGTGG +>ENST00000378598 +GGGGGCCGCTGGCCGCCCGCGGACTGCGGCTGCTGCTGCCGCTCCTGCCGCTCCTGCCGCTCCTGCCGCTGCCGCAGGTGGGTCGGGCGGCGTTCTCTCTCGGTTCGGCCACCGCGGGGCGGGTCCCTGCTCGGACCACGCCCCTCCCGGGCTCACCCTTGTCCCCACAGGTGGCGCTGGGCTTCGCGGACGGCAGCTGCGACCCCTCGGACCAGTGCCCGCCCCAGGCCCGCTGGAGCAGCCTGTGGCACGTGGGCCTGTACACCCCGGAGCCTCCACCCTCCTACGATGAAGCTGTCAAGATGGCCAAGCCCAGAGAGGAAGGACCAGCACTCTCCCAGAAACCCAGCCCTCTCCTTGGGGCCTCGGGCCTAGAGACCACTCCAGTGCCCCAGGAGTCGGGCCCCAATACTCAACTACCACCTTGTAGCCCTGGTGCCCCTTGAAGGAGGTAGGAGAACGGACCAGAGCTTGGAGAACTAA +>ENST00000470931 +AGAGCATGGCCCGGGGGCCGCTGGCCGCCCGCGGACTGCGGCTGCTGCTGCCGCTCCTGCCGCTCCTGCCGCTCCTGCCGCTGCCGCAGGTGGCGCTGGGCTTCGCGGACGGCAGCTGCGACCCCTCGGACCAGTAAGTCGGGGGGGAGGGAGCCGGGGCCTGGCCCCGCCCTATGGGGAGGCACGGGTGGCGAGGTCGGCCGTCCCATGCCCCGCCTGCTCCAGGTGCCGCCGTCCCCACAGGTGCCCGCCCCAGGCCCGCTGGAGCAGCCTGTGGCACGTGGGGCTCATCCTGCTGGCGGTCCTCCTGCTTCTGCTGTGTGGTGTCACAGCTGGTTGTGTCCGGTTCTGCTGCCTCCGGAAGCAGGCACAGGCCCAGCCACATCTGCCACCAGCACGGCAGCCCTGCGACGTGGCAGTCATCCCTATGGACAGTGACAGCCCTGTACACAGCACTGTGACCTCCTACAGCTCCGTGCAGTACCCACTGGGCATGCGGTTGCCCCTGCCCTTTGGGGAGCTGGACCTGGACTCCATGGCTCCTCCTGCCTACAGCCTGTACACCCCGGAGCCTCCACCCTCCTACGATGAAGCTGTCAAGATGGCCAAGCCCAGAGAGGAAGGACCAGCACTCTCCCAGAAACCCAGCCCTCTCCTTGGGGCCTCGGGCCTAGAGACCACTCCAGTGCC +>ENST00000602604 +GAGCATGGCCCGGGGGCCGCTGGCCGCCCGCGGACTGCGGCTGCTGCTGCCGCTCCTGCCGCTCCTGCCGCTCCTGCCGCTGCCGCAGGTGGCGCTGGGCTTCGCGGACGGCAGCTGCGACCCCTCGGACCAGTGCCCGCCCCAGGCCCGCTGGAGCAGCCTGTGGCACGTGGGGTAAGTGGAGGCCGCGGCGGAGCCGTGCGTCCGACGGTTCTGGGGCGGGGGTCACCGGGGCCAGGCCCGCCAGGCCCTTACCTCACCAGGCCGCCTCCGCTGTCGCCCAGTCCCGGCCGCTGGCGGGAACTGACCTGGAGCAAGCAGGACCTTCCCTCCCACCTCTCCCGCCTGGCCTCCGCGGGAGTCCCCTACGATCCCGCTCAGCAGTGGGGCACTCGCTGAGGACAGCGAGTCCTGGGAGTGAGCCCAAGGCCACCCCTGGCCAGCCCAGGAGAGATAGCCAGGGCAGGCCCAGCAGCCCGAGGCCAGGCTCTGGCCACGGCGGTCTCCGACATGGAGAGACATTGTCTGCTTTTTATCCTGTTAACCTGTCTTCGGTGGTTGTGCCACGACATTCCCCAGGGTGCAGGTGCCCGGTGGCCGAGGGTCAGTCCAGTGGTAGAGCCTTGCTCTCCTAGGCTCATCCTGCTGGCGGTCCTCCTGCTTCTGCTGTGTGGTGTCACAGCTGGTTGTGTCCGGTTCTGCTGCCTCCGGAAGCAGGCACAGGCCCAGCCACATCTGCCACCAGCACGGCAGCCCTGCGACGTGGCAGTCATCCCTATGGACAGTGACAGCCCTGTACACAGCACTGTGACCTCCTACAGCTCCGTGCAGTACCCACTGGGCATGCGGTTGCCCCTGCCCTTTGGGGAGCTGGACCT +>ENST00000416272 +GAGCATGGCCCGGGGGCCGCTGGCCGCCCGCGGACTGCGGCTGCTGCTGCCGCTCCTGCCGCTCCTGCCGCTCCTGCCGCTGCCGCAGGTGGGTCGGGCGGCGTTCTCTCTCGGTTCGGCCACCGCGGGGCGGGTCCCTGCTCGGACCACGCCCCTCCCGGGCTCACCCTTGTCCCCACAGGTGGCGCTGGGCTTCGCGGACGGCAGCTGCGACCCCTCGGACCAGTGCCCGCCCCAGGCCCGCTGGAGCAGCCTGTGGCACGTGGGGCTCATCCTGCTGGCGGTCCTCCTGCTTCTGCTGTGTGGTGTCACA +>ENST00000400919 +CTCACTTCCGCCCGGCGCGGGCTTGGATGGAGGCGGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGTACTTCAACTCCCGCCCCCACCTGTGTCCCGCTGGCTCCTAAGCTGCCCCCCTACGTGTGGGTTGCGTCTGAGATGTGGGGCAGGCGCCACTCACGGAAAAAAGGCATCAGAGGAGCTTCCACATCATCGGAACATTTTATTCCTCAGGACGCTACACGCTCACTTTCCTGGCGGAGCAGGTCAGTGCATCGAGTTCTGTTTCCGTGGAAAATGTGCACCTTGGAAACCGCATGACAGCCCCCTCGGCAGGGTCCCCGCGGATCCGCCGCGACGCAGGCACAGCAGCAAGTTCCTCCAGCACGAAGCTGGCCTGCCCGGGCCCAGGTGTGAGGGACTGTTCTGCTCCCAGCAGCGCCCGCTGACGCTTCCCTCTGCGGTCTCGGCGCAAGCGTCTGTCCCTGGCCGCCCTCGGAGCCGTGCCCAGCCTGGCATGCATATGCGGTGGTTAAGGATACAGTTAAAGGGTCAATCACGCGTGTCCACGACAGAGACGCACGCGGCCTCACACCGACTCCTCGGTGGACAGCAATAATGGGTTGATATACTCAAAGCCTTCGAACTCTGACTGGTCGATCCTCTTTATGGCATCCCTGTGGGCAAAGGTGGCAGGGGGGAGGGGGGTGACCGTGTGTTCATTCCCTTGGGGGAAGCGGAGTCACGTTCGCATAAGAATCCTCCCCCAACGCCCACTGGAGAGATGACACCAGGCGGGTGGGACTCAAGGGCAGGCTGGGTCACCAGCTGCCCAAGGTGCCGGCCTGCCATGGGGCTGCCCGAGGGGTGCTCCAGGGACCCGCACCCAGTGGGACTCACTCATCGTCTGGGGTCAGCTGCACGGGCTCGCTGGTGAACTGTGTGTCAAAGTTGTCCAGACCGTAGTCGTCTGTGATCTGTGGCTGGAATGGAGGGAGCGCCTGCTTCTTCTCCAGCTTGGAAAAACAATAGGAGAAGGGTCAGCTCCGCGCGGGCATCATCCCTACCAGATTGAGTGTTTTGCACGCACTTCAATCACAAAATGAAACAGTGAGAAAGTCAGCATTTCAATCTGCCT +>ENST00000469733 +CTTTTGTGGGGTCAGTGCCCACAGGGTTGAGCACCACGTGCCTGGCTGGGCAGTGCTCCTGCCAGGGTCCCCTTCTCCACTGTAGGAAACACGGCTGCTCCTGCAGCCGCGTCTGCTCTGCTGCATCTCCAGCTCCTGCCAGGCATGGTGTGCGCGGCCCCAAGACAGGGAGTTTCCATAGAGACAGGGTTTCACCGTGTTAGCCAGGATGGTCTCGATCTCCTGACCTCGTGATCCGCCCGCCTCGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACCACGCCCGGCCCCCAGAGCCTTAGTCTCAGAATCACACCCACCCCACGCCCAGGGCGTCTGTCACAGCTTTCCAATCCATGAGCCCATCAATCGGACTGGACACAGATAAACTGGGACAGGACGCCGGGTGGCAAAGGCCGGGAGAGCTGGGCCACTCCCTCCAAAAGGCCCCAGACGCAGCTGCATCCTGGAGTCCTTCTGAGAAATGTGGGACCTGCCCCAGCTCCACCCCAGGTGAGGGGCACCAGCCAGCTCCAGAGCTGCCTACCTTCCCTGTCAGGTGCACAGGTCAGCGCCAGGCCAACCCCAGAGCGAGAACACCTGTGCTGGACTGAGCTGGAGCAGCAGGGTGGCCTGCACCGGGGCAGCGAGGGAGGCGTTGGATGGAGCCACCCCACGGCTCCTCTGTGAAGGTCTGCACGTCACTCAGAAAGTTGAAGCAAACCAAGCAGGGTTGGAGCCCACAGTTCACAGCCGGCTGCACAGGGGATGCACCAAGCACAGTTTCCTATGACAAGTGGAAACCTGTGCGCCACAGCAAAACTCCGTCACCACAGCAGCAGATGGCTCCGAAGAAGTGGAGCGTTTTCATCAGGTTCAACTTTGAAACCTCCACCATCACCATCACCAGCACCGCTGTGTCATGCTGATAACTTGAGGACAGGCAGGACAAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGTACTTCAACTCCCGCCCCCACCTGTGTCCCGCTGGCTCCTAAGCTGCCCCCCTACGTGTGGGTTGCGTCTGAGATGTGGGGCAGGCGCCACTCACGGAAAAAAGGCATCAGAGGAGCTTCCACATCATCGGAACATTTTATTCCTCAGGACGCTACACGCTCACTTTCCTGGCGGAGCAGGTCAGTGCATCGAGTTCTGTTTCCGTGGAAAATGTGCACCTTGGAAACCGCATGACAGCCCCCTCGGCAGGGTCCCCGCGGATCCGCCGCGACGCAGGCACAGCAGCAAGTTCCTCCAGCACGAAGCTGGCCTGCCCGGGCCCAGGTGTGAGGGACTGTTCTGCTCCCAGCAGCGCCCGCTGACGCTTCCCTCTGCGGTCTCGGCGCAAGCGTCTGTCCCTGGCCGCCCTCGGAGCCGTGCCCAGCCTGGCATGCATATGCGGTGGTTAAGGATACAGTTAAAGGGTCAATCACGCGTGTCCACGACAGAGACGCACGCGGCCTCACACCGACTCCTCGGTGGACAGCAATAATGGGTTGATATACTCAAAGCCTTCGAACTCTGACTGGTCGATCCTCTTTATGGCATCCCTGTGGGCAAAGGTGGCAGGGGGGAGGGGGGTGACCGTGTGTTCATTCCCTTGGGGGAAGCGGAGTCACGTTCGCATAAGAATCCTCCCCCAACGCCCACTGGAGAGATGACACCAGGCGGGTGGGACTCAAGGGCAGGCTGGGTCACCAGCTGCCCAAGGTGCCGGCCTGCCATGGGGCTGCCCGAGGGGTGCTCCAGGGACCCGCACCCAGTGGGACTCACTCATCGTCTGGGGTCAGCTGCACGGGCTCGCTGGTGAACTGTGTGTCAAAGTTGTCCAGACCGTAGTCGTCTGTGATCTGTGGCTGGAATGGAGGGAGCGCCTGCTTCTTCTCCAGCTTGGAAAAACAATAGGAGAAGGGTCAGCTCCGCGCGGGCATCATCCCTACCAGATTGAGTGTTTTGCACGCACTTCAATCACAAAATGAAACAGTGAGAAAGTCAGCATTTCAATCTG +>ENST00000414253 +CTCACTTCCGCCCGGCGCGGGCTTGGATGGAGGCGGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGGGCCTTCTGGCGGCCGCCCCTGGTTTCTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGTCTTTCATGGATGTGCAAGACTTTGAATGACCCTGGCAGTCAAGGGTGAGTGTCATCCACAGGAGAGCCGGCCAGCCACGGGCTCCATGGGCAGTTGCCCCGCACCACGCCCACGCAGGCCCACTGTGCAGCCCCCAAGTCACCAGAGTTTTCGAGAACCACTTCCAAAAGACACCGTCGTGACCGGAGCCATTAGCAAATATCAGGATTTTTCAAACCACACTTCAATACATCCTTCACTTTAATTTATAAAACAAATTACTGAATATAAAAGTCTCCCCTCTGATGAGCACAGCATTACTCACATATTGTGTACAAGAACGGCCAAACTGGTAACCGGCACGCTACTGGCAACACGGCAGTATTTAGCCACCAGCCGCACAATGGGGTGGAGCGGCCCCTGAGTCATGGAGGCCTGGGGTCTCTGCGCCTGGCCAAGAGGGCTGCGTGGCAATTTCCACACCTGTGCACCAGGCCTCACTCAGAGGCATGAGGTGGCGCGACCCCCTCTCCCAGGGAGCTCAGAAGACGGCTCTGCCACACCTGACACCTGGCAGCTGGCAGCCCTGCCTCTAGGAAGCCTCAGCTCTGGACAGCTGTGCCTTCACCTGAGGGGTACTTCAACTCCCGCCCCCACCTGTGTCCCGCTGGCTCCTAAGCTGCCCCCCTACGTGTGGGTTGCGTCTGAGATGTGGGGCAGGCGCCACTCACGGAAAAAAGGCATCAGAGGAGCTTCCACATCATCGGAACATTTTATTCCTCAGGACGCTACACGCTCACTTTCCTGGCGGAGCAGGTCAGTGCATCGAGTTCTGTTTCCGTGGAAAATGTGCACCTTGGAAACCGCATGACAGCCCCCTCGGCAGGGTCCCCGCGGATCCGCCGCGACGCAGGCACAGCAGCAAGTTCCTCCAGCACGAAGCTGGCCTGCCCGGGCCCAGGTGTGAGGGACTGTTCTGCTCCCAGCAGCGCCCGCTGACGCTTCCCTCTGCGGTCTCGGCGCAAGCGTCTGTCCCTGGCCGCCCTCGGAGCCGTGCCCAGCCTGGCATGCATATGCGGTGGTTAAGGATACAGTTAAAGGGTCAATCACGCGTGTCCACGACAGAGACGCACGCGGCCTCACACCGACTCCTCGGTGGACAGCAATAATGGGTTGATATACTCAAAGCCTTCGAACTCTGACTGGTCGATCCTCTTTATGGCATCCCTGTGGGCAAAGGTGGCAGGGGGGAGGGGGGTGACCGTGTGTTCATTCCCTTGGGGGAAGCGGAGTCACGTTCGCATAAGAATCCTCCCCCAACGCCCACTGGAGAGATGACACCAGGCGGGTGGGACTCAAGGGCAGGCTGGGTCACCAGCTGCCCAAGGTGCCGGCCTGCCATGGGGCTGCCCGAGGGGTGCTCCAGGGACCCGCACCCAGTGGGACTCACTCATCGTCTGGGGTCAGCTGCACGGGCTCGCTGGTGAACTGTGTGTCAAAGTTGTCCAGACCGTAGTCGTCTGTGATCTGTGGCTGGAATGGAGGGAGCGCCTGCTTCTTCTCCAGCTTGGAAAAACAATAGGAGAAGGGTCAGCTCCGCGCGGGCATCATCCCTACCAGATTGAGTGTTTTGCACGCACTTCAATCACAAAATGAAACAGTGAGAAAGTC +>ENST00000428120 +GGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGGGCCTTCTGGCGGCCGCCCCTGGTTTCTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGAAGCAAAAACAGCTCGGGAATGCGAAGGCACCGGAGTCCAAAGTTGGCAGCCAACAACAACAACAACAAAAGAAAAGGCCGGGCACGGTGGCTCACGCCTGTAATCCCAGCCCTTTGAGAGGCTGAGGCAGGCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGTCTTTCATGGATGTGCAAGACTTTGAATGACCCTGGCAGTCAAGGGTGAGTGTCATCCACAGGAGAGCCGGCCAGCCACGGGCTCCATGGGCAGTTGCCCCGCACCACGCCCACGCAGGCCCACTGTGCAGCCCCCAAGTCACCAGAGTTTTCGAGAACCACTTCCAAAAGACACCGTCGTGACCGGAGCCATTAGCAAATATCAGGATTTTTCAAACCACACTTCAATACATCCTTCACTTTAATTTATAAAACAAATTACTGAATATAAAAGTCTCCCCTCTGATGAGCACAGCATTACTCACATATTGTGTACAAGAACGGCCAAACTGGTAACCGGCACGCTACTGGCAACACGGCAGTATTTAGCCACCAGCCGCACAATGGGGTGGAGCGGCCCCTGAGTCATGGAGGCCTGGGGTCTCTGCGCCTGGCCAAGAGGGCTGCGTGGCAATTTCCACACCTGTGCACCAGGCCTCACTCAGAGGCATGAGGTGGCGCGACCCCCTCTCCCAGGGAGCTCAGAAGACGGCTCTGCCACACCTGACACCTGGCAGCTGGCAGCCCTGCCTCTAGGAAGCCTCAGCTCTGGACAGCTGTGCCTTCACCTGAGGGGTACTTCAACTCCCGCCCCCACCTGTGTCCCGCTGGCTCCTAAGCTGCCCCCCTACGTGTGGGTTGCGTCTGAGATGTGGGGCAGGCGCCACTCACGGAAAAAAGGCATCAGAGGAGCTTCCACATCATCGGAACATTTTATTCCTCAGGACGCTACACGCTCACTTTCCTGGCGGAGCAGGTCAGTGCATCGAGTTCTGTTTCCGTGGAAAATGTGCACCTTGGAAACCGCATGACAGCCCCCTCGGCAGGGTCCCCGCGGATCCGCCGCGACGCAGGCACAGCAGCAAGTTCCTCCAGCACGAAGCTGGCCTGCCCGGGCCCAGGTGTGAGGGACTGTTCTGCTCCCAGCAGCGCCCGCTGACGCTTCCCTCTGCGGTCTCGGCGCAAGCGTCTGTCCCTGGCCGCCCTCGGAGCCGTGCCCAGCCTGGCATGCATATGCGGTGGTTAAGGATACAGTTAAAGGGTCAATCACGCGTGTCCACGACAGAGACGCACGCGGCCTCACACCGACTCCTCGGTGGACAGCAATAATGGGTTGATATACTCAAAGCCTTCGAACTCTGACTGGTCGATCCTCTTTATGGCATCCCTGTGGGCAAAGGTGGCAGGGGGGAGGGGGGTGACCGTGTGTTCATTCCCTTGGGGGAAGCGGAGTCACGTTCGCATAAGAATCCTCCCCCAACGCCCACTGGAGAGATGACACCAGGCGGGTGGGACTCAAGGGCAGGCTGGGTCACCAGCTGCCCAAGGTGCCGGCCTGCCATGGGGCTGCCCGAGGGGTGCTCCAGGGACCCGCACCCAGTGGGACTCACTCATCGTCTGGGGTCAGCTGCACGGGCTCGCTGGTGAACTGTGTGTCAAAGTTGTCCAGACCGTAGTCGTCTGTGATCTGTGGCTGGAATGGAGGGAGCGCCTGCTTCTTCTCCAGCTTGGAAAAACAATAGGAGAAGGGTCAGCTCCGCGCGGGCATCATCCCTACCAGATTGAGTGTTTTGCACGCACTTCAATCACAAAATGAAACAGTGAGAAAGTC +>ENST00000400918 +GGATGGAGGCGGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGGGCCTTCTGGCGGCCGCCCCTGGTTTCTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGTACTTCAACTCCCGCCCCCACCTGTGTCCCGCTGGCTCCTAAGCTGCCCCCCTACGTGTGGGTTGCGTCTGAGATGTGGGGCAGGCGCCACTCACGGAAAAAAGGCATCAGAGGAGCTTCCACATCATCGGAACATTTTATTCCTCAGGACGCTACACGCTCACTTTCCTGGCGGAGCAGGTCAGTGCATCGAGTTCTGTTTCCGTGGAAAATGTGCACCTTGGAAACCGCATGACAGCCCCCTCGGCAGGGTCCCCGCGGATCCGCCGCGACGCAGGCACAGCAGCAAGTTCCTCCAGCACGAAGCTGGCCTGCCCGGGCCCAGGTGTGAGGGACTG +>ENST00000497675 +CTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGTGAGTAGGCCACCCCTGCGCCCGGCCCGGTTATCCATCCGTGTTTGGAAACCACAGCCGTTCAGAAGGTCAAGAGGTGGCCGAGCTCAGCGCTGGCTTTTAAAGCCCTGTTTCACACTGGAAAGGTGGCCCAGTGCTGTGGCCTGGCATGTCCAGGTGGCTCTCTGTCACGGGTCTGGGGTCCACCTGCTTGCCGTGCTCTGTGGGCAGGGCAGGCTGGGGGCCCACAGAACAGCACAGAAGGAAGGCTGGGAGCACTGGCCCCGGGTCCACCTGGCCATCCTGGAATCTGGTGGCACCAGCGTCCCCAGGCCCAGAGCACAGGAACACCTTCCCGAGAGTGCGTCATGGGTTTTAAAAATGAAGATCGTCTTTTTTGTCTGGAGATGCTTTTTCTTATTTTTGAAACCCAACGTATATTTTTATGTATTTTTTAAGTAAAGGGGAATGGAACCCAGTTTTGCTAACAAGATAACCCAAACTGCCCAGTGCCTGGCCTTGTGTCTGGCGACCTCTGGGCCCTTGGCCTCCGGAGCAGGTCCTGGGGCTGGGGTGGTGTGAATGATGCTGGTTCGTAACTTTTGGTTGAGTTAATGGGCGGCAGGTTTCAGAGCTTATGGAGACCAGGTCCTTCAGTCATGCCTGATGCCCCTGGTCTTCCAGAAGCAAAAACAGCTCGGGAATGCGAAGGCACCGGAGTCCAAAGTTGGCAGCCAACAACAACAACAACAAAAGAAAAGGCCGGGCACGGTGGCTCACGCCTGTAATCCCAGCCCTTTGAGAGGCTGAGGCAGGTGGGTTGCTGGAGCCCAGGAGTTTGAGACCAGCCTGGGCAACATGGCAAGATCCCATCTTTACATGCCTGGGCGTGGTGGCGCGTGCCTGTGGTCCTAGCTACTCTGGAGGCTGAAGTGGGAGGATTCCCTTGAGCCAGGAATTGGAGGCTGTAGTGAAGTATGATTGCACCACTGCACTCCAGCCTGGGTGACAGAGTAAGACCCTGAATCACGGACAGAGGGTACTGTTGGGAGCCCTGGGGAGAAATCCATGCTCTTGGCTGAAGCTCTGAGATCCTTGTTGCTGTCAGGGTGCTGCCCCCCGCCCCCCGGGGAGGGGCTTTTGTCTTTGCATCGCCTGCTTTTCCAGATAGTCTAAAAAAAGACTTCTGAAGACAAGGACGTTCACGAGGAAAAACTTGCCATTTTGAGCTTTTTAAGCAGTTGCTGAAAGCTTGGCAGACTGCCTCAATTTTTCCTAAGTAGGCGTCAATGAAGTCAGGTCCAGGCCTTGGTGTGTCTGGAATGCTTCAAGCACATTCGAACACTTGATCGTAAGGGAGAGCCGGTACTTTGGAACCGGAACTCACCCGAGGCTGTGGCCACCGCATGGGCAGGCTAGCTGGGGGACAAGCCCCATATCTTTGGGAACAAGGGTTTGCACAGCCACCCTGGGATGCCCTGGGACTCCTGACCGCACAGGACCCCAGCAGGGAGGCCGCCTGGATTGGAGGGTCTGGTCTAACAGCCGGACTTGGTCTTGAACCGTCGCCCTGTCCCGCACAGGCGCCTGCTGAGCCTGGAGCCCTGGCAGAGGCGGGTCTGGGGAGTGGAGCTGCCAGGAGGCCTCCCATTTCTCACAGCCTTGGTGTTCTCCGGGTCACCCAGAGGACCGTCAAATGCTGGATTTGACAAACTATGTAGAATGTTCTTTGTGTCTTTAAGATCTTCTTGTGGTCCTATTTGGACATTTTGTGCATTTTCAGACACCTGCGGGTCACGTGGGTGGATGGGAAGCTGGGCACCTGGTGAGGGGTGAGGATGTTGAGAGCCAGAGCTGCGTTTTGTCTCTGTTGATGTGGCGAGGCCCTGGGTTGGTCACTGGGATTTTTTTTTTTTTTTGAGACGGTGTCTCGCTCTGTCGCCCAGGCTGGAGTGCAGTGGCATGATCTCGGCTCACTGCAACATCTGCCTCCCGGGTTCAAGCGATTCTCCTGCCTCAGTCTCCTGAGTAGCTGGGATTACAGGCGTCACCACACCTGGCTAATTTTTGTATTTTTAGTAGAGACAGGGTTTCACCATGTTGGTCAGGCTGGTCTTGAACTGATCTCAGGTGATCCGCCCGTCTCGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACCGCGCCCGGCCGGTCGTTGGGATTTTAACAGCCCTGAGGCCCCTCACGCTGCCAGGTGCCAGCCCACCCTGCAGCCCTGCTCCCCTGCCCACACGCAGAAGCCACCAGAGGCTTCTGGACTGAGCCCCCACTGTCCTGCAGCCGGGCTGGCCTGTCCACACCACAGGGCGTGCTCAGCTACTGAGCAGAAGCGTCACGGACAGGGCAGATCAGGCCAGGACAAAGCTCTTCCGCCACAGGCGGGGGTCTGAAGGCATCTCAGAGGGCCCCCAAACAAGGGACGCTGCCTGGAAACCCCGGGACAAGATGACCTCGGTTCAGATCTTAGCACCTTCTGGCAACCTTAGAGAAAGCTTCTGGAGGGAGGGGCTGGTTCCCAGGATGGGCAGAAGCCGGAAAGTCTCAGACTGAGTGACCCTCGGGGGCTTCAGAAGGCACTGGGTGGGCTCTGCCAGAGTGAGAAGGCAGCTGATGGCTGCTGGAGCCAGCCCCGGGAGTGGGGGTCCAGCTATGGTCTGGAGAGGGGGACTTGAGGGTTGCAGTGGCCACACAGACGGGGCACAGGAGCCAAAGGAAGGGACACAGCAAAGCCCAAGGGTAAAACGGCGCGCCGTGGACTGGTCTGAGGGCAGAGGCTGTAGGGGAGCGAGGGGCGGTGTGGCTGACAGGTGGACACAGGGACACGTGTCCTGTGGACTTGGCCGCTCAGTGGGGGTGTGTCCCCCAGCAGTGGCGTGTGAGGGATGGTCACTCTGATGGGACACTGACCACTTGGCCTCCAGCAAGATCTAGGCCCAAGTCTAGGCTGAAGCCGCCCACTCAGCCCCGGGACATCGTCCCCGGCAGCTCTGCTGAGCACGCCAGCTCCGGCACTCTCCGGGAGTCATGGCCGGAAGTCAACTGTCCTGGCTTCCAGGGCCACACCTTGGCCAGGCCTGGTGATGGTCATTTCCAGCCGCTCCAGTTGGGCTGATGGGGCCACATGAGGCCGGGGATAGAAGGTGGCTGCGCTCAGACACCCCTCCCGGCCCCACTGGATGCCCAGGGCGCTGACCTGCAGGACTCGGATGGGTTTTCTCCTGCCACCCCTGCCTGGCCGGCCACCATCCCAGCGCCAGCGCCCTCCTGAGAGGTGCAGGGGCCGCGTGGGGCCTCCCAGAGTGGCAGGTTGGCAGCCTGCACGCCGGTGACGGCGTCCTTCTCCGTGGTGAGGCTTGGTCCCTCCTCGCCAGAAACACCAATTCTCTGACGTGAGCTGCACATCCACTGCCCAGCCATGTTTACTCTTCTGCCTCCTGTAGACGCAGCCGCGGCGGCTCTCCCTGGCAGGCCACCCGCCGTCCTGCCTTTTCTCCGGGTCAGGCCGCCTGTCTGCCGGGCTCCACGATGAGCGCGTTCTCAAGCTGAGCAGGCGCCAGAATCCCATAGAGAGGCTTGTTGAGACACAGCTTCCCCACCCCCAGCTCGGACGCAGGGGCCTGGCGTGGCCTCCTCACGGGCACGGTGTGGAAACACCACTGGCGGTTACCGTGGTCTGCCGGGTGCATGAGCCCCTGGGGTGGCCCCGTCCCTTGTTTCTGACCAGCCGGATCCTCTCCAGCGGCAGGAGCAGAGAGGGCCCGGAGGTCCAGACGGTGCTCTCTGCGGCCAGCATGCCGCGGAGGTGGCCGAGTGAGTGTGGCCCCTCCCTTGCAGGCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGCGGGCTCCTGTCTGTCTCTGTGTTGTGATGAAACGTC +>ENST00000378546 +TCACTTCCGCCCGGCGCGGGCTTGGATGGAGGCGGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGGGCCTTCTGGCGGCCGCCCCTGGTTTCTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGCGGGCTCCTGTCTGTCTCTGTGTTGTGATGAAA +>ENST00000378543 +GATGGAGGCGGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGCGGGCTCCTGTCTGTCTCTGTGTTGTGATGAAA +>ENST00000401813 +CGGGGTTTCACTATGTTGGCCAGGCTGGTCTAGAACTCCTGACCTCAAGTGATCTGCCCGCCTCGGCCTCCCAAAGTGCTGGGATTGCAGGCGTGAGACACTGCACCCGGACAATTTTCCTTTTCTTACAAGAACACTGCTCACACTGCATTCAGGGCCAACCCTAACCCAGTATCGCCTCATCCTGGTTTGATTATATCGGCACAGACCTTGCTTCCGAGCGAGGCCACTTTCTCAGGTACTGGTGGACATGAGTCTTCGGAGACGCTGCTCAACCCACAGTGCTCCTCCAGCTTGGTTTCTGTGACTTGCCTTCCCCAGAGGAGGGGTGCCCTGAGAGGTCTCCACTCCCTGACCGGCTCCTTGGTGCCGCGCACTCTGAGAGGCTTCCCAGGGAACAGAGCACACAGGACCGCCCTCCTGGGTAGACCAATCAGCATCTGAGCTCACAATTTCCCAGCAGGGCAGTGGGGTGGAGAGAGAAGCCTGGGCTGGGCTGGGCTGGGCTGGGCTGGGGAAGCTTCTCCGGGCGGGGGGACGTCAGAGCAGGATCTGGGGCTGATAAAAGCCCGCCCCTGGGTGGGGGCTGAGTGGTGCGGAAGCTGAGCCCGACACGTGGGGATGGAGGACAGGCTGTGGGAGGGTGTGAACCGGATACTGCTTGAAGGGGTGCTGGGGACTTTGAGAGAGGGCGGCTGGCCCTGTCTGGTCGGGGATGCTGGCCCAGACACAGGCCATGGCTGGGATGGGGTTCAGAAACAGGACCGCTGTCTCTCCCGGGCCAGGGCCCTCCCCAGCTGCTCCTGGCTTTCTGGTTCTTGGGGTCAGGGGCAGGCCTGTGCCATGACCCCGCCACTGAGGCTGTGAGGAGGCTGTCGGTGCCCAAGGGCACCAAGGCACACCCCTACTCTTGCACCCCATGTGTGGGCCCGAGCACCTGCTCTGCTGCCCCAAAGATCTGGCGATGTTTCCCAGGCAACTGTCTCTCACAGCCTGTCTGCCTGGCACTCCCGTATCCCATAAATGCCACCACATCTGGCTATGGGTGGGCGTGCCTGCCTGGCATCCACGGGCCAGCAGGTGTGGTGGAGCACAGCCCAGTTCCTGGCTGCGTCAGAAGGCTGCCCGGGCCTTTTGGCTGTCCTTGCCAGCAGGTGAGCACTGCCAGGGCACCGTGTGTGGGTGCTGGGCCATTTAGCCACATGGGAAGGGGTGGAGGCAGCCCAGTGCCTTCAGCATGTGCCCAGGGTGCCTGTCGGCCACAGGTCTCATTTGGAAATTGGGAGGGTGCACGGCCACCGGGCTGCTTAGGCCTGCCAGCCTCAGGGCCCGTCACCGCTGTCTTAGCCTGATTTGCAGGGTGTCAGCGCTGGGCAGAGATGAACATTTGGGTGACTCTGAGGATGCCAGTGGCTGGGACACTTGTTCTTCCGCGGTGGAAGGAGTTGGAGAGGCCTGGCTCCCTGACCTACGGCCAGCCTGGCTTCTGAAACCAGCTCAGTGGGCTGGGGCCTGATTCATCATCCATAAATGTGTCCTTTTTTGCCACAGAGGGTAAGGGGCCTCCTAGCCCACCGGTCTGCAGGTGCGGGAGTAGGAGATGGGTGGCTCTGATGCCCCCACCCACTCGATCACCTTCTGCTCTGCCTGGGATGCAAACTCCCACAGCTGAAACGTTCTTTTGTAAACATGAATTTTGGCTTAGAAAAAACTCATTTCCACTGTGCACGTGTCAGTCCCAACCAGAAATTATTTTCCAATAAAGCAAAACTCCGTCACCACAGCAGCAGATGGCTCCGAAGAAGTGGAGCGTTTTCATCAGGTTCAACTTTGAAACCTCCACCATCACCATCACCAGCACCGCTGTGTCATGCTGATAACTTGAGGACAGGCAGGACAAGGCCTTCTGGCGGCCGCCCCTGGTTTCTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGCGGGCTCCTGTCTGTCTCTGTGTTGTGATGAAA +>ENST00000487186 +GAACATGGATGCCTCGCTTTTCAGAGACTCGCGTTCTTGGAACTTACACCCTTTTGGGTTTGCTATTTTTACCCACCCTGAGCCTTCCGGTCTCCATGGCGACGCCTCCAAACAGCAGATTCCAGGCGGCAATGACGTCATCTCTCCCTTTCCTGCCGCCCAGGCCTTGGAGAGATCCAAGGCCTGTGGGCCACGGCTGCGCCTCTCCTGACTCCAGCTTGCCCGTCTGTCCTTGGGGGCAGCGTCCTTCCTTCTCTCGGCCCCAGACGCAGCTGCATCCTGGAGTCCTTCTGAGAAATGTGGGACCTGCCCCAGCTCCACCCCAGGGGCAGCGAGGGAGGCGTTGGATGGAGCCACCCCACGGCTCCTCTGTGAAGGTCTGCACGTCACTCAGAAAGTTGAAGCAAACCAAGCAGGGTTGGAGCCCACAGTTCACAGCCGGCTGCACAGGGGATGCACCAAGCACAGTTTCCTATGACAAGTGGAAACCTGTGCGCCACAGGTGAGCTGGGTCCTGGAAGGTGCAGGGACCAGGCAGCATCTCATCTCAGGACATCAAGGGCTGTCCCCAGCCAGCAGATTTCCCATAAAAACGTGCTGAACTGGGGACAAAGCTGATTCTACAGAGCCGAGAAGCCAGACCTTCCCTGGGGACTCCCGAGGGGGTCCCAGCCACCCTCTCCACCTGCAGAGGTTTCCTGGCCCACTTGGAGGACCTTGGGGGATCCTCCAAGGGCCCCCTTCCAGCTCTTGGCCCATGGGGGAGCCTCTTCCTCAGCTCCGGGTGTGGTGGACAGGAGACCGAGGGCTCCCCGCACCCAGCTGGGCTCAGCGTTTTCAAGCTGAACTTGGTGCGTGGCGGCTTGGAAAGCCGGGAGCCTGCTGCGTGTCTCCTGGGGCTGCTGTGAAAAAATGACCACACACTGGGAGCCTAAAACGAGTGACATGTATATTCTCACAGTTCAGGCAGCTGGTGTCCAAAATCAGTGGTTGGGAGGGTGGAGCTCCGCCTAAAGGCTCTGGGTGGCTGCTGCCTGCCCCTTCCAGCCCCGGGCCCCCGGCATTCCCTGGCGTGCAGCTGCTCCACCCCCAACCCCAAAGCCTCCTTCCTGTGTCTCTGTGTCCAAATTTTCCTTACCTTTTTTTTTTTTTTTTTGAGATAGAGTTTTGCTCTTGTCGCCCAGGCTGGAGTGCAACAGCACGATCTCGGCCTATCGCAACCTCCGCCTCCTGGGTTCAAGCGATTCTCCTGCCTCAGCCTCCTAAGTAGCTGGGATTACAGGTGCCCACCACCACACCCAGCTAATTTTGTATCTTTAGTAGAGATGGGGTTTCACGATGTCTTTCAGGCTGGTCTCGAACTCCTGACCTCACATGATCCACCTGCCTCGGCCTCCCAAAGTGCTGAAATTACAGGCATGAGCCACAGCACCTGGCCAATTTTCCTTTTCTTTCTCTCTCTCTTTTTTTTTTGAGACGGAGTCTTGCTCTGTTGCCCAGGCTGGAGTAAAATGGCACAATCTTGGCTCACTGCAACCTCTGCCTTCTGGGTTCAAGCGATTCTCCTGCCTCAGCCTCCCGAGTAGCTGAGACTACAGGCGCCCACCACCACACCCAGCTAATTTTTGTGTTTTTTAGTAGAGACGGGGTTTCACTATGTTGGCCAGGCTGGTCTAGAACTCCTGACCTCAAGTGATCTGCCCGCCTCGGCCTCCCAAAGTGCTGGGATTGCAGGCGTGAGACACTGCACCCGGACAATTTTCCTTTTCTTACAAGAACACTGCTCACACTGCATTCAGGGCCAACCCTAACCCAGTATCGCCTCATCCTGGTTTGATTATATCGGCACAGACCTTGCTTCCGAGCGAGGCCACTTTCTCAGGTACTGGTGGACATGAGTCTTCGGAGACGCTGCTCAACCCACAGTGCTCCTCCAGCTTGGTTTCTGTGACTTGCCTTCCCCAGAGGAGGGGTGCCCTGAGAGGTCTCCACTCCCTGACCGGCTCCTTGGTGCCGCGCACTCTGAGAGGCTTCCCAGGGAACAGAGCACACAGGACCGCCCTCCTGGGTAGACCAATCAGCATCTGAGCTCACAATTTCCCAGCAGGGCAGTGGGGTGGAGAGAGAAGCCTGGGCTGGGCTGGGCTGGGCTGGGCTGGGGAAGCTTCTCCGGGCGGGGGGACGTCAGAGCAGGATCTGGGGCTGATAAAAGCCCGCCCCTGGGTGGGGGCTGAGTGGTGCGGAAGCTGAGCCCGACACGTGGGGATGGAGGACAGGCTGTGGGAGGGTGTGAACCGGATACTGCTTGAAGGGGTGCTGGGGACTTTGAGAGAGGGCGGCTGGCCCTGTCTGGTCGGGGATGCTGGCCCAGACACAGGCCATGGCTGGGATGGGGTTCAGAAACAGGACCGCTGTCTCTCCCGGGCCAGGGCCCTCCCCAGCTGCTCCTGGCTTTCTGGTTCTTGGGGTCAGGGGCAGGCCTGTGCCATGACCCCGCCACTGAGGCTGTGAGGAGGCTGTCGGTGCCCAAGGGCACCAAGGCACACCCCTACTCTTGCACCCCATGTGTGGGCCCGAGCACCTGCTCTGCTGCCCCAAAGATCTGGCGATGTTTCCCAGGCAACTGTCTCTCACAGCCTGTCTGCCTGGCACTCCCGTATCCCATAAATGCCACCACATCTGGCTATGGGTGGGCGTGCCTGCCTGGCATCCACGGGCCAGCAGGTGTGGTGGAGCACAGCCCAGTTCCTGGCTGCGTCAGAAGGCTGCCCGGGCCTTTTGGCTGTCCTTGCCAGCAGCAAAACTCCGTCACCACAGCAGCAGATGGCTCCGAAGAAGTGGAGCGTTTTCATCAGGTTCAACTTTGAAACCTCCACCATCACCATCACCAGCACCGCTGTGTCATGCTGATAACTTGAGGACAGGCAGGACAAGGCCTTCTGGCGGCCGCCCCTGGTTTCTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGCGGGCTCCTGTCTGTCTCTGTGTTGTGATGAAA +>ENST00000476803 +GCCCCAGGCCCTCCCGGGTCTCCCCACCATAGCGTTTCCGCTACTGAGTACCCCCTGTCTGCCCTCTCTGTCTGCCCCAGGCCTTCTGGCGGCCGCCCCTGGTTTCTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGCGGGCTCCTGTC +>ENST00000440825 +CGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGAAGCAAAAACAGCTCGGGAATGCGAAGGCACCGGAGTCCAAAGTTGGCAGCCAACAACAACAACAACAAAAGAAAAGGCCGGGCACGGTGGCTCACGCCTGTAATCCCAGCCCTTTGAGAGGCTGAGGCAGGTGGGTTGCTGGAGCCCAGGAGTTTGAGACCAGCCTGGGCAACATGGCAAGATCCCATCTTTACATGCCTGGGCGTGGTGGCGCGTGCCTGTGGTCCTAGCTACTCTGGAGGCTGAAGTGGGAGGATTCCCTTGAGCCAGGAATTGGAGGCTGTAGTGAAGTATGATTGCACCACTGCACTCCAGCCTGGGTGACAGAGCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGC +>ENST00000420515 +TGGAGGCGGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGGGCCTTCTGGCGGCCGCCCCTGGTTTCTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGAAGCAAAAACAGCTCGGGAATGCGAAGGCACCGGAGTCCAAAGTTGGCAGCCAACAACAACAACAACAAAAGAAAAGGCCGGGCACGGTGGCTCACGCCTGTAATCCCAGCCCTTTGAGAGGCTGAGGCAGGTGGGTTGCTGGAGCCCAGGAGTTTGAGACCAGCCTGGGCAACATGGCAAGATCCCATCTTTACATGCCTGGGCGTGGTGGCGCGTGCCTGTGGTCCTAGCTACTCTGGAGGCTGAAGTGGGAGGATTCCCTTGAGCCAGGAATTGGAGGCTGTAGTGAAGTATGATTGCACCACTGCACTCCAGCCTGGGTGACAGAGTAAGACCCTGAATCACGGACAGAGGGTACTGTTGGGAGCCCTGGGGAGAAATCCATGCTCTTGGCTGAAGCTCTGAGATCCTTGTTGCTGTCAGGGTGCTGCCCCCCGCCCCCCGGGGAGGGGCTTTTGTCTTTGCATCGCCTGCTTTTCCAGATAGTCTAAAAAAAGACTTCTGAAGACAAGGACGTTCACGAGGAAAAACTTGCCATTTTGAGCTTTTTAAGCAGTTGCTGAAAGCTTGGCAGACTGCCTCAATTTTTCCTAAGTAGGCGTCAATGAAGTCAGGTCCAGGCCTTGGTGTGTCTGGAATGCTTCAAGCACATTCGAACACTTGATCGTAAGGGAGAGCCGGTACTTTGGAACCGGAACTCACCCGAGGCTGTGGCCACCGCATGGGCAGGCTAGCTGGGGGACAAGCCCCATATCTTTGGGAACAAGGGTTTGCACAGCCACCCTGGGATGCCCTGGGACTCCTGACCGCACAGGACCCCAGCAGGGAGGCCGCCTGGATTGGAGGGTCTGGTCTAACAGCCGGACTTGGTCTTGAACCGTCGCCCTGTCCCGCACAGGCGCCTGCTGAGCCTGGAGCCCTGGCAGAGGCGGGTCTGGGGAGTGGAGCTGCCAGGAGGCCTCCCATTTCTCACAGCCTTGGTGTTCTCCGGGTCACCCAGAGGACCGTCAAATGCTGGATTTGACAAACTATGTAGAATGTTCTTTGTGTCTTTAAGATCTTCTTGTGGTCCTA +>ENST00000514625 +CCGCTCACTGTCATGACAAGTGGACAGATGCCCCGGGCCTCAGTTGACCCATCTGTAAGTGGGGCCACGCGACAGCACCTCTGTCACAGGGCTGGGTGTGGGGTGAACAGGCTGGTCCCTGGAGGCAAGTAGTGTGGTGCCCTGAGGCCTGAGGCCAGGCTCCAGGACCGCTCAAGGAACAGGGGATTTGAGGCAACTCAGAGAGGACAGGCCCAGCAGCCGGCCCCAGCCTGATATCTTCCCTCCGCTCAGGCCCCAGACGCAGCTGCATCCTGGAGTCCTTCTGAGAAATGTGGGACCTGCCCCAGCTCCACCCCAGGTGAGGGGCACCAGCCAGCTCCAGAGCTGCCTACCTTCCCTGTCAGGTGCACAGGTCAGCGCCAGGCCAACCCCAGAGCGAGAACACCTGTGCTGGACTGAGCTGGAGCAGCAGGGTGGCCTGCACCGGGGCAGCGAGGGAGGCGTTGGATGGAGCCACCCCACGGCTCCTCTGTGAAGGTCTGCACGTCACTCAGAAAGTTGAAGCAAACCAAGCAGGGTTGGAGCCCACAGTTCACAGCCGGCTGCACAGGGGATGCACCAAGCACAGTTTCCTATGACAAGTGGAAACCTGTGCGCCACAGCAAAACTCCGTCACCACAGCAGCAGATGGCTCCGAAGAAGTGGAGCGTTTTCATCAGGTTCAACTTTGAAACCTCCACCA +>ENST00000420964 +CCTTTCCTGCCGCCCAGGCCTTGGAGAGATCCAAGGCCTGTGGGCCACGGCTGCGCCTCTCCTGACTCCAGCTTGCCCGTCTGTCCTTGGGGGCAGCGTCCTTCCTTCTCTCGGCCCCTTGGAGCAGCTCTGCGGGAACCCCACAGCAGCCCAGCGGATTGAACGCAAAAGACAGCCACCCTCCTGCTCCGGATCCTGGGAGGAGGCTACACGCTGGCGCTGAGACAGCAACCTGCCTGGCCTGGGAAGCCCCCCGCAGCCCCTACATCAGAAGCTTGCTCTTGGCGCAGTGGCTCACGCCTGTAATCCCAGCA +>ENST00000378322 +GCGCCCAGGGGTCCCGCGGGTTTTCGGGCGCAGGGTGGCGCCCGCGGCAGGCGGCGGCCATGAACTTCTCCGAGGTATTCAAGCTCTCCAGCTTACTCTGCAAGTTCTCCCCGGACGGCAAGTACCTGGCTTCCTGTGTCCAGTACCGGTTAGTGGTCCGGGATGTGAACACCCTTCAGATCCTTCAGCTGTACACGTGCCTAGACCAGATCCAGCACATCGAGTGGTCGGCAGACTCGCTCTTCATCCTGTGCGCCATGTACAAGCGAGGGCTGGTGCAGGTCTGGTCTTTAGAGCAGCCCGAATGGCACTGCAAAATAGACGAGGGCTCAGCCGGGCTGGTGGCCTCGTGCTGGAGCCCGGACGGGCGCCACATTCTCAACACCACGGAATTCCATCTGCGGATAACCGTCTGGTCCTTGTGCACAAAATCCGTGTCTTACATCAAATACCCGAAAGCTTGTCTGCAGGGAATCACCTTCACCAGGGACGGCCGCTACATGGCGCTGGCAGAACGGCGCGACTGCAAAGATTACGTGAGCATCTTCGTCTGCAGTGATTGGCAGCTCCTGCGGCATTTTGATACGGACACCCAGGATCTCACAGGGATTGAGTGGGCCCCAAACGGCTGTGTGCTGGCAGTGTGGGACACCTGCTTGGAGTACAAGATTCTGCTGTACTCATTGGATGGCCGGTTGTTGTCCACGTACAGCGCTTACGAGTGGTCCCTGGGCATCAAGTCTGTGGCCTGGAGCCCCAGCAGTCAGTTCCTGGCAGTTGGGAGCTATGATGGAAAGGTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCATTAATGATCCCAAGATAGTGGTGTATAAGGAGGCCGAGAAGAGCCCACAGCTGGGACTGGGCTGCCTCTCCTTCCCGCCGCCCCGGGCCGGGGCCGGCCCTCTCCCGAGCTCAGAGAGTAAATATGAGATCGCCTCTGTCCCAGTCTCCTTACAGACACTGAAACCTGTTACCGACAGAGCAAACCCGAAAATCGGCATAGGAATGCTGGCATTTAGTCCTGACAGCTACTTCCTGGCGACAAGGAACGACAACATTCCCAATGCCGTCTGGGTCTGGGACATTCAGAAGCTGAGGCTGTTCGCGGTGCTCGAGCAGCTGTCCCCAGTGCGCGCATTTCAGTGGGACCCGCAGCAGCCGCGGCTGGCCATCTGCACGGGAGGCAGCAGGCTCTACCTGTGGTCCCCAGCGGGCTGCATGTCGGTGCAGGTGCCTGGGGAAGGTAAGCACATCCCCGAGGCCACGGACGTGGCAGCCTTGCTGTGTGCAGTCTGGCATCACACGGGCTGAACTGTTGAAGCCCAGCTGCTGTCTCCGGCAGCACTCCAGGGAAACTGCCCTCAGAGTCTTTGCGTAAACCTCAAGACGGACACACAGGGGACCCGCTGCCCTCAGCTTTATGGGCTAGAAGCAGCCTCTCCCTGACTTGAGGCAGCTCTGGGGCTCCACCCTGGCTCTGCCTATGTGGGTCACTCCAGGCACTGTGCTGGCCTGCAGGACAAGGGGGTGCCCATCCCCCAGAATCTGGGCCTCCCCTGCTGTAATCCTCTGGCCACCTGTCTCTCTCTAGGCGACTTTGCAGTGCTCTCTCTGTGCTGGCATTTAAGCGGAGACTCGATGGCCCTCCTCAGCAAGGATCACTTCTGCCTCTGCTTCCTGGAGACAGAGGCAGTGGTCGGCACAGCCTGCAGACAGCTGGGCGGCCACACGTAGCAGCGGTGCACTAACGTGTGCAGAAACAGGGCTACTCTGTGTTTCCAGTGTGGGAAAAAACACAGCTTCACCAGGAGGTTCTCCACTGTGGTGGTCTGGATTCAGTGATTGATTCTATTTTTCTATAGCAAAGCATTTTTGTAAATATGTATGGTATAAAACTGTAGTTTTATTATTTAAAATAAATACTTGCTGATTTATACAACTA +>ENST00000270708 +GTTGCAGCCTGCTGCGCGCCCAGGGGTCCCGCGGGTTTTCGGGCGCAGGGTGGCGCCCGCGGCAGGCGGCGGCCATGAACTTCTCCGAGGTATTCAAGCTCTCCAGCTTACTCTGCAAGTTCTCCCCGGACGGCAAGTACCTGGCTTCCTGTGTCCAGTACCGGTTAGTGGTCCGGGATGTGAACACCCTTCAGATCCTTCAGCTGTACACGTGCCTAGACCAGATCCAGCACATCGAGTGGTCGGCAGACTCGCTCTTCATCCTGTGCGCCATGTACAAGCGAGGGCTGGTGCAGGTCTGGTCTTTAGAGCAGCCCGAATGGCACTGCAAAATAGACGAGGGCTCAGCCGGGCTGGTGGCCTCGTGCTGGAGCCCGGACGGGCGCCACATTCTCAACACCACGGAATTCCATCTGCGGATAACCGTCTGGTCCTTGTGCACAAAATCCGTGTCTTACATCAAATACCCGAAAGCTTGTCTGCAGGGAATCACCTTCACCAGGGACGGCCGCTACATGGCGCTGGCAGAACGGCGCGACTGCAAAGATTACGTGAGCATCTTCGTCTGCAGTGATTGGCAGCTCCTGCGGCATTTTGATACGGACACCCAGGATCTCACAGGGATTGAGTGGGCCCCAAACGGCTGTGTGCTGGCAGTGTGGGACACCTGCTTGGAGTACAAGATTCTGCTGTACTCATTGGATGGCCGGTTGTTGTCCACGTACAGCGCTTACGAGTGGTCCCTGGGCATCAAGTCTGTGGCCTGGAGCCCCAGCAGTCAGTTCCTGGCAGTTGGGAGCTATGATGGAAAGGTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCATTAATGATCCCAAGATAGTGGTGTATAAGGAGGCCGAGAAGAGCCCACAGCTGGGACTGGGCTGCCTCTCCTTCCCGCCGCCCCGGGCCGGGGCCGGCCCTCTCCCGAGCTCAGAGAGTAAATATGAGATCGCCTCTGTCCCAGTCTCCTTACAGACACTGAAACCTGTTACCGACAGAGCAAACCCGAAAATCGGCATAGGAATGCTGGCATTTAGTCCTGACAGCTACTTCCTGGCGACAAGGAACGACAACATTCCCAATGCCGTCTGGGTCTGGGACATTCAGAAGCTGAGGCTGTTCGCGGTGCTCGAGCAGCTGTCCCCAGTGCGCGCATTTCAGTGGGACCCGCAGCAGCCGCGGCTGGCCATCTGCACGGGAGGCAGCAGGCTCTACCTGTGGTCCCCAGCGGGCTGCATGTCGGTGCAGGTGCCTGGGGAAGGCGACTTTGCAGTGCTCTCTCTGTGCTGGCATTTAAGCGGAGACTCGATGGCCCTCCTCAGCAAGGATCACTTCTGCCTCTGCTTCCTGGAGACAGAGGCAGTGGTCGGCACAGCCTGCAGACAGCTGGGCGGCCACACGTAGCAGCGGTGCACTAACGTGTGCAGAAACAGGGCTACTCTGTGTTTCCAGTGTGGGAAAAAACACAGCTTCACCAGGAGGTTCTCCACTGTGGTGGTCTGGATTCAGTGATTGATTCTATTTTTCTATAGCAAAGCATTTTTGTAAATATGTATGGTATAAAACTGTAGTTTTATTATTTAAAATAAATACTTGCTGATTTATACAACTA +>ENST00000471223 +GTGGGAAGCAAGATGATTCCCTGGTAGGCTCCACGGGGTCTCAGTGGGAAATGCAGGTGGAGGGACACAGCAGCCCTGGAAGTCCCGCGGCGCTGCCACGGGGAGGGCTGGACCACCCACTGCGGTGCCTCTCCCTCAGCAGGCACGCCCTCGTCGGCCTGGTTAGAAAATCATCTTTTGGCCTCACTGTGCCAGCCTAGTCAGCTCTCAGCTCCCTGAGTCAGGGAAAGGGGTGGAAAAGTGGACAGTCCAGCAGCGCATGTTCTAGAACCCTCTGCAGATGCAGCCAGGCCAGCGAGCACACGCAGGAGGCAGACGGACACCTTCTTGGGTGTTGAGTGGCTGCTCCTGCCTCAGGGCTGCAGATGCAGGCTCACAGCCCCCTGGTGAGTCCCGGAGTGGCTGCATCCAATCTCCAGATCCTCTGTCTTCCCATAAAGGAGACTGAACCCGTGGTGGTTTCTAGATCAAGATTTTTCTCTGAGTAACTCAGGGTTATTATAACATGCAACCTATGGTCACTTTGAAAAAGCTAATGAAAAAGCACTTGGATTTAACTTTGTGTCACTCAATTTTGGTATAAAACAACAACAACAGAAAACCAAGAACACCAAATTTACCGTAACCACAGTAAAATACGCATTTGAATATTCCGGTAGGAGGGCAGGCATCCCCCAGGTCCTGATAGATCCACTCCAGCAGTCAGGCCTGTGCTTGGGGACGCGTGGGCGGGTTGAGGATTGAGACGGTCTCTGATGATGCTAAAGAAGTGTTTCCTTTCTCTTTCCCCTTTCCCCCAACAGCTGCGGATAACCGTCTGGTCCTTGTGCACAAAATCCGTGTCTTACATCAAATACCCGAAAGCTTGTCTGCAGGGAATCACCTTCACCAGGGACGGCCGCTACATGGCGCTGGCAGAACGGCGCGACTGCAAAGATTACGTGAGCATCTTCGTCTGCAGTGATTGGCAGCTCCTGCGGGTAAGGCGTCCCCCAGACTGGAATAAAGTTGTCCTGCTGACTGTGGAGGGATCGAGTGAAGTAGATCCTTCCAGATTCCAGGGGATCTTTGGTAGGATATGGAGCAAGGTGATGTTGTATTAACAAAGGGCAGGTGCGCTGCGAATCACTTCCAGTGGCACCCGGTTGTGTGTTCAGGAGACTTGGTGAAAAGGACGCGTGCCCAGGTGTTTTAAAAGTGAATATGCTGTCACATTTGAGCCCTTTTCCTTGTCCTGTGTGATGGTGTTTGCGCATGTGTGTGCCACGTCGGGAGTTGGGGGGACGTGGAAGTTCACCTTGACTGAGGGCCTGCATTAGGCAGGGCGCTCTGCCAGGTGCCCAGGCACAGAGGGCACTGCCCCCACAGCAGACATATGAACACGATTCCAGCACAATCCATCATTAAGGTAGAGCAACCTCTGGAATGCTGTCAGAGTGCAGAACCCGGGATCCAGGCAGTGCTCTGGAAGGGACTTGTCTGAGCTGGGTCTAAAGGAGTGAGCCTGGCCAGGCAAGGAAAGGTGAGGGGGAGAGTGTGCACATGAGTGCAGGTGCGGGGAGACCAAGCCACCTTCGGGGGCTGGCCAGGCAAGGAAAGGTGAGGGGGAGAGTGTGCACACGAGTGCAGGCGCGGGGAGACCAAGCCGCCCTCGGGGGCTGGCCAGGCAAGGAAAGGTGAGGGGGAGAGTGTGCACACGAGTGCAGGCGCGGGGAGACCAAGCCGCCCTTGGGGGCTGGCCAGGCACTGACGCTGGCATCTGTGGCGGTGCAGCCCCAGCAGCAGCTCTACAGGGATTTCATGCATTTCCAGGATAGAGCTGTTGAGATTTTGTCAATTTCTATATAAGGAAATTAAGTGCGTTAAGAACATCAGTCATAAATGCAATTATTTATTTACGAAAATATTTTCCAAATTTAATGTTTCCCCCCCTTCCTTTGGAAGCATTTTGATACGGACACCCAGGATCTCACAGGGATTGAGTGGGCCCCAAACGGCTGTGTGCTGGCAGTGTGGGACACCTGCTTGGAGGTATGAAGATGACCAGGTGACATGTTTGCTTTCGAGAGCTTTTCCCGGAATTTCATGCTTTCTGAATGCTGCAATATAGTTTGCTTTATCTTATTTCAGATAACAAGTTGAGCTTTGTTTTAAAAGACAGGGTCTTGCTCTGTCACCCAGGCTGGAGTGCAGTGGTGTGATCACGGCCCACTGCAGCCTCGACCTCCTGGACTCAAGTGATCCTCCTACCTCAGCCTCCCAAGTAGCTGGGACCACAAGCATGCACCACCACGCCCGGCTAATTTTTGTATTCTTTGTAGAGATGGGGTTTCACCGTGTTGCCCAGACTGCTCTTGAACTTCTGTGTTCAAGTGATCTGCCAGCTTCGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACAGTGCCCGGCCGAGTTGAACTTTTATCAGCGAGCCATTAGGTTGACCTCCCAATTTCCCCTTTTTCCTCATGCTCTCACTGCCTCTCCGTGACTATCTCAGTACTAGCTGGCAGTTCCAGCTTTTCCACGGCCACGCGGACAGTCCTGCCAGCTTTGTGCTATCTGCACCAATGTCACTCTGCAGCACCCGCGTCTGTGGTGTGTTCCTGGCGACGGGGGTGTATTCATTATTAACTGAAATGTCTCATCTGCAGTACAAGATTCTGCTGTACTCATTGGATGGCCGGTTGTTGTCCACGTACAGCGCTTACGAGTGGTCCCTGGGCATCAAGTCTGTGGCCTGGAGCCCCAGCAGTCAGTTCCTGGCAGTTGGGAGCTATGATGGAAAGGTGGGAACCAGTGCAGGGCACTCAGGAAGTCCGACCGCCCAGCGGGCCGGGCCCTGCCTCACCTGTGCATGGTTTCCTTCCTCAGGTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCATTAATGATCCCAAGATAGTAAGTCTGGAACACGTGTTTCTGCCTGAGCAGGCTGTTGGGGAGGGCGGTGGGAAACTGCTCCTTCACTTTGCTTTCTTGATTGTGGTTTATTATTTAACCGGGCACTTCCATCACCGTAAACTTGCTACTGTGACATTTCACGCGTCTGGCCCTGCCCTGGCCTTTGTTCTTCCTCCTCCACGCTGCCCAAAGGGTCTGAAGTGGGCCTTGCCCTGGCCTGTCCTCTGCCGCTGCCACCCCAGTCCAGTTTTCTCCTTTGTGGTCTGTCTGGATGCAGATCCCTGTGCTGTACAGAGTGGCCAGGGTCTCCTGCCCCCAAACACTGGGCATCTGCTGTCGTGCCAGGCACTGTGCTCTGGGCCGCAGCCAGAGAAGAAGAGACAGACCCCTGCACTTGCAGAGTGCGGCTGGAGAGACAGGGAAGGGGCTGGAGAGCTGGGTGTCTCCACGGGGTGGCAGGGAGTGGCCACCAGCGAGGGATCGCAGGCACAGATGCTGCACCAGTGATCAGGGACTCGGGGAGGGAGCGTTCCAGGCCAAGGGAACAGGAAATGCAAAGGCCCCGAGGAGTGGGCCACGCATCCATGTGTGCAGCGGGCACTGCGCTGGGAGCCAGAGACAAATGCTGCCCTCCTGGTGTTGACCTGTAACCGACAGAGCTGAGTGAAAGGCGGCTTGGATTCGATGAAGAGGCCAGTGAGTGGCTGGGGCTGCGCATGCCAGATCAGCCACTGCCGGGGATGCATCCTGGAGGGGTGTTTAAGTGAAGACCAGGAGGAGGAGCTGCGCGGTGTCTGGGCAGAAAGGGTGTTTCAGGCAGAGGGGCCTCCTGACGTGGCCAGTGGCTTGTGTGGCTGGAGGCCAGGGTGTCTGGACAGGTGAGCCCGAGCAGGGCTGGCCACACAGGTCCTGAAGGTTTGCCTGTGATTCCTGCATTCTCCAAATCCCTTCGCCACACAGCAGCAGAGCATGCTTTAAAGGCATGAACCAGGCCAGGTGACTCCCTTACCTGGGGCTCTTCAGGGGCGTAGGGGCTGCCCGCCTTCCACTGAGCCTGGGCCGCTGTCCTTTGCTTGCCAGGCTCTCGGGCACAGATGCCCCCACCTCGGGTCTGTGTCTGCTGCTCCCGGGGCCTCTGCTGTGTTGGTGCAAGTGTTCTCTGTATCCTCTTATCACGGAGGGAAGGCTGAGCCCACTCCCTTGCTGGATGATGGTGGCTGCAGTGGTCTCCCGTCTGTAATCACAGGGCACACATTTGCTGCCTGTGTCTCAAAGGGTGGGCTCCTCAGCAGGACACGAGAGAGGGTGGCTGGGTGATCTCAGCTCTCGGGACTGCGGGGTTCGTGCTTCCGTCTCTCCCGGTGGCAGCAGGACCAGCTGTCATGGCAGGCACACCTGTTGACCATGCGCTGTCATGGGCATTTGCCACGTCCATCCTTGGCTTCCGGGTCCCTGTCCTGAGCCGGGCGTGGCCACCTTGTGTCTTTCAGGTGGTGTATAAGGAGGCCGAGAAGAGCCCACAGCTGGGACTGGGCTGCCTCTCCTTCCCGCCGCCCCGGGCCGGGGCCGGCCCTCTCCCGAGCTCAGAGAGTAAATGTAAGTAGCACATGTGATGTCATTTGTTTTCCTTTTTTAATGCAAGATTCCTCGTTGTCCAGATAAACTTCGGATGTTCCTTATGTTTAAAAAAAAAAACTTTTTTTCCCTTCCATGCTTCCAGCCAGTGTGCCCCTCAGCCTGTTGGCTGGAGGTTGACTAGGGTCTGAATTGCGCAGTGGGCCGTGAAGGTGCGGCTTCTGTTACTGAATATGAGCCCTGGAGACCCGGATCTGACAGCGGGAGCTCCGAGGGGATGTTTTTCCGGAGCTCCGAGAATGATGTTTTTCAAAGAAACACTTTTCCGTGGGTGGCGCTCAGAGTGGGTCTGGAACCCGGCGGTGCTCCCGAGCGCTGTCTCCGGCTTGAGGCCCGGTTCTGATGCAGCCTCTTGACTCTGGGCATTTCCTATGTGTCTGTTTCCTCATCGCTGAAATGGGCATAGTAAAAGCACCCATCCCACAGGGGCATGAGGGCATCTGAAGGTTGCAGGTAGAGGAAGCGGTGCCCCAAGTGCCGACGGGCCCACCCCGGGGCTCGGTGTGTGCTCAGGATGGGGGTCAGGACAGGTGCAGCCTGGCACACAGGAGGCGCTCCCCAGGAGCCCAGGGGCGTCCTTGTTCCACAGCCCCTGCTTCTGCTGTGATGATGGTTCTTCCACAGCCGGAAAGTCTAAGGGTACTGACGCTGAGGTGGAAGGGATTGTGAACTCAGATGCTGGTAGTCGACAGAAAAGTGCTGAGGAGTTGGAGCTGCTGAGATTGCAGCTAGGACCTGTCCATGTCCCTCTCCAGTCAGCCCCTGGCACGTGGGGTCCACCCCCCACCTAGTCGGGCCTGGCAGGTGATGGTGCCACTCTCATCCGGGGCACTTGCGGGCAGGCCCCTCGCTGCGGCTGCCAGGCTTTGCTTAGCTCTTCCTGCCCTTGGGCCGCACTTTCCTCCCCTTTGAACAGAGGAGCTGGGTTCGCGATGCCCGATGCAGGCACAGCAGCCTCTCAGCCGCGTGCGTACTTCCCGAAAGGGTGACAATGGCGTGTTCTTCCTGTTGGTGTTCTAGATGAGATCGCCTCTGTCCCAGTCTCCTTACAGACACTGAAACCTGTTACCGACAGAGCAAACCCGAAAATCGGCATAGGAATGCTGGCATTTAGTCCTGACAGCTACTTCCTGGCGACAAGGAACGGTCAGTTGTGCTGACGCAGGTGCTGTCTCACCCTTTACTGTGTCCTGTGGCCCCAGGTGTAGAAGCGACTGGAAAAGAAAATGAAGTTGGGGGTTTCCGACACGTCACCTCCTTTCACGTTTCTGCAGTAGCCGAGGTGCTCACAGAAGCTCCTTGGAGGCGCTGGGCCTTTGTCCTGCAGCAGCCGCAGGTCCGCGCATGAGTCAGGAGGCCTCCACCCTGCTCACTTGCTCCACTCTGCTGAGTAGAAAGCAGGGCTGGGCACACTGCAGCCCGCCTTTTGTTAAGGGTTTCTCCATTTGTAAAGGGCTAAAAAAAAAAAAAAAA +>ENST00000424367 +GGGTGGCGCCCGCGGCAGGCGGCGGCCATGAACTTCTCCGAGGTATTCAAGCTCTCCAGCTTACTCTGCAAGTTCTCCCCGGACGGCAAGTACCTGGCTTCCTGTGTCCAGTACCGGTTAGTGGTCCGGGATGTGAACACCCTTCAGATCCTTCAGCTGTACACGTGCCTAGACCAGATCCAGCACATCGAGTGGTCGGCAGACTCGCTCTTCATCCTGTGCGCCATGTACAAGCGAGGGCTGGTGCAGGTCTGGTCTTTAGAGCAGCCCGAATGGCACTGCAAAATAGACGAGGGCTCAGCCGGGCTGGTGGCCTCGTGCTGGAGCCCGGACGGGCGCCACATTCTCAACACCACGGAATTCCATCTGCGGATAACCGTCTGGTCCTTGTGCACAAAATCCGTGTCTTACATCAAATACCCGAAAGCTTGTCTGCAGGGAATCACCTTCACCAGGGACGGCCGCTACATGGCGCTGGCAGAACGGCGCGACTGCAAAGATTACGTGAGCATCTTCGTCTGCAGTGATTGGCAGCTCCTGCGGCATTTTGATACGGACACCCAGGATCTCACAGGGATTGAGTGGGCCCCAAACGGCTGTGTGCTGGCAGTGTGGGACACCTGCTTGGAGGTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCATTAATGATCCCAAGATAGTGGTGTATAAGGAGGCCGAGAAGAGCCCACAGCTGGGACTGGGCTGCCTCTCCTTCCCGCCGCCCCGGGCCGGGGCCGGCCCTCTCCCGAGCTCAGAGAGTAAATATGAGATCGCCTCTGTCCCAGTCTCCTTACAGACACTGAAACCTGTTACCGACAGAGCAAACCCGAAAATCGGCATAGGAATGCTGGCATTTAGTCCTGACAGCTACTTCCTGGCGACAAGGAACG +>ENST00000497940 +GAACGGCGCGACTGCAAAGATTACGTGAGCATCTTCGTCTGCAGTGATTGGCAGCTCCTGCGGCATTTTGATACGGACACCCAGGATCTCACAGGGATTGAGTGGGCCCCAAACGGCTGTGTGCTGGCAGTGTGGGACACCTGCTTGGAGTACAAGATTCTGCTGTACTCATTGGATGGCCGGTTGTTGTCCACGTACAGCGCTTACGAGTGGTCCCTGGGCATCAAGTCTGTGGCCTGGAGCCCCAGCAGTCAGTTCCTGGCAGTTGGGAGCTATGATGGAAAGGTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCATTAATGATCCCAAGATAGTGGTGTATAAGGAGGCCGAGAAGAGCCCACAGCTGGGACTGGGCTGCCTCTCCTTCCCGCCGCCCCGGGCCGGGGCCGGCCCTCTCCCGAGCTCAGAGAGTAAATGTAAGTAGCACATGTGATGTCATTTGTTTTCCTTTTTTAATGCAAGATTCCTCGTTGTCCAGATAAACTTCGGATGTTCCTTATGTTTAAAAAAAAAAACTTTTTTTCCCTTCCATGCTTCCAGCCAGTGTGCCCCTCAGCCTGTTGGCTGGAGGTTGACTAGGGTCTGAATTGCGCAGTGGGCCGTGAAGGTGCGGCTTCTGTTACTGAATATGAGCCCTGGAGACCCGGATCTGACAGCGGGAGCTCCGAGGGGATGTTTTTCCGGAGCTCCGAGAATGATGTTTTTCAAAGAAACACTTTTCCGTGGGTGGCGCTCAGAGTGGGTCTGGAACCCGGCGGTGCTCCCGAGCGCTGTCTCCGGCTTGAGGCCCGGTTCTGATGCAGCCTCTTGACTCTGGGCATTTCCTATGTGTCTGTTTCCTCATCGCTGAAATGGGCATAGTAAAAGCACCCATCCCACAGGGGCATGAGGGCATCTGAAGGTTGCAGGTAGAGGAAGCGGTGCCCCAAGTGCCGACGGGCCCACCCCGGGGCTCGGTGTGTGCTCAGGATGGGGGTCAGGACAGGTGCAGCCTGGCACACAGGAGGCGCTCCCCAGGAGCCCAGGGGCGTCCTTGTTCCACAGCCCC +>ENST00000469643 +AGTACTAGCTGGCAGTTCCAGCTTTTCCACGGCCACGCGGACAGTCCTGCCAGCTTTGTGCTATCTGCACCAATGTCACTCTGCAGCACCCGCGTCTGTGGTGTGTTCCTGGCGACGGGGGTGTATTCATTATTAACTGAAATGTCTCATCTGCAGTACAAGATTCTGCTGTACTCATTGGATGGCCGGTTGTTGTCCACGTACAGCGCTTACGAGTGGTCCCTGGGCATCAAGTCTGTGGCCTGGAGCCCCAGCAGTCAGTTCCTGGCAGTTGGGAGCTATGATGGAAAGGTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCATTAATGATCCCAAGATAGTGGTGTATAAGGAGGCCGAGAAGAGCCCACAGCTGGGACTGGGCTGCCTCTCCTTCCCGCCGCCCCGGGCCGGGGCCGGCCCTCTCCCGAGCTCAGAGAGTAAATGTAAGTAGCACATGTGATGTCATTTGTTTTCCTTTTTTAATGCAAGATTCCTCGTTGTCCAGATAAACTTCGGATGTTCCTTATGTTT +>ENST00000494884 +CCAGCTTTTCCACGGCCACGCGGACAGTCCTGCCAGCTTTGTGCTATCTGCACCAATGTCACTCTGCAGCACCCGCGTCTGTGGTGTGTTCCTGGCGACGGGGGTGTATTCATTATTAACTGAAATGTCTCATCTGCAGTACAAGATTCTGCTGTACTCATTGGATGGCCGGTTGTTGTCCACGTACAGCGCTTACGAGTGGTCCCTGGGCATCAAGTCTGTGGCCTGGAGCCCCAGCAGTCAGTTCCTGGCAGTTGGGAGCTATGATGGAAAGGTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCATTAATGATCCCAAGATAGTAAGTCTGGAACACGTGTTTCTGCCTGAGCAGGCTGTTGGGGAGGGCGGTGGGAAACTGCTCCTTCACTTTGCTTTCTTG +>ENST00000465916 +TCCCCGATCGCTCTCCCCTCACCTCCCAGCTTCGGAGCTGCGAGCCCAGGCTTCCTGTGTCCAGTACCGGTTAGTGGTCCGGGATGTGAACACCCTTCAGATCCTTCAGCTGTACACGTGCCTAGACCAGATCCAGCACATCGAGTGGTCGGCAGACTCGCTCTTCATCCTGTGCGCCATGTACAAGCGAGGGCTGGTGCAGGTCTGGTCTTTAGAGCAGCCCGAATGGCACTGCAAAATAGACGAGGGCTCAGCCGGGCTGGTGGCCTCGTGCTGGAGCCCGGACGGGCGCCACATTCTCAACACCACGGAATTCCATCTGCGGATAACCGTCTGGTCCTTGTGCACAAAATCCGTGTCTTACATCAAATACCCGAAAGCTTGTCTGCAGGGAATCACCTTCACCAGGGACGGCCGCTACATGGCGCTGGCAGAACGGCGCGACTGCAAAGATTACGTGAGCATCTTCGTCTGCAGTGATTGGCAGCTCCTGCGGCATTTTGATACGGACACCCAGGATCTCACAGGGATTGAGTGGGCCCCAAACGGCTGTGTGCTGGCAGTGTGGGACACCTGCTTGGAGTACAAGATTCTGCTGTACTCATTGGATGGCCGGTTGTTGTCCACGTACAGCGCTTACGAGTGGTCCCTGGGCATCAAGTCTGTGGCCTGGAGCCCCAGCAGTCAGTTCCTGGCAGTTGGGAGCTATGATGGAAAGGTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCA +>ENST00000419924 +GCTGCGCGCCCAGGGGTCCCGCGGGTTTTCGGGCGCAGGGTGGCGCCCGCGGCAGGCGGCGGCCATGAACTTCTCCGAGGTATTCAAGCTCTCCAGCTTACTCTGCAAGTTCTCCCCGGACGGCAAGTACCTGGCTTCCTGTGTCCAGTACCGGTTAGTGGTCCGGGATGTGAACACCCTTCAGATCCTTCAGCTGTACACGTGCCTAGACCAGATCCAGCACATCGAGTGGTCGGCAGACTCGCTCTTCATCCTGTGCGCCATGTACAAGCGAGGGCTGGTGCAGGTCTGGTCTTTAGAGCAGCCCGAATGGCACTGCAAAATAGACGAGGGCTCAGCCGGGCTGGTGGCCTCGTGCTGGAGCCCGGACGGGCGCCACATTCTCAACACCACGGAATTCCATCTGCGGATAACCGTCTGGTCCTTGTGCACAAAATCCGTGTCTTACATCAAATACCCGAAAGCTTGTCTGCAGGGAATCACCTTCACCAGGGACGGCCGCTACATGGCGCTGGCAGAACGGCGCGACTGCAAAGATTACGTGAGCATCTTCGTCTGCAGTGATTGGCAGCTCCTGCGGTACAAGATTCTGCTGTACTCATT +>ENST00000479331 +TGCGCGCCCAGGGGTCCCGCGGGTTTTCGGGCGCAGGGTGGCGCCCGCGGCAGGCGGCGGCCATGAACTTCTCCGAGGTATTCAAGCTCTCCAGCTTACTCTGCAAGTTCTCCCCGGACGGCAAGTACCTGGCTTCCTGTGTCCAGTACCGGTTAGTGGTCCGGGATGTGAACACCCTTCAGATCCTTCAGCTGTACACGTGCCTAGACCAGATCCAGCACATCGAGTGGTCGGCAGACTCGCTCTTCATCCTGTGCGCCATGTACAAGCGAGGGCTGGTGCAGGTGTGTGCTGCCGTGTCGCTTAGAATCTGGACACCTTCTGAGGGCCCCTGGGAAGGAGGGGTTTTGTTCTGTGCCTTTCTAGTTTGAAAAAAAAGTCCGTGCAGCTCAAAGCCAGTTTTCTTTTGAAATTATAACGTTCTCTAAAGTTTAAGAACATTTAAA +>ENST00000377837 +CGCGGGGACACTCGTGCGACTGGGGCAAGGTGCCCAGGGGCTTCTCTCCTAATTTGCCTCACGTAACAGTTGAGACCCCAGAGGGCAGCAAAACTGGGTTCGAATTGGAGAGCCGTCCAGGCACAGACAAATTCATTCATCTGCCCAGTGCCCGCTAACTGCGGTTCCAGGCGCCGGCGACGCAATTCCAGAGCTGCCACCGCTTCCCCGCGGAGCATGGGGCTGCCTCGCCGGGCAGGGGACGCGGCGGAGCTGCGCAAGAGCCTGAAGCCGCTGCTGGAGAAGCGCCGGCGCGCGCGCATCAACCAGAGCCTGAGCCAGCTTAAGGGGCTCATCCTGCCGCTGCTGGGCCGGGAGGATGCTTCTGGCTGGCACACCTGGCTTCCCCTCCATGCTCAGAACTGCTTCCTACTCTACATCCAGGCTCCTGAGCAGCCCCCAGCTTAAGCTTCAGCAGCTCCAGGGTAAATCCATCTCCGCCCAGAGCTGACTCCGGATCTGCCCCAGTGACAATAACAAGATAAATGCCTTCCATTCTCTTCGTACTTACAGGATGTAATCCACATATTTACACAGTGTTTCATTTGCGGTAATGTTTGTTTTGTTTCTTGTTCCTTCGTACCTATCTGGGAAGCCTGTGCAATTCAGATGTCCAGGCCCACTTCCAGAAGTTCTCATTCCCTGTGCTTGAGTCAATGGCCGCAGACCATACACCTGAGAGCAAGTTAATCTGCTCTAACAAAGATATCACATCTAAGAATGGTGGTTGGCAGGGGCTGGGGGGTGGGAAGAATGGGGAGTTGGTGCTTCATGGGTACAGAGATTCAGTTTTGCAAGAGGAAAAGAGCTCTGGAGATGGATGCTGCTGATGGCTACACCGCAATGTGAATGTGCATGATGCTTAAATATGGTTAAGATGGGCCGGGCGCGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCCGAGGCGGGCAGATCACGAGGTCAGGAGATCGAGACCATCTTGGCTAACACGGTGAAACCCCATCTCTACTATAAATACAAAAAATTAGCCGGGCGTGGGGGCGGGCACCTGTGGTCCCAGCTACTCGGGAGGCTGAGGCAGGAGAATGGCATGAACCTGGGAGGTGGAGCTTGCAGTGAGCCGAGATCACGCCACTGCACTCCAGGCTGGGCGACAGAGCGAGACTCCGTCTCAAAAAAAAAAAAAAAAAAAAAA +>ENST00000377836 +CCCGGGCCGCGCCCGGGACCTCATTTCGGACCTCGGTTTCCCTTTGCGTGGGGCTCGCAGCTGCCACCGCTTCCCCGCGGAGCATGGGGCTGCCTCGCCGGGCAGGGGACGCGGCGGAGCTGCGCAAGAGCCTGAAGCCGCTGCTGGAGAAGCGCCGGCGCGCGCGCATCAACCAGAGCCTGAGCCAGCTTAAGGGGCTCATCCTGCCGCTGCTGGGCCGGGAGGATGCTTCTGGCTGGCACACCTGGCTTCCCCTCCATGCTCAGAACTGCTTCCTACTCTACATCCAGGCTCCTGAGCAGCCCCCAGCTTAAGCTTCAGCAGCTCCAGGGTAAATCCATCTCCGCCCAGAGCTGACTCCGGATCTGCCCCAGTGACAATAACAAGATAAATGCCTTCCATTCTCTTCGTACTTACAGGATGTAATCCACATATTTACACAGTGTTTCATTTGCGGTAATGTTTGTTTTGTTTCTTGTTCCTTCGTACCTATCTGGGAAGCCTGTG +>ENST00000471190 +TGACTTGCATTGACCTGGCTCCAATCAAGCTACAACTCAAGCAGTCACGGGGAGAAGGATTGTAGATGGGCCAGTGACTCACAGGGTCAGGCACTCGGGGGAGCCTGAGTCAGGAGGATGCTTCTGGCTGGCACACCTGGCTTCCCCTCCATGCTCAGAACTGCTTCCTACTCTACATCCAGGCTCCTGAGCAGCCCCCAGCTTAAGCTTCAGCAGCTCCAGGGTAAATCCATCTCCGCCCAGAGCTGACTCCGGATCTGCCCCAGTGACAATAACAAGATAAATGCCTTCCATTCTCTTCGTACTTACAGGATGTAATCCACATATTTACACAGTGTTTCATTTGCGG +>ENST00000377834 +ACTCGTCTGGCACCAGCCCGGGCCGCGCCCGGGACCTCATTTCGGACCTCGGTTTCCCTTTGCGTGGGGCTCGCAGCTGCCACCGCTTCCCCGCGGAGCATGGGGCTGCCTCGCCGGGCAGGGGACGCGGCGGAGCTGCGCAAGAGCCTGAAGCCGCTGCTGGAGAAGCGCCGGCGCGCGCGCATCAACCAGAGCCTGAGCCAGCTTAAGGGGCTCATCCTGCCGCTGCTGGGCCGGGAGAACTCCAACTGCTCGAAGCTAGAGAAGGCAGACGTCCTGGAAATGACCGTGCGCTTCCTGCAGGAGCTGCCTGCGTCCTCATGGCCCACGGCAGCGCCCCTGCCTTGCGACAGCTACCGCGAGGGCTACAGCGCCTGTGTGGCGCGCCTGGCCCGCGTGCTGCCCGCCTGCCGTGTCCTGGAGCCCGCCGTGAGCGCGCGCCTGCTGGAGCACCTGTGGCGGAGAGCGGCCAGCGCCACCCTGGACGGCGGGCGCGCTGGGGATTCCAGTGGCCCGTCTGCCCCCGCCCCAGCGCCCGCGTCTGCCCCAGAGCCCGCATCCGCTCCGGTGCCCTCGCCGCCCTCGCCTCCCTGCGGCCCTGGCCTCTGGCGGCCGTGGTAGCCCCTCGGCCGATCCACAGACCCTGCCGACTGCTTGGGACCTTGGGGCACTGGACAGGTTGAAGCTCTTGGTGGCGGCTGCTGTTCCCATCATTAGGGGCCAGCCCAGTACCCACACCCAGGCCGGAAGCCGGCTGTTTGTGACTGGCGTGGCAGACTGAAAGCCCTGGGGCTGGGGCTCGGCTCAGGGAATAAAAGGAGCGTCCCTGCTTCACCCCCAACTTGGCTGGAGAAGAAAGGACAAGAGGCAGCAGGGTGAAGAAGAAGCCCCCCATCCCAGCTGGTGGAGATAGTTCTGGAACTGGACCCCGCAGCTGCGTGGGCAGCCGACACACCCACCCCAGCACTGGCACCAGACCAGAGCCAGAGCCAGGACCTGGGCAAAGTGCAGCCGTGCACCCTGCCTGGTCACTGCTCTCCCAGCCCTGCCTGGGCCTACCTCCTGCCCAGCTCTGCTTGGGACCCTCTGGGCATGCAGCAGCAGTAGCCTAAGGGCTCTGGTCACTTCCAGGGCTCTACAGGGCAGCAGAGCAGAGCAAAAGGGTGCATATGCTGGGAGCTGTCACCTCCACTCCTAGGCTTTTCTGCCTAGAGCAGAATTATAGGGGCAGTATACATCCAGGGGTCTGTGCGGTGGGGCTGGGGGATTCCTTAAGTGACTTTGGGAAGGATTTGTTTTCCCGAGCATCAATTTCACACCTGGGCATTGCACCCCAGGCTATGCAGTCTTTCAGTGTGAGGAAGGGGCAGAACAAGAATGAGGCGGCCCCGTGGCCTCAAGGAAGCTTGTGGCTTTGGAGGATCTGACTCCAGCAGAGTCTGTGCCAATGTGGGGTGAGCAGGGCCCCTGCCATGGAGCAGCAGGAATTTGAGGGATGGAGCAGGTTAAAGAATGGGAAACATCTTCACTTGTTTTTTTTTCTTGCAAACTACTCCCTGCTACTCATTGAGACTGGTTACTGGAAGCAACTTGTTAAGATTTTTCTTTCTGGGCGGGCGCGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCCAAGGCGGGTGGATCACCTGAGGTCAGGAGTTCGAGACCAGCTTAGCCAATATGGTGAAACCCCGTCTCTACTAAAAATACAAAAATTAGCCGGGTGTGGTGGCATGTGCCAGCTACTCGGGAGGCTGAGGCAAGAGAATCACTTGAACCTCGGAGGCTGAAGTTGCAGTGAGCCAAGATTGAGCCATTGCTCTCCAGCCTGGGTGACACAGCAAGACTCTGTCTCAAAAAAAATTTTTTATTTCTTTCTTTTCCATGGAGGCCTAGAGTCCCTGTGAAGGCTAGGAAGGGGCTGCTGATCCCAGGAGTGCCCACGAGGAGTGGGGGGCACTGTTGGCCCATAATCAGGCAAACACCCATCATTTCATGGGGGATTCATGAAATCATAGTCAGGCAAACACCCGTCATTTCATGGCTAAGCATTTGCAGAAGGTGGAGGATTCTCCCCCGAGTCCCCAAATCAGCAGCCTGTGCTAGGGACCAGAGCACCGGGGGCAAGAAGACAGAACCAATGTGGGAGTGGGGATGGTCACTAAATCTGACTGTGCCACACAAGCCCATGATGACCTTGGCACTGGTTTGGGTGGCAGGATATGAAGGAAGCTGTAGGCATTATTGAAAAAATCATTGTTCAGCCAACAGGGTGAGGCTCCCAGCAAGGCCGTGCCATCTTCCCACCTCCCTGTGCCCAGAGGGTTAGACTGTAAGCTCCCGGAGGGCGAGGCTGGGGCTGAGCGTGCCTCCACGTCCCCAAGGCACAGGGTGCACAGTGGGTGCTCACTGAATATAGTGGACTAGTGAGCAGAGGATGAGAGGACTACCCTGTAATGAGCCTTGGACAGTCTGGCATTTGCCTTAACTCCCACTCCCATGCCCTGGGATCACTGTTGGATATTTACTCCATGAGGACAAATACTGGGGAGGTGTGGAGAGGAGGGAGGGCAGGTTCCTCTTACTTTCACCCATTGCTGAGAATGAGCGCCTGTTGGCACTGCCTTTGTGAGCCTCCGGGAGCAGGTAACCTGCGGCCCAAGCCCGCCTAGGACTCCACATCAGGCAGGCACAGGACTGGCCCCTTGTCCTCATAAAAACTCTCAGTACAGCTTAAACTCTGTAAGATCTAACCAGCCAGGAGGACCCTCGCTTCCTCTCCGCCATGCTTGCCACCTCTTGCTTCTGAGAGTCCATCTCAGTTCGCAGTTCTGTGACTTGCATTGACCTGGCTCCAATCAAGCTACAACTCAAGCAGTCACGGGGAGAAGGATTGTAGATGGGCCAGTGACTCACAGGGTCAGGCACTCGGGGGAGCCTGAGTCAGGAGGTCAGTGGGCCCTGGAAGGGAGGGGGCAAGCCTGGGTGGGTAAGGTTCTGGGCCCCAGGCAAGAAGGCAGAGTTTCTCCGCAGGGGTGTGTGCAAGAGCTAGCTGCGCAGAAGGTCTCCGCTGGCTCTCCAAGCCGGGCTTGTGAAATAGGAACGCCAACATCCTCCTCCACAGGCAGTGGCAGGCACCTCCTCCTCAGGTGCCCCCCAAGCCCTATCTGATGGGCAAAGGTGAACGCAGGGCGGTGGGCTTTTCCTGTGCAGAGGGAGACTGATTCAAAGGGTCATTTATGACCTTTCACAAGTCCCACATCCTGCCCAATGGCCAGGTCTTGGGATGCTGTTGCAAGATGGTTCTGTGACTCCATGTGACTGTCTGATGATTGCCCCAGCTGGGGAAAAGGCTCCCATGTCTCTTTCTCATAAAACCAGTGGGCAAGGCCGGGCGCAGTGGCTCACGTCTGTAATGCCAGCACTTCGGGAGACCAAGGTGGGCGGATCACCTGAGGTCAGGAGTTCAAGACCAGCCTGACCAACATGGTGAAACCCCGTCTCTACAAAAATATGGAAATTAGCTGGGCATGACGGCGGGTGCCTGTAACCCCAGCTACTTGGGAGGCTGAGGAGGGATAATCAGTTGAACCCAGGAGGTGGAGGTTGCAGTGAGCCGAGATCGCGCCACTGCACTCCAGCCTGGGTGACAGAGCAAGACTCCATCTCAAAAACAAACAAACAAAAAACTAGCGGGTGAAATGATTCAGTGACCTAAGGACAGCCAGAGCACTAAGCTGCTGGGAACCCATCTGTGCTGAAATGTAGATTTCCCAGGAAACTCAGGCTTGGGACAGGCGCCTACCTGCTCCTCGGGCACCAGGTGATTAGGAGAGGTCGAATCTCATTTCCACGTGAGTGAGGATAAAGACTGGGCTGCCAAGGAGGACTCCTCATAAACATTGACAAATTGCTCTGCCCCGCCTGTGATCCCAGACGACTCCTGCAGTCTGGGATCCTGAGTGTCCTGTGGGTTCATCTCGGATGGGCGCTGCATAAACAGCCTGCAGGGAACGTCTGGGAGAACCAGCTTCACAACAGATATAATAAGGAAGAAGTTTGAAATATTGCAAGAATTGCGAAAGTGTGACACACAGATACAAAGTGGGCACATGCTCGTGGGAAAATGTTGCCAATAGACTTGCTTGACTCTGGAGTTACCCCGAACCTTCAATTTGTTTAAAAAAAAAAAAAGGCAATATCTTGACGTGCAATAAAGTGAACTGCAATAAAA +>ENST00000487437 +CCAGCCCGGGCCGCGCCCGGGACCTCATTTCGGACCTCGGTTTCCCTTTGCGTGGGGCTCGCAGCTGCCACCGCTTCCCCGCGGAGCATGGGGCTGCCTCGCCGGGCAGGGGACGCGGCGGAGCTGCGCAAGAGCCTGAAGCCGCTGCTGGAGAAGCGCCGGCGCGCGCGCATCAACCAGAGCCTGAGCCAGCTTAAGGGGCTCATCCTGCCGCTGCTGGGCCGGGAGTGCCTTGCGACAGCTACCGCGAGGGCTACAGCGCCTGTGTGGCGCGCCTGGCCCGCGTGCTGCCCGCCTGCCGTGTCCTGGAGCCCGCCGTGAGCGCGCGCCTGCTGGAGCACCTGTGGCGGAGAGCGGCCAGCGCCACCCTGGACGGCGGGCGCGCTGGGGATTCCAGTGGCCCGTCTGCCCCCGCCCCAGCGCCCGCGTCTGCCCCAGAGCCCGCATCCGCTCCGGTGCCCTCGCCGCCCTCGCCTCCCTGCGGCCCTGGCCTCTGGCGGCCGTGGTAGCCCCTCGGCCGATCCACAGACCCTGCCGACTGCTTGGGACCTTGGGGCACTGGACAGGTTGAAGCTCTTGGTGGCGGCTGCTGTTCCCATCATTAGGGGCCAGCCCAGTACCCACACCCAGGCCGGAAGCCGGCTGTTTGTGACTGGCGTGGCAGACTGAAAGCCCTGGGGCTGGGGCTCGGCTCAGGGAATAAAAGGAGCGTCCCTGCTTCACCCCCAACTTGGCTGGAGAAGAAAGGACAAGAGGCAGCAGGGTGAAGAAGAAGCCCCCCATCCCAGCTGGTGGAGATAGTTCTGGAACTGGACCCCGCAGCTGCGTGGGCAGCCGACACACCCACCCCAGCACTGGCACCAGACCAGAGCCAGAGCCAGGACCTGGGCAAAGTGCAGCCGTGCACCCTGCCTGGTCACTGCTCTCCCAGCCCTGCCTGGGCCTACCTCCTGCCCAGCTCTGCTTGG +>ENST00000489730 +TCGTCTGGCACCAGCCCGGGCCGCGCCCGGGACCTCATTTCGGACCTCGGTTTCCCTTTGCGTGGGGCTCGCAGCTGCCACCGCTTCCCCGCGGAGCATGGGGCTGCCTCGCCGGGCAGGGGACGCGGCGGAGCTGCGCAAGAGCCTGAAGCCGCTGCTGGAGAAGCGCCGGCGCGCGCGCATCAACCAGAGCCTGAGCCAGCTTAAGGGGCTCATCCTGCCGCTGCTGGGCCGGGAGAACTCCAACTGCTCGAAGCTAGAGAAGGCAGACGTCCTGGAAATGACCGTGCGCTTCCTGCAGGAGCTGCCTGCGTCCTCATGGCCCACGGCAGCGCCCCGTGAGTGAGCCCTCCCTGCCCTGCCGCGCGCTCTGCACCCCGCACCCGGCACCCTACCCCGCGCCTCACGCGGCTCTCCGCCCGCAGTGCCTTGCGACAGCTACCGCGAGGGCTACAGCGCCTGTGTGGCGCGCCTGGCCCGCGTGCTGCCCGCCTGCCGTGTCCTGGAGCCCGCCGTGAGCGCGCGCCTGCTGGAGCACCTGTGGCGGAGAGCGGCCAGCGCCACCCTGGACGGCGGGCGCGCTGGGGATTCCAGTGGCCCGTCTGCCCCCGCCCCAGCGCCCGCGTCTGCCCCAGAGCCCGCATCCGCTCCGGTGCCCTCGCCGCCCTCGCCTCCCTGCGGCCCTGGCCTCTGGCGGCCGTGGTAGCCCCTCGGCCGATCCACAGACCCT +>ENST00000635687 +GACCCCTCCCCCGCACCGACGTGATTCGGATCGCGCGGTGCTGGCGCCGCCTTCATGCGCCCTGCCTGGCCCCCACCTGGTCCTCTTTCCTTTTCAGGTGGAGGAGATGCCGCTGTCCCGTCGGTCTGGGGACAGCCCAGCTCCCCGGATCCCGGGCTGGAGAGACGCGTCGCGGCCCCGGGGCCTGGTGGCACGAGCAGGAAGGAGGACCCGGCGGCGGGCTCTGCCTGGGCTTGCCTGGGCTTGTTCCGAGCCGGGCTGCTTCTCGGTGACCACGCAGATCGGGGGCATTTGGAGATTTTGCGGGAGTCCTGCAGCCAAGCTCCGGGGCAGGAGAGGCCTGGAAGCCTGCACTACCTGCTCGCCCCGTCCCAGCATGCACCCAGGTGCTGGGGAGAGGCAGGACAGGCCTGTCCCCCGAGTCCCCTCCGGATGCCGTGGACCGGCCAGCTGTGAGTGTTTCTTTGGCAGTGTCTTAGCTGGTTGTTGTGAGCAATAGTAAGGAAGCAATCAGCAAGTATACTGCCCTAGAAGTGCTGCACGTTGTGGGGCCCAAGAGGGAAGATGAAGCGAGAGATGCCCAGACCAGTGGGAGACGCCAGGACTTCGGAAGCTCTTCTGCGCCACGGTGGGTGGTGAGGGCGGCTGGGAAAGTGAGCTCCAGGGCCCCAGGAGCAGCCTGCTCGTGGGTGCGGAAGGAAAAAGGCACAGGGGCTTGGTGTGGGCGGCTTTTGGCTGGGAGAAGTTTGCACGTAGGGAGAATAGTAGCCAGTGTTTGCAGAGCACTTACTATGCAGGAAGGCCTGTCCTAAGTATTGTAAGTGTATTACATCATGTACAAGTGTCTGTGATTAACCCCGTCTTGCAGAGAAGGAAACAAAAGTACAAACAGAAAATGTAACTAAGCATGCAATTAATAAAAAGGGACCAGGTTTTGAACGCGAGCAATCTGGCTCAAGAATCTGCGCCCAACCACCGGCTCCTGTTCTTAGAGATGAACGTGGAGTCCTGGAGACTGCTCAACATTGTGACTTGACTGTGAGCGTACGCGCTCCCTGTCCCCAGGAGACAGATTTCCAGTGCAATCATAGAAAGTGCCTGTGTGGGCTTCGGGAGATGTGTCTGCCTTGGGGAGAATTTTCCTTTTCAGCTAGAGCCAGGCCCAGGATGTTGACGTCAGTGAGACGCTGGTGACGTTCTCTGCTCCAGTGGCTGATGAGAAAAGTTCCTCCAAGCCAGCTCAGTTGAGAAGAATTAAGTTCTCTGGGTCCCACTGGCTTCACCTACAGATGCCAACTTTGAGGCCAGTGAACTGTGAGGCCAGCTGGGCTGATTGCCATGGCAACAGGAATTGGACCAAAGTCACCGGAGGATGGAGAGGGAAGACACAGTGGTGGCTTCCCCAGGTCTTGGACCACAAGGCACAGCCGTGGCCTCCAGGAACCCTGAGATAACCCGTTAGTGGGTCCTGCACTCCAACAGAGCTCATGCAATCAGCCTCTGGTCCTCACCCTCCTCCCATTGGTGTCGTTGTGCTCTCTAACATTGACATTGAGCAGTGAGTGCTCCAGATCTTGTTCCACTGATTTTTTCCACTGTTCTCCAGTCTAGCACTTTCTGAAATTCATCCAAGCCTAAGAGGTGACGCCAAACGTAAGTGTCTTACACCTCGGACCCCATGGACTAAGACAAGCCTCTGGGGTCCATGTGGCACCAAGGATGGGGCCTTCTAGTACCTTTCACACAGGCCAGGGACAGCACCTGCTGCGACCCCCACCCCCAGCCTCTGCTGCTTCTCCCGTTGCCCTTCCAGCCACTGCCCTGGGCACCTCCCCTGCTCCCGCCTCCCTGCCTGGGCCCATCTTTCTTTGCACCTCACCAATTGCGGGGCTTCCTAGTGCTGGAGGGGAAGGGAGCCTGCTTCCATTCTCACCACTCTGAAAGAAGACCCTGCAGAGAGGTTTTCTGGAATTTGGAGCCTAACCTTGGCCTTGACACAGTCCAGATGAGAAGGCCGTCCCCCAGTTAAGCCAGCCCTCCCTCCCTCTCAATGCTGGAGAGGAAACCAGGCAGCTGGTTGCTTCAGCAAACCCCCTCCCTATGGGAATTGTCCTTTTCTTCCTCAAATAGACTGGAGTGCAGAGGACTTGCTTCAGAGAGAGCCCCTTTGTAACGCACATTGCACGGGCCGTGCCCCATGCCCACTCTGCCACAAACTCCCCTCAGCTGCCCAGCCCCGTGGAGCCAGGCGTGGGCTGAAGTGGGGCCAATGAAATGCCTGGAATGCCAGCCGCAGTGACAGGCCAGCACTCAGATGCCTCTCGGGAGTTCTGACCGAAGCAGCACTGAGGACTGCTTCAGAGCAGAAGTCTACGCCATTTTCCCCAGTTCTAGGCAGAAGTAAAGAATGTCTCTACCTTCTCCCAACCAGCAATTGATTCAGAGTCCTGAGCTTTTAAATTAAAGGGACCCCTCTGTTGCTTTATGCAGTAGCCAGCTTATTCATTTGAGTTCAGGTGAAATCATTTTCAAGTAACCTCTTCCTATCCAGCTTTACTTTTAGTTATGCTGACATAAAAACAATAAAAATTGTCCTCCTCAGAGTTCACCTGTAAAAGTTCCTGGATAATTAGTAAGGAAACAGAAAGAGCAGATAGTTGTTGCTTCAGATAAAAGTGATGTCTGGGTTGGGCACGGTGGCGCATGCCTGTAATCCCAGCACTTGGGGAGGCCCAGGTGGATGGATCCCTTGAGCTCAGGAGTTTCAGACCAGCCTGGGCAACATCTCTACAAAAAATACAAAAATTAGCCAGGCATAGTGGCAGGACTGTAGTCCCAGCTACTCAGGAGGCTGAGGTCAGGGGATGGCTTGAGCCCAGGAGGCACAGATTGAAGTGAGCTGAGATTGCGCCACTGTATTCCAGCCTAGGTGACAGAGCCAGACCCTGTCTCAAATTAAAAAAAACTCTTTGTGGTCATTTAATTTACTTCTGCATTCTTTTTTTTTTTTTTTTGAAATGGGCAGTGGTACCATCTCAGCTCACTGCAACCTCTGCCTTGGGGGTTCAAGTGATTCTCCTGCCTCAGCCTCCCGAGTAGCTGGGATTACAGGCACCCGCCACCACGCCCAGCTAATTTTTGTATTTTTAGTAGAGACGGGGCTTTGCCATGTTGACCAGGCTGGACTCAAACTCCTGACCTCAGGTGATCCGCCCACCTCGGCCTCCCAAAGCACTGGGATTACAGGAATGAGCCACTGCACTCGGCCTACTTCTGCATTCCTTAGAGTACATCCTAGCTAGGATATATTCACTTGTCTTTAGAGCTAACAGCAGAAGAAAGGTACCTAGATGCTTATCTAGCTCTTTATCTTTCTAGAAATTCTAGAAGATGAGAGGGGCAGTGGTGGCTCCAAGGGAGTGATTTTAGGATGGACTGGGACAGAGAGGGGCTGCTTACACATACTCACACAGAGGCCATTAATTTAGGGAGTTCAAGGTCCAGGAGGTTGACGGCATCTAGGCCTGTGGCAGAGTGCACTCCTGCTTTGGGGAATGTATGGGCAGCTTCTTGCCTGTAGTTGGAGGGTTAGAGAGAGGGATCAATAATTTCATGGTTGGACTTGAGTTTGGAGCGAGTGGAGTTAGATACAAATTCTATGTTTTTGGAGAAAGTATTTGATCTTCTTGGCTGTGAGGCAAAGCGAGGTTTAAAAATATTTTTCACTTAAAAATATATATATATGCATGTATATTTAATACTGTCTATGGATTGTGCCAATATCTATTTCATGGTTTTGATATTGTGTAGTTATACAAGGAGTTACCACTGAACGAAACTGGGGGAAGGGTACACAGAATCTCTGTACTTTTTTTGTTGTTGTTGCAATTTCCTGTAAATCTATGATTATTTTAAAATAAAAAAGTTAAAGCATACGTATTTACATTTGATTAAATGCAGTGTGATATCCTGGGTTGGATTTTGGAACAAAACAAGGCATGAGTGAAAAAACTGGTAAAATCCAAAAAAGCCTTTAGTTAAAAGTAATACCAGTGTTAATTTCTTAGTTTTGACAAATGTGCCATGGCTGTGTAAGATGCAAATGTTAGAGGAAACTGGGCGAAGAATTTGAGGGAACTCTCTGTACTATTCTTTGCAGCTTTTCTGTAAATCTACAATTATTCCAAAATAAAAGTCTATTAAAAATGTAA +>ENST00000385130 +GGCCAGCTGTGAGTGTTTCTTTGGCAGTGTCTTAGCTGGTTGTTGTGAGCAATAGTAAGGAAGCAATCAGCAAGTATACTGCCCTAGAAGTGCTGCACGTTGTGGGGCCC +>ENST00000437157 +GAGGAATGAGTCCCCCGTTCTCACCCCGGGGAGCGGTTGCCTCGTGAGTCCAAGGAGAATCCGCCCTTTCGTTTTGCGCAGGTGGAGATCTCGCGGGCCCAGTTCGGAGTCCTGCAAACTGTGGAGGAGATGCCGCTGTCCCGTCGGTCTGGGGACAGCCCAGCTCCCCGGATCCCGGGCTGGAGAGACGCGTCGCGGCCCCGGGGCCTGGTGGCACGAGCAGGAAGGAGGACCCGGCGGCGGGCTCTGCCTGGGCTTGCCTGGGCTTGTTCCGAGCCGGGCTGCTTCTCGGTGACCACGCAGATCGGGGGCATTTGGAGATTTTGCGGGAGTCCTGCAGCCAAGCTCCGGGGCAGGAGAGGCCTGGAAGCCTGCACTACCTGCTCGCCCCGTCCCAGCATGCACCCAG diff --git a/pygtftk/data/mini_real_10M/expected_sequence_plus.fa b/pygtftk/data/mini_real_10M/expected_sequence_plus.fa new file mode 100644 index 00000000..4335fd48 --- /dev/null +++ b/pygtftk/data/mini_real_10M/expected_sequence_plus.fa @@ -0,0 +1,40 @@ +>ENST00000624652 +ACGCGTCCGTGCAGCGGAGGCTTCCTGAGCCCCCTGGAGAGCCTGGCCTGGGCCCGGGTGTGGAGACCCTCCCGGGCTTTCAATCCGGGCAGGAGGCAGATGGCAGACTCAGCAGTCACGAATCGCTTAATTCTGAAAGTCTGGTGAGAAGACACGGCGAGAATCGGGGTCCAGCACAGATGATGGCGACAGCGGAGAAGGGAAGGGCTGGGACCTGACGGTGAAGATGCTGGCGGGCAACGAATTCCAGGTGTCCCTGAGCAGCTCCATGTCGGTGTCAGAGCTGAAGGCGCAGATCACCCAGAAGATCGGCGTGCACGCCTTCCAGCAGCGTCTGGCTGTCCACCCGAGCGGTGTGGCGCTGCAGGACAGGGTCCCCCTTGCCAGCCAGGGCCTGGGCCCCGGCAGCACGGTCCTGCTGGTGGTGGACAAATGCGACGAACCTCTGAGCATCCTGGTGAGGAATAACAAGGGCCGCAGCAGCACCTACGAGGTACGGCTGACGCAGACCGTGGCCCACCTGAAGCAGCAAGTGAGCGGGCTGGAGGGTGTGCAGGACGACCTGTTCTGGCTGACCTTCGAGGGGAAGCCCCTGGAGGACCAGCTCCCGCTGGGGGAGTACGGCCTCAAGCCCCTGAGCACCGTGTTCATGAATCT +>ENST00000379389 +CGCAGGCTCGGCGGCACGCCCCCTGACGTGTGTGCCTCAGGCTTATAATAGGGCCGGTGCTGCCTGCCGAAGCCGGCGGCTGAGAGGCAGCGAACTCATCTTTGCCAGTACAGGAGCTTGTGCCGTGGCCCACAGCCCACAGCCCACAGCCATGGGCTGGGACCTGACGGTGAAGATGCTGGCGGGCAACGAATTCCAGGTGTCCCTGAGCAGCTCCATGTCGGTGTCAGAGCTGAAGGCGCAGATCACCCAGAAGATCGGCGTGCACGCCTTCCAGCAGCGTCTGGCTGTCCACCCGAGCGGTGTGGCGCTGCAGGACAGGGTCCCCCTTGCCAGCCAGGGCCTGGGCCCCGGCAGCACGGTCCTGCTGGTGGTGGACAAATGCGACGAACCTCTGAGCATCCTGGTGAGGAATAACAAGGGCCGCAGCAGCACCTACGAGGTACGGCTGACGCAGACCGTGGCCCACCTGAAGCAGCAAGTGAGCGGGCTGGAGGGTGTGCAGGACGACCTGTTCTGGCTGACCTTCGAGGGGAAGCCCCTGGAGGACCAGCTCCCGCTGGGGGAGTACGGCCTCAAGCCCCTGAGCACCGTGTTCATGAATCTGCGCCTGCGGGGAGGCGGCACAGAGCCTGGCGGGCGGAGCTAAGGGCCTCCACCAGCATCCGAGCAGGATCAAGGGCCGGAAATAAAGGCTGTTGTAAAGAGAAA +>ENST00000609981 +GCCCTTTGCTGCGGCAGCTTTCTGTTCTCCCTGGCTCCCTGCACGGAACTGAGCTTTGGTGTGTGATGCGCTGCTGGCCCAGGCTACACCCCGACAAGGGACACCGGGGGCCCCGGGAGCAGAGAGACCTCAGAGCAGCCTCCTCCTGCCTCCTGTGGACGGCCGGCCCCAGCTGGTGATCCCAGCCAGTCCCAGCTTTCAGTTGCTGCCCCCACCGACAGTCCTCAGTCCCTCCATGATGGCTCCCCCGACAGCCGGCCCCCTTCCTGGCCCAGCTCTTCCGCCTGAGGACCCAGGGCCGGATCCGGAGAGCAGGTGGCTTTTCTTGAGCGCCAACATTCTGCCCGTGGTGGAGCGGTGCATGGGTGCCATGCAAGAGGGGATGCAGATGGTGAAGCTGCGTGGCGGCTCCAAGGGCCTGGTCCGCTTCTACTACCTGGACGAGCACCGCTCCTGCATCCGCTGGAGGCCCTCACGCAAGAACGAGAAGGCCAAGATCTCCATCGACTCCATCCAGGAGGTGAGTGAGGGGCGGCAGTCGGAGGTCTTCCAGCGCTACCCTGACGGC +>ENST00000449969 +CACGGGCGGGCGCGGCAGGGCAGCGTGTGGGGCTGCGATCGGCATGGGCTCTGCGCGCGGGGTGCCCCTGCTCGGGCTGGGGCTCAGGGGACGCCGGGGGCCAGCACAGGGCCCGGTGTCCCTCGGGCCGTGCCGGTAACTGGGATTGGCACCCGCCGGCCATGGAAGAGCCTGGGCCCCCAGGTGGGCTCAGCCAAGACCAAGTGGAGCGGTGCATGGGTGCCATGCAAGAGGGGATGCAGATGGTGAAGCTGCGTGGCGGCTCCAAGGGCCTGGTCCGCTTCTACTACCTGGACGAGCACCGCTCCTGCATCCGCTGGAGGCCCTCACGCAAGAACGAGAAGGCCAAGATCTCCATCGACTCCATCCAGGAGGTGAGTGAGGGGCGGCAGTCGGAGGTCTTCCAGCGCTACCCTGACGGCAGCTTCGACCCCAACTGCTGCTTCAGCATCTACCACGGCAGCCACCGCGAGTCGCTGGACCTGGTCTCCACCAGCAGCGAGGTGGCGCGCACCTGGGTCACTGGCCTGCGCTACCTCATGGCCGGCATCAGCGACGAGGACAGCCTGGCTCGCCGCCAGCGCACCAGGGACCAATGGCTGAAGCAGACGTTTGACGAGGCCGACAAGAACGGGGATGGCAGCCTGAGCATTGGCGAGGTCCTGCAGCTGCTGCACAAGCTCAACGTGAACCTGCCCCGGCAGAGGGTGAAGCAGATGTTCAGGGAAGCGGACACGGATGACCACCAAGGGACGCTGGGTTTTGAAGAGTTCTGTGCCTTCTACAAGATGATGTCCACCCGCCGGGACCTCTACCTGCTCATGCTGACCTACAGCAACCACAAGGACCACCTGGATGCCGCCAGCCTGCAGCGCTTCCTGCAGGTGGAGCAGAAGATGGCGGGTGTGACCCTCGAGAGCTGCCAGGACATCATCGAGCAGTTTGAGCCATGCCCAGAAAACAAGAGTAAGGGGCTGCTGGGCATTGATGGCTTCACCAACTACACCAGGAGCCCTGCTGGTGACATCTTCAACCCTGAGCACCACCATGTGCACCAGGACATGACGCAGCCGCTGAGCCACTACTTCATCACCTCGTCCCACAACACCTACCTCGTGGGTGACCAGCTCATGTCCCAGTCACGGGTGGACATGTATGCTTGGGTCCTGCAGGCTGGCTGCCGCTGCGTGGAGGTGGACTGCTGGGATGGGCCCGACGGGGAGCCCATTGTGCACCATGGCTACACTCTGACTTCCAAGATCCTCTTCAAAGACGTCATTGAAACCATCAACAAATATGCCTTCATCAAGAATGAGTACCCAGTGATCCTGTCCATCGAAAACCACTGCAGTGTCATCCAGCAGAAGAAAATGGCCCAGTATCTGACTGACATCCTTGGGGACAAGCTGGACCTGTCATCAGTGAGCAGTGAAGATGCCACCACACTCCCCTCTCCACAGATGCTCAAGGGCAAGATCCTCGTGAAGGGGAAGAAGCTCCCAGCCAACATCAGCGAGGATGCGGAGGAAGGCGAGGTGTCTGATGAGGACAGTGCTGATGAGATTGACGATGACTGCAAGCTCCTCAATGGGGATGCATCCACCAATCGAAAGCGTGTAGAAAACACTGCTAAGAGGAAACTGGATTCCCTCATCAAAGAGTCGAAGATTCGGGACTGTGAGGACCCCAACAACTTCTCCGTCTCCACACTGTCCCCATCTGGAAAGCTCGGACGCAAGAGCAAGGCTGAAGAGGACGTGGAGTCTGGGGAGGATGCCGGGGCCAGCAGACGCAATGGCCGCCTCGTCGTGGGAAGCTTCTCCAGGCGCAAGAAGAAGGGCAGCAAGCTGAAGAAGGCGGCCAGCGTGGAGGAGGGAGATGAGGGTCAGGACTCCCCGGGAGGCCAGAGCCGAGGGGCGACCCGGCAGAAGAAGACCATGAAGCTGTCCCGGGCCCTCTCTGACCTGGTGAAGTACACCAAGTCCGTGGCCACCCACGACATAGAGATGGAGGCGGCGTCCAGCTGGCAGGTGTCGTCCTTCAGCGAGACCAAGGCCCACCAGATTCTGCAGCAGAAGCCGGCGCAGTACCTACGCTTCAACCAGCAGCAGCTCTCCCGCATCTACCCCTCCTCCTACCGTGTGGACTCCAGCAACTACAACCCGCAGCCCTTCTGGAACGCCGGCTGCCAAATGGTTGCCCTGAACTACCAGTCAGAGGGGCGGATGCTGCAGCTGAACCGAGCCAAGTTCAGCGCCAACGGTGGCTGCGGCTACGTACTCAAGCCTGGGTGCATGTGCCAGGGCGTGTTCAACCCCAACTCGGAGGACCCCCTGCCCGGGCAGCTCAAGAAGCAGCTGGTGCTCCGGATCATCAGTGGCCAGCAGCTTCCCAAGCCGCGCGACTCCATGCTGGGGGACCGTGGGGAGATCATCGACCCCTTTGTGGAGGTGGAGATCATTGGGCTCCCTGTGGACTGCAGCAGGGAGCAGACCCGCGTGGTGGACGACAACGGGTTCAACCCCACCTGGGAGGAGACCCTGGTTTTCATGGTGCACATGCCGGAGATCGCGCTGGTCCGCTTCCTCGTCTGGGACCACGATCCCATCGGGCGTGACTTCATTGGCCAGAGGACGCTGGCCTTCAGCAGCATGATGCCAGGCTACAGACACGTGTACCTAGAAGGGATGGAAGAGGCCTCCATCTTCGTGCATGTGGCTGTCAGTGACATCAGCGGTAAGGTCAAGCAGGCTCTGGGCCTAAAAGGCCTCTTCCTCCGAGGCCCAAAGCCCGGCTCGCTGGACAGTCATGCTGCTGGGCGGCCCCCGGCCCGGCCCTCCGTTAGCCAGCGGATCCTGCGGCGCACGGCCAGCGCCCCGACCAAGAGCCAGAAGCCGGGCCGCAGGGGCTTCCCGGAGCTGGTCCTGGGTACACGGGACACAGGCTCCAAGGGGGTGGCAGACGATGTGGTGCCCCCCGGGCCCGGACCTGCTCCGGAAGCCCCAGCCCAGGAGGGGCCCGGCAGCGGCAGCCCCCGAGGTAAGGCGCCAGCTGCGGTGGCAGAGAAGAGCCCTGTGCGAGTGCGGCCCCCGCGTGTCCTGGACGGCCCCGGGCCTGCTGGGATGGCCGCCACATGCATGAAGTGTGTGGTGGGATCCTGCGCCGGCGTGAACACCGGGGGCCTGCAGAGGGAGCGGCCACCCAGCCCGGGGCCTGCAAGCAGGCAGGCAGCCATTCGCCAGCAGCCCCGGGCCCGGGCTGACTCACTGGGGGCCCCCTGCTGTGGCCTGGACCCTCACGCTATCCCGGGGAGAAGCAGAGAGGCCCCCAAGGGTCCTGGGGCCTGGAGGCAGGGTCCAGGCGGTAGCGGCTCCATGTCCTCGGACTCCAGCAGCCCAGACAGCCCGGGCATCCCCGAAAGGTCCCCCCGCTGGCCTGAGGGTGCCTGCAGGCAACCGGGGGCCCTGCAGGGAGAGATGAGTGCCTTGTTTGCTCAAAAGCTGGAGGAGATCAGGAGTAAATCCCCCATGTTCTCCGCCGTTAGGAACTGAGAGCGGCGAGTGACAGGTAACGGGGCCCAGCCCCGGTGTCCCGTGCTGTCCCAGCCCAAGGAGGGCCCCGTGTGCGGCACAGGGCGTGGACTGGGCCCCAGCAGCAGCAGGGTGGGGACACCGAGTGTGCCGCGCCCGGGGGATGCCTCGGGGTGGGAGCTGGGCCTGGCGACCCTCGGCACAGGGCACCGGGGACACCACCCTGATCCGACTCCTCTCCGCCTCTCTCCCTGCCTCCCTCTCTCTCTTCTGCTTCTCCCTCTGGCTCTCTCTCACTCCCCCACCTCCCCACAGACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGCTCAGGAAACAGGGCAGCCAGGCCCCCAAAACTGTGTCCCCCTGGCTGCCCTGTGTCCCCTCCACCCCTGCCTCCCTCCTGCCCCTGCTCCCGGGGAGGAAAGGCTAAAGCTGCTGGCCCGGGGCCCACAGGAGGGGCTTCGAGGCTGGCCCTGCCAGGCAGTTTTCCCGGCGTTTTAGGATCTGTACATAGAGAAATATTTAAATTTTTAGAAGCAAAACTTATACAACATTAAAATGATACCAAGTCCC +>ENST00000419816 +GCGGCTGCGTCAGGGATTCCTTGGTGGCCCTGGAGGGTGGATAGGCTGGCCTGGGGGCCATCAGGACAGCAGGTGACGGTCAGGCCAATGCCAGCCGGGCCTGGGCACAGCCCTGTGGGGGCTTCGGAGGGCCCTGAGGAGGAGGAGGAAGAGGCAGAGGAGAGAAGGCCCCACGGAGGTCCTGTCGCCAGCGCTGCCACTGCCTGACCTCCGCTGCCCGAAGGCCGGTGGGCCTCTGTGGCCTCCGTGAAGCAGGCCCGGCTGTCGTCAGGCCATGTCTGGTCCATGGCCCTCCCCCGACAGCCGGACCAAGGGAACGGTGGCCTGGCTGGCGGAGGTACTCCTCTGGGTTGGAGGGAGTGTGGTGCTGTCTTCAGAGTGGCAGCTCGGCCCCCTGGTGGAGCGGTGCATGGGTGCCATGCAAGAGGGGATGCAGATGGTGAAGCTGCGTGGCGGCTCCAAGGGCCTGGTCCGCTTCTACTACCTGGACGAGCACCGCTCCTGCATCCGCTGGAGGCCCTCACGCAAGAACGAGAAGGCCAAGATCTCCATCGACTCCATCCAGGAGGTGAGTGAGGGGCGGCAGTCGGAGGTCTTCCAGCGCTACCCTGACGGCAGCTTCGACCCCAACTGCTGCTTCAGCATCTACCACGGCAGCCACCGCGAGTCGCTGGACCTGGTCTCCACCAGCAGCGAGGTGGCGCGCACCTGGGTCACTGGCCTGCGCTACCTCATGGCCGGCATCAGCGACGAGGACAGCCTGGCTCGCCGCCAGCGCACCAGGGACCAATGGCTGAAGCAGACGTTTGACGAGGCCGACAAGAACGGGGATGGCAGCCTGAGCATTGGCGAGGTCCTGCAGCTGCTGCACAAGCTCAACGTGAACCTGCCCCGGCAGAGGGTGAAGCAGATGTTCAGGGAAGCGGACACGGATGACCACCAAGGGACGCTGGGTTTTGAAGAGTTCTGTGCCTTCTACAAGATGATGTCCACCCGCCGGGACCTCTACCTGCTCATGCTGACCTACAGCAACCACAAGGACCACCTGGATGCCGCCAGCCTGCAGCGCTTCCTGCAGGTGGAGCAGAAGATGGCGGGTGTGACCCTCGAGAGCTGCCAGGACATCATCGAGCAGTTTGAGCCATGCCCAGAAAACAAGAGTAAGGGGCTGCTGGGCATTGATGGCTTCACCAACTACACCAGGAGCCCTGCTGGTGACATCTTCAACCCTGAGCACCACCATGTGCACCAGGACATGACGCAGCCGCTGAGCCACTACTTCATCACCTCGTCCCACAACACCTACCTCGTGGGTGACCAGCTCATGTCCCAGTCACGGGTGGACATGTATGCTTGGGTCCTGCAGGCTGGCTGCCGCTGCGTGGAGGTGGACTGCTGGGATGGGCCCGACGGGGAGCCCATTGTGCACCATGGCTACACTCTGACTTCCAAGATCCTCTTCAAAGACGTCATTGAAACCATCAACAAATATGCCTTCATCAAGAATGAGTACCCAGTGATCCTGTCCATCGAAAACCACTGCAGTGTCATCCAGCAGAAGAAAATGGCCCAGTATCTGACTGACATCCTTGGGGACAAGCTGGACCTGTCATCAGTGAGCAGTGAAGATGCCACCACACTCCCCTCTCCACAGATGCTCAAGGGCAAGATCCTCGTGAAGGGGAAGAAGCTCCCAGCCAACATCAGCGAGGATGCGGAGGAAGGCGAGGTGTCTGATGAGGACAGTGCTGATGAGATTGACGATGACTGCAAGCTCCTCAATGGGGATGCATCCACCAATCGAAAGCGTGTAGAAAACACTGCTAAGAGGAAACTGGATTCCCTCATCAAAGAGTCGAAGATTCGGGACTGTGAGGACCCCAACAACTTCTCCGTCTCCACACTGTCCCCATCTGGAAAGCTCGGACGCAAGAGCAAGGCTGAAGAGGACGTGGAGTCTGGGGAGGATGCCGGGGCCAGCAGACGCAATGGCCGCCTCGTCGTGGGAAGCTTCTCCAGGCGCAAGAAGAAGGGCAGCAAGCTGAAGAAGGCGGCCAGCGTGGAGGAGGGAGATGAGGGTCAGGACTCCCCGGGAGGCCAGAGCCGAGGGGCGACCCGGCAGAAGAAGACCATGAAGCTGTCCCGGGCCCTCTCTGACCTGGTGAAGTACACCAAGTCCGTGGCCACCCACGACATAGAGATGGAGGCGGCGTCCAGCTGGCAGGTGTCGTCCTTCAGCGAGACCAAGGCCCACCAGATTCTGCAGCAGAAGCCGGCGCAGTACCTACGCTTCAACCAGCAGCAGCTCTCCCGCATCTACCCCTCCTCCTACCGTGTGGACTCCAGCAACTACAACCCGCAGCCCTTCTGGAACGCCGGCTGCCAAATGGTTGCCCTGAACTACCAGTCAGAGGGGCGGATGCTGCAGCTGAACCGAGCCAAGTTCAGCGCCAACGGTGGCTGCGGCTACGTACTCAAGCCTGGGTGCATGTGCCAGGGCGTGTTCAACCCCAACTCGGAGGACCCCCTGCCCGGGCAGCTCAAGAAGCAGCTGGTGCTCCGGATCATCAGTGGCCAGCAGCTTCCCAAGCCGCGCGACTCCATGCTGGGGGACCGTGGGGAGATCATCGACCCCTTTGTGGAGGTGGAGATCATTGGGCTCCCTGTGGACTGCAGCAGGGAGCAGACCCGCGTGGTGGACGACAACGGGTTCAACCCCACCTGGGAGGAGACCCTGGTTTTCATGGTGCACATGCCGGAGATCGCGCTGGTCCGCTTCCTCGTCTGGGACCACGATCCCATCGGGCGTGACTTCATTGGCCAGAGGACGCTGGCCTTCAGCAGCATGATGCCAGGCTACAGACACGTGTACCTAGAAGGGATGGAAGAGGCCTCCATCTTCGTGCATGTGGCTGTCAGTGACATCAGCGGTAAGGTCAAGCAGGCTCTGGGCCTAAAAGGCCTCTTCCTCCGAGGCCCAAAGCCCGGCTCGCTGGACAGTCATGCTGCTGGGCGGCCCCCGGCCCGGCCCTCCGTTAGCCAGCGGATCCTGCGGCGCACGGCCAGCGCCCCGACCAAGAGCCAGAAGCCGGGCCGCAGGGGCTTCCCGGAGCTGGTCCTGGGTACACGGGACACAGGCTCCAAGGGGGTGGCAGACGATGTGGTGCCCCCCGGGCCCGGACCTGCTCCGGAAGCCCCAGCCCAGGAGGGGCCCGGCAGCGGCAGCCCCCGAGACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGCTCAGGAAACAGGGCAGCCAGGCCCCCAAAACTGTGTCCCCCTGGCTGCCCTGTGTCCCCTCCACCCCTGCCTCCCTCCTGCCCCTGCTCCCGGGGAGGAAAGGCTAAAGCTGCTGGCCCGGGGCCCACAGGAGGGGCTTCGAGGCTGGCCCTGCCAGGCAGTTTTCCCGGCGTTTTAGGATCTGTACATAGAGAAATATTTAAATTTTTAGAAGCAAAACTTATACAACATTAAAATGATACCAAGTCC +>ENST00000378486 +GCGGCTGCGTCAGGGATTCCTTGGTGGCCCTGGAGGGTGGATAGGCTGGCCTGGGGGCCATCAGGACAGCAGGTGACGGTCAGGCCAATGCCAGCCGGGCCTGGGCACAGCCCTGTGGGGGCTTCGGAGGGCCCTGAGGAGGAGGAGGAAGAGGCAGAGGAGAGAAGGCCCCACGGAGGTCCTGTCGCCAGCGCTGCCACTGCCTGACCTCCGCTGCCCGAAGGCCGGTGGGCCTCTGTGGCCTCCGTGAAGCAGGCCCGGCTGTCGTCAGGCCATGTCTGGTCCATGGCCCTCCCCCGACAGCCGGACCAAGGGAACGGTGGCCTGGCTGGCGGAGGTACTCCTCTGGGTTGGAGGGAGTGTGGTGCTGTCTTCAGAGTGGCAGCTCGGCCCCCTGGTGGAGCGGTGCATGGGTGCCATGCAAGAGGGGATGCAGATGGTGAAGCTGCGTGGCGGCTCCAAGGGCCTGGTCCGCTTCTACTACCTGGACGAGCACCGCTCCTGCATCCGCTGGAGGCCCTCACGCAAGAACGAGAAGGCCAAGATCTCCATCGACTCCATCCAGGAGGTGAGTGAGGGGCGGCAGTCGGAGGTCTTCCAGCGCTACCCTGACGGCAGCTTCGACCCCAACTGCTGCTTCAGCATCTACCACGGCAGCCACCGCGAGTCGCTGGACCTGGTCTCCACCAGCAGCGAGGTGGCGCGCACCTGGGTCACTGGCCTGCGCTACCTCATGGCCGGCATCAGCGACGAGGACAGCCTGGCTCGCCGCCAGCGCACCAGGGACCAGTGGCTGAAGCAGACGTTTGACGAGGCCGACAAGAACGGGGATGGCAGCCTGAGCATTGGCGAGGTCCTGCAGCTGCTGCACAAGCTCAACGTGAACCTGCCCCGGCAGAGGGTGAAGCAGATGTTCAGGGAAGCGGACACGGATGACCACCAAGGGACGCTGGGTTTTGAAGAGTTCTGTGCCTTCTACAAGATGATGTCCACCCGCCGGGACCTCTACCTGCTCATGCTGACCTACAGCAACCACAAGGACCACCTGGATGCCGCCAGCCTGCAGCGCTTCCTGCAGGTGGAGCAGAAGATGGCGGGTGTGACCCTCGAGAGCTGCCAGGACATCATCGAGCAGTTTGAGCCATGCCCAGAAAACAAGAGTAAGGGGCTGCTGGGCATTGATGGCTTCACCAACTACACCAGGAGCCCTGCTGGTGACATCTTCAACCCTGAGCACCACCATGTGCACCAGGACATGACGCAGCCGCTGAGCCACTACTTCATCACCTCGTCCCACAACACCTACCTCGTGGGTGACCAGCTCATGTCCCAGTCACGGGTGGACATGTATGCTTGGGTCCTGCAGGCTGGCTGCCGCTGCGTGGAGGTGGACTGCTGGGATGGGCCCGACGGGGAGCCCATTGTGCACCATGGCTACACTCTGACTTCCAAGATCCTCTTCAAAGACGTCATTGAAACCATCAACAAATATGCCTTCATCAAGAATGAGTACCCAGTGATCCTGTCCATCGAAAACCACTGCAGTGTCATCCAGCAGAAGAAAATGGCCCAGTATCTGACTGACATCCTTGGGGACAAGCTGGACCTGTCATCAGTGAGCAGTGAAGATGCCACCACACTCCCCTCTCCACAGATGCTCAAGGGCAAGATCCTCGTGAAGGGGAAGAAGCTCCCAGCCAACATCAGCGAGGATGCGGAGGAAGGCGAGGTGTCTGATGAGGACAGTGCTGATGAGATTGACGATGACTGCAAGCTCCTCAATGGGGATGCATCCACCAATCGAAAGCGTGTAGAAAACACTGCTAAGAGGAAACTGGATTCCCTCATCAAAGAGTCGAAGATTCGGGACTGTGAGGACCCCAACAACTTCTCCGTCTCCACACTGTCCCCATCTGGAAAGCTCGGACGCAAGAGCAAGGCTGAAGAGGACGTGGAGTCTGGGGAGGATGCCGGGGCCAGCAGACGCAATGGCCGCCTCGTCGTGGGAAGCTTCTCCAGGCGCAAGAAGAAGGGCAGCAAGCTGAAGAAGGCGGCCAGCGTGGAGGAGGGAGATGAGGGTCAGGACTCCCCGGGAGGCCAGAGCCGAGGGGCGACCCGGCAGAAGAAGACCATGAAGCTGTCCCGGGCCCTCTCTGACCTGGTGAAGTACACCAAGTCCGTGGCCACCCACGACATAGAGATGGAGGCGGCGTCCAGCTGGCAGGTGTCGTCCTTCAGCGAGACCAAGGCCCACCAGATTCTGCAGCAGAAGCCGGCGCAGTACCTACGCTTCAACCAGCAGCAGCTCTCCCGCATCTACCCCTCCTCCTACCGTGTGGACTCCAGCAACTACAACCCGCAGCCCTTCTGGAACGCCGGCTGCCAAATGGTTGCCCTGAACTACCAGTCAGAGGGGCGGATGCTGCAGCTGAACCGAGCCAAGTTCAGCGCCAACGGTGGCTGCGGCTACGTACTCAAGCCTGGGTGCATGTGCCAGGGCGTGTTCAACCCCAACTCGGAGGACCCCCTGCCCGGGCAGCTCAAGAAGCAGCTGGTGCTCCGGATCATCAGTGGCCAGCAGCTTCCCAAGCCGCGCGACTCCATGCTGGGGGACCGTGGGGAGATCATCGACCCCTTTGTGGAGGTGGAGATCATTGGGCTCCCTGTGGACTGCAGCAGGGAGCAGACCCGCGTGGTGGACGACAACGGGTTCAACCCCACCTGGGAGGAGACCCTGGTTTTCATGGTGCACATGCCGGAGATCGCGCTGGTCCGCTTCCTCGTCTGGGACCACGATCCCATCGGGCGTGACTTCATTGGCCAGAGGACGCTGGCCTTCAGCAGCATGATGCCAGGCTACAGACACGTGTACCTAGAAGGGATGGAAGAGGCCTCCATCTTCGTGCATGTGGCTGTCAGTGACATCAGCGGTAAGGTCAAGCAGGCTCTGGGCCTAAAAGGCCTCTTCCTCCGAGGCCCAAAGCCCGGCTCGCTGGACAGTCATGCTGCTGGGCGGCCCCCGGCCCGGCCCTCCGTTAGCCAGCGGATCCTGCGGCGCACGGCCAGCGCCCCGACCAAGAGCCAGAAGCCGGGCCGCAGGGGCTTCCCGGAGCTGGTCCTGGGTACACGGGACACAGGCTCCAAGGGGGTGGCAGACGATGTGGTGCCCCCCGGGCCCGGACCTGCTCCGGAAGCCCCAGCCCAGGAGGGGCCCGGCAGCGGCAGCCCCCGAGACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGCTCAGGAAACAGGGCAGCCAGGCCCCCAAAACTGTGTCCCCCTGGCTGCCCTGTGTCCCCTCCACCCCTGCCTCCCTCCTGCCCCTGCTCCCGGGGAGGAAAGGCTAAAGCTGCTGGCCCGGGGCCCACAGGAGGGGCTTCGAGGCTGGCCCTGCCAGGCAGTTTTCCCGGCGTTTTAGGATCTGTACATAGAGAAATATTTAAATTTTTAGAAGCAAAACTTATACAACATTAAAATGATACCAAGTCC +>ENST00000343889 +CACAGGGAACGGGTAGGGTCCCACGGTTTGGGGAGAGACATGGCAGTCCTCAAGGGCTGGGATCAGGGCGCAGCCAGGGTTTCTGATGGCTTTGCTGATGGTCAGGACCCAGGCATGCCAGGCAAGGCCTCAGCCCAGCAGTTGCCAAGCGTGTAGCCACTTTGGGCCCGTGGAGAGAGTCGCGCTGCGGAGCCCCCAGGGGGACCTGAGGTCACAAGAGCCTCGATGCACCTGAGCGCGGAGCTGGGGGTCCCTGGAGCCGCTGTCCCCACCTGCGGCGCTGGAGCCCTGGAGGTGTCCAGGGGCTTCCTTGGAACGTGGAGACGTGCTGGTTAAACGTGGAGCCCCGGGCCAGCCGGGCACTGGGGGCTGCAGGTGGAGGGAGGTGGATGCTCTCCCTCGTGGGGGCGTGTCTTTTCCACAGGAAAGGGAAAGGGGGAGGGACACGGGTCAGCAGTGGGGGGCTGTGCAGTCTCGCAGATCTTCACCCTTGGTTCTTGAACTCTGGACCCTGAGCCCTGCCGAGGGTCCCGCAAAGGTGGGCAAGGAGCTCCCGGCTGCTTGGTCTCCGCAGTGTTGGGGCTGCCAGCAGGGGGACGCTGGGCCCCCGGGGACCTGACCCGTGCTCCCTCCCCACCCCGCAGTCTCCATCGACTCCATCCAGGAGGTGAGTGAGGGGCGGCAGTCGGAGGTCTTCCAGCGCTACCCTGACGGCAGCTTCGACCCCAACTGCTGCTTCAGCATCTACCACGGCAGCCACCGCGAGTCGCTGGACCTGGTCTCCACCAGCAGCGAGGTGGCGCGCACCTGGGTCACTGGCCTGCGCTACCTCATGGCCGGCATCAGCGACGAGGACAGCCTGGCTCGCCGCCAGCGCACCAGGGACCAATGGCTGAAGCAGACGTTTGACGAGGCCGACAAGAACGGGGATGGCAGCCTGAGCATTGGCGAGGTCCTGCAGCTGCTGCACAAGCTCAACGTGAACCTGCCCCGGCAGAGGGTGAAGCAGATGTTCAGGGAAGCGGACACGGATGACCACCAAGGGACGCTGGGTTTTGAAGAGTTCTGTGCCTTCTACAAGATGATGTCCACCCGCCGGGACCTCTACCTGCTCATGCTGACCTACAGCAACCACAAGGACCACCTGGATGCCGCCAGCCTGCAGCGCTTCCTGCAGGTGGAGCAGAAGATGGCGGGTGTGACCCTCGAGAGCTGCCAGGACATCATCGAGCAGTTTGAGCCATGCCCAGAAAACAAGAGTAAGGGGCTGCTGGGCATTGATGGCTTCACCAACTACACCAGGAGCCCTGCTGGTGACATCTTCAACCCTGAGCACCACCATGTGCACCAGGACATGACGCAGCCGCTGAGCCACTACTTCATCACCTCGTCCCACAACACCTACCTCGTGGGTGACCAGCTCATGTCCCAGTCACGGGTGGACATGTATGCTTGGGTCCTGCAGGCTGGCTGCCGCTGCGTGGAGGTGGACTGCTGGGATGGGCCCGACGGGGAGCCCATTGTGCACCATGGCTACACTCTGACTTCCAAGATCCTCTTCAAAGACGTCATTGAAACCATCAACAAATATGCCTTCATCAAGAATGAGTACCCAGTGATCCTGTCCATCGAAAACCACTGCAGTGTCATCCAGCAGAAGAAAATGGCCCAGTATCTGACTGACATCCTTGGGGACAAGCTGGACCTGTCATCAGTGAGCAGTGAAGATGCCACCACACTCCCCTCTCCACAGATGCTCAAGGGCAAGATCCTCGTGAAGGGGAAGAAGCTCCCAGCCAACATCAGCGAGGATGCGGAGGAAGGCGAGGTGTCTGATGAGGACAGTGCTGATGAGATTGACGATGACTGCAAGCTCCTCAATGGGGATGCATCCACCAATCGAAAGCGTGTAGAAAACACTGCTAAGAGGAAACTGGATTCCCTCATCAAAGAGTCGAAGATTCGGGACTGTGAGGACCCCAACAACTTCTCCGTCTCCACACTGTCCCCATCTGGAAAGCTCGGACGCAAGAGCAAGGCTGAAGAGGACGTGGAGTCTGGGGAGGATGCCGGGGCCAGCAGACGCAATGGCCGCCTCGTCGTGGGAAGCTTCTCCAGGCGCAAGAAGAAGGGCAGCAAGCTGAAGAAGGCGGCCAGCGTGGAGGAGGGAGATGAGGGTCAGGACTCCCCGGGAGGCCAGAGCCGAGGGGCGACCCGGCAGAAGAAGACCATGAAGCTGTCCCGGGCCCTCTCTGACCTGGTGAAGTACACCAAGTCCGTGGCCACCCACGACATAGAGATGGAGGCGGCGTCCAGCTGGCAGGTGTCGTCCTTCAGCGAGACCAAGGCCCACCAGATTCTGCAGCAGAAGCCGGCGCAGTACCTACGCTTCAACCAGCAGCAGCTCTCCCGCATCTACCCCTCCTCCTACCGTGTGGACTCCAGCAACTACAACCCGCAGCCCTTCTGGAACGCCGGCTGCCAAATGGTTGCCCTGAACTACCAGTCAGAGGGGCGGATGCTGCAGCTGAACCGAGCCAAGTTCAGCGCCAACGGTGGCTGCGGCTACGTACTCAAGCCTGGGTGCATGTGCCAGGGCGTGTTCAACCCCAACTCGGAGGACCCCCTGCCCGGGCAGCTCAAGAAGCAGCTGGTGCTCCGGATCATCAGTGGCCAGCAGCTTCCCAAGCCGCGCGACTCCATGCTGGGGGACCGTGGGGAGATCATCGACCCCTTTGTGGAGGTGGAGATCATTGGGCTCCCTGTGGACTGCAGCAGGGAGCAGACCCGCGTGGTGGACGACAACGGGTTCAACCCCACCTGGGAGGAGACCCTGGTTTTCATGGTGCACATGCCGGAGATCGCGCTGGTCCGCTTCCTCGTCTGGGACCACGATCCCATCGGGCGTGACTTCATTGGCCAGAGGACGCTGGCCTTCAGCAGCATGATGCCAGGCTACAGACACGTGTACCTAGAAGGGATGGAAGAGGCCTCCATCTTCGTGCATGTGGCTGTCAGTGACATCAGCGGTAAGGTCAAGCAGGCTCTGGGCCTAAAAGGCCTCTTCCTCCGAGGCCCAAAGCCCGGCTCGCTGGACAGTCATGCTGCTGGGCGGCCCCCGGCCCGGCCCTCCGTTAGCCAGCGGATCCTGCGGCGCACGGCCAGCGCCCCGACCAAGAGCCAGAAGCCGGGCCGCAGGGGCTTCCCGGAGCTGGTCCTGGGTACACGGGACACAGGCTCCAAGGGGGTGGCAGACGATGTGGTGCCCCCCGGGCCCGGACCTGCTCCGGAAGCCCCAGCCCAGGAGGGGCCCGGCAGCGGCAGCCCCCGAGGTAAGGCGCCAGCTGCGGTGGCAGAGAAGAGCCCTGTGCGAGTGCGGCCCCCGCGTGTCCTGGACGGCCCCGGGCCTGCTGGGATGGCCGCCACATGCATGAAGTGTGTGGTGGGATCCTGCGCCGGCGTGAACACCGGGGGCCTGCAGAGGGAGCGGCCACCCAGCCCGGGGCCTGCAAGCAGGCAGGCAGCCATTCGCCAGCAGCCCCGGGCCCGGGCTGACTCACTGGGGGCCCCCTGCTGTGGCCTGGACCCTCACGCTATCCCGGGGAGAAGCAGAGAGGCCCCCAAGGGTCCTGGGGCCTGGAGGCAGGGTCCAGGCGGTAGCGGCTCCATGTCCTCGGACTCCAGCAGCCCAGACAGCCCGGGCATCCCCGAAAGGTCCCCCCGCTGGCCTGAGGGTGCCTGCAGGCAACCGGGGGCCCTGCAGGGAGAGATGAGTGCCTTGTTTGCTCAAAAGCTGGAGGAGATCAGGAGTAAATCCCCCATGTTCTCCGCCGGTAAGCCCCTCTTGCCCTGCGTGGTCCTCCCGCACGCCCCTGGCATGGCTGGGCCTGGGTCACCTGCTGCTGCTTCTGCGTGGACGGTGTCGCCTCGTGTGCTCGTGCTCGTGGCTCTGTATCCGTGGCACTGTCTCCGTGGCACTCTGCTCCCTTGGCTTGCCTGTGGCCCATAGCCCCAGCCCTCCTGTCTGAGCTTGAGGCCCTGGGACTTGGGTGGAGCTGGTTTGAGGCCCGACAGGCTGGGAAGAACCAGCTGCTCTTGCTGAGGGTCTGGGGCCGGGACTGTGGCCTGACATGCTGGGCCCCTCCGGCTGGGCGCTTCCCCAAACTCACCTCCTGGGCGGCTGGCGACCTGCATGGCCCCTGATGCCTTTCCTGGGACTGGGGGCCACGTACCATCCCATTCCCACCTCCCTCTAGGGCAGGCTCCAGGGGTCCCTACTGGGAAGTCTGATGTGGGCAGGTAGTGCAGCTGCTGGGCGTCTCCTGCGCCCCTGGGACGCCTGGAGCCTGCTGAGTGCTGCGTGGAGTAGATTCCCTGGGCCCCAGGGCTTCGCTGCTTTGGGCTGAAGCACCCCACTAGAAGGGTGTCTCCTTAGCCTGGAGGGAGGGACATACACGGAGCCCGCCCCACACCACCCTGCCCCTCCAGACCCCCCTGACCAAGCTTTCCTTTCTGCCCCCACCCACGCTGCCTCCGTAGTTAGGAACTGAGAGCGGCGAGTGACAGGTAACGGGGCCCAGCCCCGGTGTCCCGTGCTGTCCCAGCCCAAGGAGGGCCCCGTGTGCGGCACAGGGCGTGGACTGGGCCCCAGCAGCAGCAGGGTGGGGACACCGAGTGTGCCGCGCCCGGGGGATGCCTCGGGGTGGGAGCTGGGCCTGGCGACCCTCGGCACAGGGCACCGGGGACACCACCCTGATCCGACTCCTCTCCGCCTCTCTCCCTGCCTCCCTCTCTCTCTTCTGCTTCTCCCTCTGGCTCTCTCTCACTCCCCCACCTCCCCACAGACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGCTCAGGAAACAGGGCAGCCAGGCCCCCAAAACTGTGTCCCCCTGGCTGCCCTGTGTCCCCTCCACCCCTGCCTCCCTCCTGCCCCTGCTCCCGGGGAGGAAAGGCTAAAGCTGCTGGCCCGGGGCCCACAGGAGGGGCTTCGAGGCTGGCCCTGCCAGGCAGTTTTCCCGGCGTTTTAGGATCTGTACATAGAGAAATATTTAAATTTTTAGAAGCAAAACTTATACAACATTAAAATGATACCAAGTCCCTTTC +>ENST00000278878 +GGCGCGCACCTGGGTCACTGGCCTGCGCTACCTCATGGCCGGCATCAGCGACGAGGACAGCCTGGCTCGCCGCCAGCGCACCAGGGACCAATGGCTGAAGCAGACGTTTGACGAGGCCGACAAGAACGGGGATGGCAGCCTGAGCATTGGCGAGGTCCTGCAGCTGCTGCACAAGCTCAACGTGAACCTGCCCCGGCAGAGGGTGAAGCAGATGTTCAGGGAAGCGGACACGGATGACCACCAAGGGACGCTGGGTTTTGAAGAGTTCTGTGCCTTCTACAAGATGATGTCCACCCGCCGGGACCTCTACCTGCTCATGCTGACCTACAGCAACCACAAGGACCACCTGGATGCCGCCAGCCTGCAGCGCTTCCTGCAGGTGGAGCAGAAGATGGCGGGTGTGACCCTCGAGAGCTGCCAGGACATCATCGAGCAGTTTGAGCCATGCCCAGAAAACAAGAGTAAGGGGCTGCTGGGCATTGATGGCTTCACCAACTACACCAGGAGCCCTGCTGGTGACATCTTCAACCCTGAGCACCACCATGTGCACCAGGACATGACGCAGCCGCTGAGCCACTACTTCATCACCTCGTCCCACAACACCTACCTCGTGGGTGACCAGCTCATGTCCCAGTCACGGGTGGACATGTATGCTTGGGTCCTGCAGGCTGGCTGCCGCTGCGTGGAGGTGGACTGCTGGGATGGGCCCGACGGGGAGCCCATTGTGCACCATGGCTACACTCTGACTTCCAAGATCCTCTTCAAAGACGTCATTGAAACCATCAACAAATATGCCTTCATCAAGAATGAGTACCCAGTGATCCTGTCCATCGAAAACCACTGCAGTGTCATCCAGCAGAAGAAAATGGCCCAGTATCTGACTGACATCCTTGGGGACAAGCTGGACCTGTCATCAGTGAGCAGTGAAGATGCCACCACACTCCCCTCTCCACAGATGCTCAAGGGCAAGATCCTCGTGAAGGGGAAGAAGCTCCCAGCCAACATCAGCGAGGATGCGGAGGAAGGCGAGGTGTCTGATGAGGACAGTGCTGATGAGATTGACGATGACTGCAAGCTCCTCAATGGGGATGCATCCACCAATCGAAAGCGTGTAGAAAACACTGCTAAGAGGAAACTGGATTCCCTCATCAAAGAGTCGAAGATTCGGGACTGTGAGGACCCCAACAACTTCTCCGTCTCCACACTGTCCCCATCTGGAAAGCTCGGACGCAAGAGCAAGGCTGAAGAGGACGTGGAGTCTGGGGAGGATGCCGGGGCCAGCAGACGCAATGGCCGCCTCGTCGTGGGAAGCTTCTCCAGGCGCAAGAAGAAGGGCAGCAAGCTGAAGAAGGCGGCCAGCGTGGAGGAGGGAGATGAGGGTCAGGACTCCCCGGGAGGCCAGAGCCGAGGGGCGACCCGGCAGAAGAAGACCATGAAGCTGTCCCGGGCCCTCTCTGACCTGGTGAAGTACACCAAGTCCGTGGCCACCCACGACATAGAGATGGAGGCGGCGTCCAGCTGGCAGGTGTCGTCCTTCAGCGAGACCAAGGCCCACCAGATTCTGCAGCAGAAGCCGGCGCAGTACCTACGCTTCAACCAGCAGCAGCTCTCCCGCATCTACCCCTCCTCCTACCGTGTGGACTCCAGCAACTACAACCCGCAGCCCTTCTGGAACGCCGGCTGCCAAATGGGCGTGTTCAACCCCAACTCGGAGGACCCCCTGCCCGGGCAGCTCAAGAAGCAGCTGGTGCTCCGGATCATCAGTGGCCAGCAGCTTCCCAAGCCGCGCGACTCCATGCTGGGGGACCGTGGGGAGATCATCGACCCCTTTGTGGAGGTGGAGATCATTGGGCTCCCTGTGGACTGCAGCAGGGAGCAGACCCGCGTGGTGGACGACAACGGGTTCAACCCCACCTGGGAGGAGACCCTGGTTTTCATGGTGCACATGCCGGAGATCGCGCTGGTCCGCTTCCTCGTCTGGGACCACGATCCCATCGGGCGTGACTTCATTGGCCAGAGGACGCTGGCCTTCAGCAGCATGATGCCAGGCTACAGACACGTGTACCTAGAAGGGATGGAAGAGGCCTCCATCTTCGTGCATGTGGCTGTCAGTGACATCAGCGGTAAGGTCAAGCAGGCTCTGGGCCTAAAAGGCCTCTTCCTCCGAGGCCCAAAGCCCGGCTCGCTGGACAGTCATGCTGCTGGGCGGCCCCCGGCCCGGCCCTCCGTTAGCCAGCGGATCCTGCGGCGCACGGCCAGCGCCCCGACCAAGAGCCAGAAGCCGGGCCGCAGGGGCTTCCCGGAGCTGGTCCTGGGTACACGGGACACAGGCTCCAAGGGGGTGGCAGACGATGTGGTGCCCCCCGGGCCCGGACCTGCTCCGGAAGCCCCAGCCCAGGAGGGGCCCGGCAGCGGCAGCCCCCGAGACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGC +>ENST00000473964 +GTGGGGGAACCCTCCTTGCTAGCGTTGCAAAGAAGGGCCCAGCTCCGTCAGGAATCCAGGGATGGAGAACTGGGGAGCCTGGGCCCCACATGAGATTCATGGCAGGACTTGTCTGAGGGGCCCCAGTGCCAGCGACCCAGCCCCCTGTGCCTGGCCCCTCTGTGGGTCTCAGGACCTGGGTCTGGGCTGGGTGTTTGGAGGAACCTCCTCCCGGCTCTCAGACACCTCTGTTTTGTCTGCTGTGGATGACTTCCAGCTTGGTCCCCCTGTGGCCCTGGCAGGAGTATCACCATGGGAGAGGGCAGGACAGGGGCTGGGCGAGCAGGCCTCCCACTAGACCAGGCTACTCCTGCTGTGGACCAGCTACTTCCACCTCTGCCCTTGGCTTGCCCTCCTCAGAGTTCTCAGCCTGAGTGGGCCCTGGGGACACTGTCACCAGAGACCCCACCCCTCATACCCCCAGGGACCCAGACCCACCCCCAGAAGCCATGTGACCTCCTCGGCTCAGCTGTGGGAGGCATGGGCTCTGTCCCACATGCTGCGGTAGCCACAAAGGTGATCCATACTGGGCCAGGTGCACCCCGAGGTGCCCCCCTGGACCACTGCCTCCCTCCCTCCCCCTGGCACCGGCTCCAGTCTCCTATGTGGGGGCTGGGGAGGGGGCTGTTGGCAGCCATGCCCCAGCAAGCAGGGGGCTTGCTGAGGGCTGGGCCACTGACCACCTCCCCGGCATCCCCTCAGGCGTGTTCAACCCCAACTCGGAGGACCCCCTGCCCGGGCAGCTCAAGAAGCAGCTGGTGCTCCGGATCATCAGTGGCCAGCAGCTTCCCAAGCCGCGCGACTCCATGCTGGGGGACCGTGGGGAGATCATCGACCCCTTTGTGGAGGTGGAGATCATTGGGCTCCCTGTGGACTGCAGCAGGGAGCAGACCCGCGTGGTGGACGACAACGGGTTCAACCCCACCTGGGAGGAGACCCTGGTTTTCATGGTGCACATGCCGGAGATCGCGCTGGTCCGCTTCCTCGTCTGGGACCACGATCCCATCGGGCGTGACTTCATTGGCCAGAGGACGCTGGCCTTCAGCAGCATGATGCCAGGCTACAGACACGTGTACCTAGAAGGGATGGAAGAGGCCTCCATCTTCGTGCATGTGGCTGTCAGTGACATCAGCGGTAAGGTGAGTGTCACCCCCTGCCACCAGCCATCATGGGGAGGGGCCACACCAGCCCCTTGTCCCATGCCCCCCCATGTGTCCCCAGTGCTGGGTCCTGAACTCAGGCAGTGAGGCCTAGGGTCCCCTCCCCGGGCCTCTGCTCCTCTATCTCAAGAGGGGCTGCTGTGGGGGCCTGGCTCCTGAGCCACCAGTGCCCACCTCTGATCTCAGGGCTGGCTTTGGGCATCTCGGGCAGGACAGGTCCTGAGTGCTCCGGGCCTTGCCCCGCCCTGTGTCACCCATGCCTGTCTCAGACTCTTGGGGGCCTTGCAGCCTCCACCCCTACAGTGCTGCCATCTGGCTTCTCAGCAGGGACCGAGTGATGCCCCTCTCCCCTCTACTACCCCCCACCCCTCTACTTCCTGGTGTCACGTGGAAGGCAGCTGCCCGGGTTTGCCTGTGACTCCACACCCAGCATGTCTGTCCCCTGCCCCAGGTCAGGGTGGGGCCTCGGCTTCCGCAGGAAGTGGTCTTGGTGCCAGCCCTGCTGCCCTGGCTTTGAGCTGGGGCCCAGTGCCCTCTGGGTCCTGCTGGCTGCAGCTGGCCCTCGGGGAACCCGCACACACAGCAGGAGGGGCCTGCCCAGGCCCAGTGCTGACTCTCTCCTGCCATGCTCTCGGGCCCAGAGGTGCCATCCAGCCCCTGCCGTCTATCCACCCATCTGTTCCTCGTCCCCCAGGCTGCAGGGCTCCCCACGCCACTGCTGTGGCCGCCTCACCTGCTCCCCCTGTCTCTTTGGTCTTGCAGTCGGCTTCTCTATGGCCACAGCCTACTTTTAGAAGTGCAGCTCTGTTAGGAGCCTTGAAGGTACCCGGTGCGCGGGACAGTGCGGCCCGCCGCCCCTGCATGCCCAGGCCGCACCCCATTAGCATCCATGATTCCTGGTAGCATTTGGAGACTGTCGCTCATGTGACGTGGATCATGACATGGCTCCGGGGGCCCTGGCCATCCCCAGCCATAGTGGCATTTACGAGGCAGATCCAGGGTTCAGCTGGGTGGCCGCCTTCTCACTGGCCTCTCCTCCCCTCCCCTCCCTCAGTCCTCCCTCCCCTCCCTCAGTCCTCCCTCCCCTCCCTCAGTCCTCCCTCCCCTCCCTCAGTCCTCCCTCCCCTCCCTCAGCCCCTTCCCTGGCGGGCAGCCCGCTGGAGCCCCCACTGTGCCCCTCCTATCCCCCTCCTTCTCTCTCCTGCCCCCATCTCGGACCCTCAGGCTGTTGGTTCTGAGTTCGCCTCCCACTCCCTCCCTGTCCTTGCCAACCATGCCAGTGCATGGGATGAGGGCACCCCTGAGGCCGGCGCTCCGAGCCAGAATCCCGGATCTGCTTCTAAATGGCTTCCCAGCCACTGTGACCAAATGCGTAGATTTGGGATCTTGAATCAGGAAGCTGATTCAAGTGCTGGCCATCTGAACGCATCTGCCCAGAGGCGCCCCTGCAGGGGGGTGACCCACCTGCCGGGCCTGGGCCGCTCTGTGCACGAGCACGGCTCGTCATGGGGGCGCGGTGGGTGCTGTCTCGGGGGCATCTGGCATGTGAGGGCCCCTCTGGCCTCTGCGCCCTGGAGATGCGGCTGCCTCCCTCTCAGCAGCTGTTCTGCCCAGGCAGGGACCTCCTGGGCCCAGCTGTCCAGGAAGATTGGCTGTGGCCAGGTGCTGGTGGGCTGGGAGTCTGAGCCCATCTTGGCAGGGCTCAGGGGGCAGCAAGCCAGCTGCGGGCCTTGGGGGCTCACATGAGTGGAGGGCAGGGCAAGACCAGAAAAGGCTGCCTGGGGGAATTCAGGAAGGCTTCCTGGAAGAGGTGGTACTTCCTAGGGCACGAGTATCACCATGGGAGTGGGCAGGACACGGGCCGGGCAAGTGGGCCTCCCGCTGCACCTGGCTACTCCTGCTGTGGACCAGCTACTCCTGCCTGAGGGTGGGGCACACACAACCAGGGAGTGCCACGCCAGTGTCCCCTGCTAGCGCCGGGGGCTGCGGGCCTCTGAGCAGGTGCAGGCTGTGGTGGGCCAGGCTGGGGCTCGAGGTCTCTCCTCCGGAGGGAAAGACCTTCTCTCCATGCCCCTCAAGGGCCCCACATGCCCTGGACAGGTCAGGCGAGGGCAGTTTCTGCCGGAAGGGTGGGGTGGGCCATGTGTACTTAGATCTGTAGCAGCTACTGTCCCAGGCAGAGCTGCCCTAGGGACCCTGCTCCTGAAGGCCCTGGTGTGTCCACACACCCCCAGCCTGAGGTGGCCCAGCCCCTCGGACCGAGACACGCATGGCACGTCTGTGGCACGGTCTGGAGAGCTGGCCCTGGGGGAGCAGCTGCAGCTGGGCTGGGACCCCTGGCAACAGCTACATGGGCTCCTTCTCTTGCAGGTCAAGCAGGCTCTGGGCCTAAAAGGCCTCTTCCTCCGAGGCCCAAAGCCCGGCTCGCTGGACAGTCATGCTGCTGGGCGGCCCCCGGCCCGGCCCTCCGTTAGCCAGCGGATCCTGCGGCGCACGGCCAGCGCCCCGACCAAGAGCCAGAAGCCGGGCCGCAGGGGCTTCCCGGAGCTGGTCCTGGGTACACGGGACACAGGCTCCAAGGGGGTGGCAGACGATGTGGTGCCCCCCGGGCCCGGACCTGCTCCGGAAGCCCCAGCCCAGGAGGGGCCCGGCAGCGGCAGCCCCCGAGGTAAGGCGCCAGCTGCGGTGGCAGAGAAGAGCCCTGTGCGAGTGCGGCCCCCGCGTGTCCTGGACGGCCCCGGGCCTGCTGGGATGGCCGCCACATGCATGAAGTGTGTGGTGGGATCCTGCGCCGGCGTGAACACCGGGGGCCTGCAGAGGGAGCGGCCACCCAGCCCGGGGCCTGCAAGCAGGCAGGCAGCCATTCGCCAGCAGCCCCGGGCCCGGGCTGACTCACTGGGGGCCCCCTGCTGTGGCCTGGACCCTCACGCTATCCCGGGGAGAAGCAGAGAGGCCCCCAAGGGTCCTGGGGCCTGGAGGCAGGGTCCAGGCGGTAGCGGCTCCATGTCCTCGGACTCCAGCAGCCCAGACAGCCCGGGCATCCCCGAAAGGTCCCCCCGCTGGCCTGAGGGTGCCTGCAGGCAACCGGGGGCCCTGCAGGGAGAGATGAGTGCCTTGTTTGCTCAAAAGCTGGAGGAGATCAGGAGTAAATCCCCCATGTTCTCCGCCGGTAAGCCCCTCTTGCCCTGCGTGGTCCTCCCGCACGCCCCTGGCATGGCTGGGCCTGGGTCACCTGCTGCTGCTTCTGCGTGGACGGTGTCGCCTCGTGTGCTCGTGCTCGTGGCTCTGTATCCGTGGCACTGTCTCCGTGGCACTCTGCTCCCTTGGCTTGCCTGTGGCCCATAGCCCCAGCCCTCCTGTCTGAGCTTGAGGCCCTGGGACTTGGGTGGAGCTGGTTTGAGGCCCGACAGGCTGGGAAGAACCAGCTGCTCTTGCTGAGGGTCTGGGGCCGGGACTGTGGCCTGACATGCTGGGCCCCTCCGGCTGGGCGCTTCCCCAAACTCACCTCCTGGGCGGCTGGCGACCTGCATGGCCCCTGATGCCTTTCCTGGGACTGGGGGCCACGTACCATCCCATTCCCACCTCCCTCTAGGGCAGGCTCCAGGGGTCCCTACTGGGAAGTCTGATGTGGGCAGGTAGTGCAGCTGCTGGGCGTCTCCTGCGCCCCTGGGACGCCTGGAGCCTGCTGAGTGCTGCGTGGAGTAGATTCCCTGGGCCCCAGGGCTTCGCTGCTTTGGGCTGAAGCACCCCACTAGAAGGGTGTCTCCTTAGCCTGGAGGGAGGGACATACACGGAGCCCGCCCCACACCACCCTGCCCCTCCAGACCCCCCTGACCAAGCTTTCCTTTCTGCCCCCACCCACGCTGCCTCCGTAGTTAGGAACTGAGAGCGGCGAGTGACAGGTAACGGGGCCCAGCCCCGGTGTCCCGTGCTGTCCCAGCCCAAGGAGGGCCCCGTGTGCGGCACAGGGCGTGGACTGGGCCCCAGCAGCAGCAGGGTGGGGACACCGAGTGTGCCGCGCCCGGGGGATGCCTCGGGGTGGGAGCTGGGCCTGGCGACCCTCGGCACAGGGCACCGGGGACACCACCCTGATCCGACTCCTCTCCGCCTCTCTCCCTGCCTCCCTCTCTCTCTTCTGCTTCTCCCTCTGGCTCTCTCTCACTCCCCCACCTCCCCACAGACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGCTCAGGAAACAGGGCAGCCAGGCCCCCAAAACTGTGTCCCCCTGGCTGCCCTGTGTCCCCTCCACCCCTGCCTCCCTCCTGCCCCTGCTCCCGGGGAGGAAAGGCTAAAGCTGCTGGCCCGGGGCCCACAGGAGGGGCTTCGAGGCTGGCCCTGCCAGGCAGTTTTCCCGGCGTTTTAGGATCTGTACATAGAGAAATATTTAAATTTTTAGAAGCAAAACTTATACAACATTAAAATGATACCAAGTCCCTT +>ENST00000462379 +GGTGGGGGCCAGCCCCACACAGGCGGGAGGGGTGGGAGTTGGGGGCGGGCCGGGCATCGCGATGGGCCCTGATGCCACCCCCACTCCTGTGTCCCAGATCATCGACCCCTTTGTGGAGGTGGAGATCATTGGGCTCCCTGTGGACTGCAGCAGGGAGCAGACCCGCGTGGTGGACGACAACGGGTTCAACCCCACCTGGGAGGAGACCCTGGTTTTCATGGTGCACATGCCGGAGATCGCGCTGGTCCGCTTCCTCGTCTGGGACCACGATCCCATCGGGCGTGACTTCATTGGCCAGAGGACGCTGGCCTTCAGCAGCATGATGCCAGGCTACAGACACGTGTACCTAGAAGGGATGGAAGAGGCCTCCATCTTCGTGCATGTGGCTGTCAGTGACATCAGCGGTAAGGTCAAGCAGGCTCTGGGCCTAAAAGGCCTCTTCCTCCGAGGCCCAAAGCCCGGCTCGCTGGACAGTCATGCTGCTGGGCGGCCCCCGGCCCGGCCCTCCGTTAGCCAGCGGATCCTGCGGCGCACGGCCAGCGCCCCGACCAAGAGCCAGAAGCCGGGCCGCAGGGGCTTCCCGGAGCTGGTCCTGGGTACACGGGACACAGGCTCCAAGGGGGTGGCAGACGATGTGGTGCCCCCCGGGCCCGGACCTGCTCCGGAAGCCCCAGCCCAGGAGGGGCCCGGCAGCGGCAGCCCCCGAGTTAGGAACTGAGAGCGGCGAGTGACAGACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGCTCAGGAAACAGGGCAGCCAGGCCCCCAAAACTGTGTCCCCCTGGCTGCCCTGTGTCCCCTCCACCCCTGCCTCCCTCCTGCCCCTGCTCCCGGGGAGGAAAGGCTAAAGCTGCTGGCCCGGGGCCCACAGGAGGGGCTTCGAGGCTGGCCCTGCCAGGCAGTTTTCCCGGCGTTTTAGGATCTGTACATAGAGAAATATTTAAATTTTTAGAAGCAAAACTTATACAACATTAAAATGATACCAAGTCCCTT +>ENST00000511072 +GGTGTCCAAACTGACAATGCTGGGGAGATGAAGATAGTGTGTGGCTGCTTCTGGACTCAAGGAGGAGGAGAGAGATTCCGCGAGCCGACACCATGCGATCCAAGGCGAGGGCGAGGAAGCTAGCCAAAAGTGACGGTGACGTTGTAAATAATATGTATGAGCCCAACCGGGACCTGCTGGCCAGCCACAGCGCGGAGGACGAGGCCGAGGACAGTGCCATGTCGCCCATCCCCGTGGGGCCACCGTCCCCCTTCCCCACCAGCGAGGACTTCACCCCCAAGGAGGGCTCGCCGTACGAGGCCCCTGTCTACATTCCTGAAGACATTCCGATCCCAGCAGACTTCGAGCTCCGAGAGTCCTCCATCCCAGGGGCTGGCCTGGGGGTCTGGGCCAAGAGGAAGATGGAAGCCGGGGAGAGGCTGGGCCCCTGCGTGGTGGTGCCCCGGGCGGCGGCAAAGGAGACAGACTTCGGATGGGAGCAAATACTGACGGACGTGGAAGTGTCGCCCCAGGAAGGCTGCATCACAAAGCAGATCTCCGAAGACCTGGGCAGTGAGAAGTTCTGCGTGGATGCAAATCAGGCGGGGGCTGGCAGCTGGCTCAAGTACATCCGTGTGGCGTGCTCCTGCGATGACCAGAACCTCACCATGTGTCAGATCAGTGAGCAGATTTACTATAAAGTCATTAAGGACATTGAGCCAGGTGAGGAGCTGCTGGTGCACGTGAAGGAAGGCGTCTACCCCCTGGGCACAGTGCCGCCCGGCCTGGACGAGGAGCCCACGTTCCGCTGTGACGAGTGTGACGAACTCTTCCAGTCCAAGCTGGACCTGCGGCGCCATAAGAAGTACACGTGTGGCTCAGTGGGGGCTGCGCTCTACGAGGGCCTGGCTGAGGAGCTCAAGCCCGAGGGCCTTGGCGGTGGCAGCGGCCAAGCCCACGAGTGCAAGGACTGCGAGCGGATGTTCCCCAACAAGTACAGCCTGGAGCAGCACATGGTCATCCACACGGAGGAGCGCGAGTACAAATGCGACCAGTGTCCCAAGGCCTTCAACTGGAAGTCCAACCTCATCCGCCACCAGATGTCCCACGACAGCGGCAAACGCTTCGAATGTGAAAACTGCGTGAAGGTGTTCACGGACCCCAGCAACCTTCAGCGGCACATCCGCTCGCAGCACGTGGGCGCTCGGGCCCACGCCTGCCCCGACTGCGGGAAGACCTTCGCCACGTCCTCCGGCCTCAAGCAGCACAAGCATATCCACAGCACGGTGAAGCCTTTCATATGTGAGGTCTGCCACAAGTCCTACACGCAGTTCTCCAACCTGTGCCGGCACAAGCGGATGCACGCCGACTGCCGCACGCAGATCAAGTGCAAGGACTGTGGCCAGATGTTCAGCACTACCTCCTCCCTCAACAAGCACCGGCGCTTCTGCGAGGGCAAGAACCATTACACGCCGGGCGGCATCTTTGCCCCGGGCCTGCCCTTGACCCCCAGCCCCATGATGGACAAGGCAAAACCCTCCCCCAGCCTCAATCACGCCAGCCTGGGCTTCAACGAGTACTTTCCCTCCAGGCCGCACCCGGGGAGCCTGCCCTTCTCCACGGCGCCTCCCACGTTCCCCGCACTCACCCCCGGCTTCCCGGGCATCTTCCCTCCATCCTTGTACCCCCGGCCGCCTCTGCTACCTCCCACATCGCTGCTCAAGAGCCCCCTGAACCACACCCAGGACGCCAAGCTCCCCAGTCCCCTGGGGAACCCAGCCCTGCCCCTGGTCTCCGCCGTCAGCAACAGCAGCCAGGGCACGACGGCAGCTGCGGGGCCCGAGGAGAAGTTCGAGAGCCGCCTGGAGGACTCCTGTGTGGAGAAGCTGAAGACCAGGAGCAGCGACATGTCGGACGGCAGTGACTTTGAGGACGTCAACACCACCACGGGGACCGACCTGGACACGACCACGGGGACGGGCTCGGACCTGGACAGCGACGTGGACAGCGACCCTGACAAGGACAAGGGCAAGGGCAAGTCCGCCGAGGGCCAGCCCAAGTTTGGGGGCGGCTTGGCGCCCCCGGGGGCCCCGAACAGCGTGGCCGAGGTGCCTGTCTTCTATTCCCAGCACTCATTCTTCCCGCCACCCGACGAGCAGCTGCTGACTGCAACGGGCGCCGCCGGGGACTCCATCAAGGCCATCGCATCCATTGCCGAGAAGTACTTTGGCCCCGGCTTCATGGGGATGCAGGAGAAGAAGCTGGGCTCGCTCCCCTACCACTCGGCGTTCCCCTTCCAGTTCCTGCCCAACTTCCCCCACTCCCTTTACCCCTTCACGGACCGAGCCCTCGCCCACAACTTGCTGGTCAAGGCCGAGCCAAAGTCACCCCGGGACGCCCTCAAGGTGGGCGGCCCCAGTGCCGAGTGCCCCTTTGATCTCACCACCAAGCCCAAAGACGTGAAGCCCATCCTGCCCATGCCCAAGGGCCCCTCGGCCCCCGCATCCGGCGAGGAGCAGCCGCTGGACCTGAGCATCGGCAGCCGGGCCCGTGCCAGCCAAAACGGCGGCGGGCGGGAGCCCCGCAAGAACCACGTCTATGGGGAACGCAAGCTGGGCGCCGGCGAGGGGCTGCCCCAGGTGTGCCCGGCGCGGATGCCCCAGCAGCCCCCGCTCCACTACGCCAAGCCCTCGCCCTTCTTCATGGACCCCATCTACAGCAGGGTAGAAAAGCGGAAGGTCACAGACCCCGTGGGAGCCCTGAAGGAGAAGTACCTGCGGCCGTCCCCGCTGCTCTTCCACCCCCAGATGTCAGCCATAGAGACCATGACAGAGAAGCTGGAGAGCTTTGCAGCCATGAAGGCGGACTCGGGCAGCTCCCTGCAGCCCCTCCCCCACCACCCCTTCAACTTCCGGTCCCCACCCCCAACGCTCTCCGACCCCATCCTCAGGAAGGGCAAGGAGCGATACACGTGCAGGTACTGTGGGAAGATCTTCCCCAGATCAGCCAATCTCACCAGACACCTGAGGACGCACACTGGGGAGCAGCCGTACAGGTGTAAGTACTGCGACCGCTCCTTCAGCATCTCTTCGAACCTCCAGCGGCACGTCCGGAACATCCACAACAAGGAGAAGCCTTTCAAGTGCCACCTGTGCAACCGCTGCTTCGGGCAGCAGACCAACCTGGACCGGCACCTCAAGAAGCACGAGCACGAGAACGCACCAGTGAGCCAGCACCCCGGGGTCCTCACGAACCACCTGGGGACCAGCGCGTCCTCTCCCACCTCAGAGTCGGACAACCACGCACTTTTAGACGAGAAAGAAGACTCTTATTTCTCGGAAATCAGAAACTTTATTGCCAATAGTGAGATGAACCAAGCATCAACGCGAACAGAGAAACGGGCGGACATGCAGATCGTGGACGGCAGTGCCCAGTGTCCAGGCCTAGCCAGTGAGAAGCAGGAGGACGTGGAGGAGGAGGACGACGATGACCTGGAGGAGGACGATGAGGACAGCCTGGCCGGGAAGTCGCAGGATGACACCGTGTCCCCCGCACCCGAGCCCCAGGCCGCCTACGAGGATGAGGAGGATGAGGAGCCAGCCGCCTCCCTGGCCGTGGGCTTTGACCACACCCGAAGGCATATGCAATGATGCTGTCCCTTTCCGAAGACACTCCTCTCCACACCCCCTCCCAGGGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCTCCCCACCCACCATGGTTCATTCCGACTTTTCCAATGGAAACTCAGATCCCAAAAGTCCCTAAAGCAGTCGTAGAGTCTCACCATCTCCAAGGATTGGTCTTGAGAACACTGTTCAGTGACGGCCATGCAGGTGGCCGTCCAAAGACAGCCAACGGAGCTGCCTCGCAGAATCAGCCAGTGGGCAGGTGGACGCTCTGCTGAGACAGAAGCTGGTGGCCACTGCCGGGTGCCCGCGTGGGGTCGCGGAAGGGAATGGATAGACTGGTGTGCTCAAAAGAGAGAGATCACTCAAATGATTTTTATAATGAAATGACAAGAATAACCCTTTTGGTAACCGTATTGACTGCAGAGTCTATTTAAGCATGTGGTTTTAAAAATAGACAGTATTTTTTAAAAATCAAAAAATGACTTGCAAAT +>ENST00000607632 +AATGCTGGGGAGATGAAGATAGTGTGTGGCTGCTTCTGGACTCAAGGAGGAGGAGAGAGATTCCGCGAGCCGACACCATGCGATCCAAGGCGAGGGCGAGGAAGCTAGCCAAAAGTGACGGTGACGTTGTAAATAATATGTATGAGCCCAACCGGGACCTGCTGGCCAGCCACAGCGCGGAGGACGAGGCCGAGGACAGTGCCATGTCGCCCATCCCCGTGGGGCCACCGTCCCCCTTCCCCACCAGCGAGGACTTCACCCCCAAGGAGGGCTCGCCGTACGAGGCCCCTGTCTACATTCCTGAAGACATTCCGATCCCAGCAGACTTCGAGCTCCGAGAGTCCTCCATCCCAGGGGCTGGCCTGGGGGTCTGGGCCAAGAGGAAGATGGAAGCCGGGGAGAGGCTGGGCCCCTGCGTGGTGGTGCCCCGGGCGGCGGCAAAGGAGACAGACTTCGGATGGGAGGTGAGCGATCGCGCCTGAGTATGATTGATCACGGCCATTTATCTTGTGTTCAATCTATTTATAAAGCCGGGCTGAGCAGCCACTGCCCGAGGCGGGAGGCGCGGCCAGAGAGAGCGT +>ENST00000378391 +GAAGATAGTGTGTGGCTGCTTCTGGACTCAAGGAGGAGGAGAGAGATTCCGCGAGCCGACACCATGCGATCCAAGGCGAGGGCGAGGAAGCTAGCCAAAAGTGACGGTGACGTTGTAAATAATATGTATGAGCCCAACCGGGACCTGCTGGCCAGCCACAGCGCGGAGGACGAGGCCGAGGACAGTGCCATGTCGCCCATCCCCGTGGGGCCACCGTCCCCCTTCCCCACCAGCGAGGACTTCACCCCCAAGGAGGGCTCGCCGTACGAGGCCCCTGTCTACATTCCTGAAGACATTCCGATCCCAGCAGACTTCGAGCTCCGAGAGTCCTCCATCCCAGGGGCTGGCCTGGGGGTCTGGGCCAAGAGGAAGATGGAAGCCGGGGAGAGGCTGGGCCCCTGCGTGGTGGTGCCCCGGGCGGCGGCAAAGGAGACAGACTTCGGATGGGAGCAAATACTGACGGACGTGGAAGTGTCGCCCCAGGAAGGCTGCATCACAAAGATCTCCGAAGACCTGGGCAGTGAGAAGTTCTGCGTGGATGCAAATCAGGCGGGGGCTGGCAGCTGGCTCAAGTACATCCGTGTGGCGTGCTCCTGCGATGACCAGAACCTCACCATGTGTCAGATCAGTGAGCAGATTTACTATAAAGTCATTAAGGACATTGAGCCAGGTGAGGAGCTGCTGGTGCACGTGAAGGAAGGCGTCTACCCCCTGGGCACAGTGCCGCCCGGCCTGGACGAGGAGCCCACGTTCCGCTGTGACGAGTGTGACGAACTCTTCCAGTCCAAGCTGGACCTGCGGCGCCATAAGAAGTACACGTGTGGCTCAGTGGGGGCTGCGCTCTACGAGGGCCTGGCTGAGGAGCTCAAGCCCGAGGGCCTTGGCGGTGGCAGCGGCCAAGCCCACGAGTGCAAGGACTGCGAGCGGATGTTCCCCAACAAGTACAGCCTGGAGCAGCACATGGTCATCCACACGGAGGAGCGCGAGTACAAATGCGACCAGTGTCCCAAGGCCTTCAACTGGAAGTCCAACCTCATCCGCCACCAGATGTCCCACGACAGCGGCAAACGCTTCGAATGTGAAAACTGCGTGAAGGTGTTCACGGACCCCAGCAACCTTCAGCGGCACATCCGCTCGCAGCACGTGGGCGCTCGGGCCCACGCCTGCCCCGACTGCGGGAAGACCTTCGCCACGTCCTCCGGCCTCAAGCAGCACAAGCATATCCACAGCACGGTGAAGCCTTTCATATGTGAGGTCTGCCACAAGTCCTACACGCAGTTCTCCAACCTGTGCCGGCACAAGCGGATGCACGCCGACTGCCGCACGCAGATCAAGTGCAAGGACTGTGGCCAGATGTTCAGCACTACCTCCTCCCTCAACAAGCACCGGCGCTTCTGCGAGGGCAAGAACCATTACACGCCGGGCGGCATCTTTGCCCCGGGCCTGCCCTTGACCCCCAGCCCCATGATGGACAAGGCAAAACCCTCCCCCAGCCTCAATCACGCCAGCCTGGGCTTCAACGAGTACTTTCCCTCCAGGCCGCACCCGGGGAGCCTGCCCTTCTCCACGGCGCCTCCCACGTTCCCCGCACTCACCCCCGGCTTCCCGGGCATCTTCCCTCCATCCTTGTACCCCCGGCCGCCTCTGCTACCTCCCACATCGCTGCTCAAGAGCCCCCTGAACCACACCCAGGACGCCAAGCTCCCCAGTCCCCTGGGGAACCCAGCCCTGCCCCTGGTCTCCGCCGTCAGCAACAGCAGCCAGGGCACGACGGCAGCTGCGGGGCCCGAGGAGAAGTTCGAGAGCCGCCTGGAGGACTCCTGTGTGGAGAAGCTGAAGACCAGGAGCAGCGACATGTCGGACGGCAGTGACTTTGAGGACGTCAACACCACCACGGGGACCGACCTGGACACGACCACGGGGACGGGCTCGGACCTGGACAGCGACGTGGACAGCGACCCTGACAAGGACAAGGGCAAGGGCAAGTCCGCCGAGGGCCAGCCCAAGTTTGGGGGCGGCTTGGCGCCCCCGGGGGCCCCGAACAGCGTGGCCGAGGTGCCTGTCTTCTATTCCCAGCACTCATTCTTCCCGCCACCCGACGAGCAGCTGCTGACTGCAACGGGCGCCGCCGGGGACTCCATCAAGGCCATCGCATCCATTGCCGAGAAGTACTTTGGCCCCGGCTTCATGGGGATGCAGGAGAAGAAGCTGGGCTCGCTCCCCTACCACTCGGCGTTCCCCTTCCAGTTCCTGCCCAACTTCCCCCACTCCCTTTACCCCTTCACGGACCGAGCCCTCGCCCACAACTTGCTGGTCAAGGCCGAGCCAAAGTCACCCCGGGACGCCCTCAAGGTGGGCGGCCCCAGTGCCGAGTGCCCCTTTGATCTCACCACCAAGCCCAAAGACGTGAAGCCCATCCTGCCCATGCCCAAGGGCCCCTCGGCCCCCGCATCCGGCGAGGAGCAGCCGCTGGACCTGAGCATCGGCAGCCGGGCCCGTGCCAGCCAAAACGGCGGCGGGCGGGAGCCCCGCAAGAACCACGTCTATGGGGAACGCAAGCTGGGCGCCGGCGAGGGGCTGCCCCAGGTGTGCCCGGCGCGGATGCCCCAGCAGCCCCCGCTCCACTACGCCAAGCCCTCGCCCTTCTTCATGGACCCCATCTACAGCAGGGTAGAAAAGCGGAAGGTCACAGACCCCGTGGGAGCCCTGAAGGAGAAGTACCTGCGGCCGTCCCCGCTGCTCTTCCACCCCCAGATGTCAGCCATAGAGACCATGACAGAGAAGCTGGAGAGCTTTGCAGCCATGAAGGCGGACTCGGGCAGCTCCCTGCAGCCCCTCCCCCACCACCCCTTCAACTTCCGGTCCCCACCCCCAACGCTCTCCGACCCCATCCTCAGGAAGGGCAAGGAGCGATACACGTGCAGGTACTGTGGGAAGATCTTCCCCAGATCAGCCAATCTCACCAGACACCTGAGGACGCACACTGGGGAGCAGCCGTACAGGTGTAAGTACTGCGACCGCTCCTTCAGCATCTCTTCGAACCTCCAGCGGCACGTCCGGAACATCCACAACAAGGAGAAGCCTTTCAAGTGCCACCTGTGCAACCGCTGCTTCGGGCAGCAGACCAACCTGGACCGGCACCTCAAGAAGCACGAGCACGAGAACGCACCAGTGAGCCAGCACCCCGGGGTCCTCACGAACCACCTGGGGACCAGCGCGTCCTCTCCCACCTCAGAGTCGGACAACCACGCACTTTTAGACGAGAAAGAAGACTCTTATTTCTCGGAAATCAGAAACTTTATTGCCAATAGTGAGATGAACCAAGCATCAACGCGAACAGAGAAACGGGCGGACATGCAGATCGTGGACGGCAGTGCCCAGTGTCCAGGCCTAGCCAGTGAGAAGCAGGAGGACGTGGAGGAGGAGGACGACGATGACCTGGAGGAGGACGATGAGGACAGCCTGGCCGGGAAGTCGCAGGATGACACCGTGTCCCCCGCACCCGAGCCCCAGGCCGCCTACGAGGATGAGGAGGATGAGGAGCCAGCCGCCTCCCTGGCCGTGGGCTTTGACCACACCCGAAGGTGTGCTGAGGACCACGAAGGCGGTCTGTTAGCTTTGGAGCCGATGCCGACTTTTGGGAAGGGGCTGGACCTCCGCAGAGCAGCTGAGGAAGCATTTGAAGTTAAAGATGTGCTTAATTCCACCTTAGATTCTGAGGCTTTAAAACATACACTGTGCAGGCAGGCTAAGAACCAGGGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCTCCCCACCCACCATGGTTCATTCCGACTTTTCCAATGGAAACTCAGATCCCAAAAGTCCCTAAAGCAGTCGTAGAGTCTCACCATCTCCAAGGATTGGTCTTGAGAACACTGTTCAGTGACGGCCATGCAGGTGGCCGTCCAAAGACAGCCAACGGAGCTGCCTCGCAGAATCAGCCAGTGGGCAGGTGGACGCTCTGCTGAGACAGAAGCTGGTGGCCACTGCCGGGTGCCCGCGTGGGGTCGCGGAAGGGAATGGATAGACTGGTGTGCTCAAAAGAGAGAGATCACTCAAATGATTTTTATAATGAAATGACAAGAATAACCCTTTTGGTAACCGTATTGACTGCAGAGTCTATTTAAGCATGTGGTTTTAAAAATAGACAGTATTTTTTAAAAATCAAAAAATGACTTGCAAATTGTTTTTTAAAAGTAATTTTGCATTGCTTTGAAATTTGAGCTCATTTGCAAACCCGAGTCTGCCTGGGAACCCGCACTGTGCCTGGGTGTATTCTTTATACTGTAGATAATGGAGAAATTTTCTATCTCTGTCCCTATTTGTATAAGCCAAGGTGATGCTGGGTGCCCCGAGGCAGAACAAGAGGCGCGGGGCCACACCCGTGAACCATGCAGACGGCCGAAGAAGTCTTAGGCAGGGCGCCCTGGGCTGCAGGCCTGCCCGAGGCTGGGATGGGAAGTGTGCCTGCCCTCGTGTGACATGGAATTGGTGTCAGGACCGCCACGTGGCCTTCAGAGGAATCCACAGGTCCCCACCCAAGATCCCTCAATTATATGGGGAAGTCGAGGGCCTGTGGCTTGGATCCGCCATGCAGAGATGTGGCCGGGCACCCATCTTCCTTCCCTCCTCTGTCCCTGCCTCGGCCACCCCACGCGGGAACCCAGCGCCGTCCTCTGAAGGCAGGGCCTTGGCCACGTCCTGGGTCTCCCACCTCCCACCTGACCCCAGCGGCTCCGGTGTCCTCCACGTGGCTGCCCTGGGGAGCAATCCCAGCGGATCGCTCCGGGCCACCAAGCCGCACCTGTGCCTGAGACTCCGGATGGACGACACAGTCGTCACGTCGCTCTTCCTGCGGGTTCTTGGCGAGACACAGCTTGAGAACAGAAGGGCGTCGGGGGAACCTGCCGCAAGGAGCAGAGACAGCACAGCCCCCCGGGCCCAGCCGCCTCCCTCTCTTGGGACGCAACTTCTTCCCCACTCGGATGGGCTTTAAATTATTCCCATAGGGGCCAATTTCAAATAATAATTTTTTTCCCTGATGGAATTTACCTTAATCTGTATATAACTTGTAATTTTTTCTAATTCATTTCTTTTCTTATTTTATTTCCTCCTTAACAGTATTTTTGGCATTAGACATTCTTATTGTGAAGAAATAATGTTAATATAAGTATCTGGTGAAGGACCAAAACCGTGTGATAAGGTTGTGTGTCGTGTGGGAGTGGGGCGATTTTTTATGTGCCAAATACCCCCGTCCCCCCCA +>ENST00000514189 +GCTGCTTCTGGACTCAAGGAGGAGGAGAGAGATTCCGCGAGCCGACACCATGCGATCCAAGGCGAGGGCGAGGAAGCTAGCCAAAAGTGACGGTGACGTTGTAAATAATATGTATGAGCCCAACCGGGACCTGCTGGCCAGCCACAGCGCGGAGGACGAGGCCGAGGACAGTGCCATGTCGCCCATCCCCGTGGGGCCACCGTCCCCCTTCCCCACCAGCGAGGACTTCACCCCCAAGGAGGGCTCGCCGTACGAGGCCCCTGTCTACATTCCTGAAGACATTCCGATCCCAGCAGACTTCGAGCTCCGAGAGTCCTCCATCCCAGGGGCTGGCCTGGGGGTCTGGGCCAAGAGGAAGATGGAAGCCGGGGAGAGGCTGGGCCCCTGCGTGGTGGTGCCCCGGGCGGCGGCAAAGGAGACAGACTTCGGATGGGAGCAAATACTGACGGACGTGGAAGTGTCGCCCCAGGAAGGCTGCATCACAAAGCAGATCTCCGAAGACCTGGGCAGTGAGAAGTTCTGCGTGGATGCAAATCAGGCGGGGGCTGGCAGCTGGCTCAAGTACATCCGTGTGGCGTGCTCCTGCGATGACCAGAACCTCACCATGTGTCAGATCAGTGAGCAGATTTACTATAAAGTCATTAAGGACATTGAGCCAGGTGAGGAGCTGCTGGTGCACGTGAAGGAAGGCGTCTACCCCCTGGGCACAGTGCCGCCCGGCCTGGACGAGGAGCCCACGTTCCGCTGTGACGAGTGTGACGAACTCTTCCAGTCCAAGCTGGACCTGCGGCGCCATAAGAAGTACACGTGTGGCTCAGTGGGGGCTGCGCTCTACGAGGGCCTGGCTGAGGAGCTCAAGCCCGAGGGCCTTGGCGGTGGCAGCGGCCAAGCCCACGAGTGCAAGGACTGCGAGCGGATGTTCCCCAACAAGTACAGCCTGGAGCAGCACATGGTCATCCACACGGAGGAGCGCGAGTACAAATGCGACCAGTGTCCCAAGGCCTTCAACTGGAAGTCCAACCTCATCCGCCACCAGATGTCCCACGACAGCGGCAAACGCTTCGAATGTGAAAACTGCGTGAAGGTGTTCACGGACCCCAGCAACCTTCAGCGGCACATCCGCTCGCAGCACGTGGGCGCTCGGGCCCACGCCTGCCCCGACTGCGGGAAGACCTTCGCCACGTCCTCCGGCCTCAAGCAGCACAAGCATATCCACAGCACGGTGAAGCCTTTCATATGTGAGGTCTGCCACAAGTCCTACACGCAGTTCTCCAACCTGTGCCGGCACAAGCGGATGCACGCCGACTGCCGCACGCAGATCAAGTGCAAGGACTGTGGCCAGATGTTCAGCACTACCTCCTCCCTCAACAAGCACCGGCGCTTCTGCGAGGGCAAGAACCATTACACGCCGGGCGGCATCTTTGCCCCGGGCCTGCCCTTGACCCCCAGCCCCATGATGGACAAGGCAAAACCCTCCCCCAGCCTCAATCACGCCAGCCTGGGCTTCAACGAGTACTTTCCCTCCAGGCCGCACCCGGGGAGCCTGCCCTTCTCCACGGCGCCTCCCACGTTCCCCGCACTCACCCCCGGCTTCCCGGGCATCTTCCCTCCATCCTTGTACCCCCGGCCGCCTCTGCTACCTCCCACATCGCTGCTCAAGAGCCCCCTGAACCACACCCAGGACGCCAAGCTCCCCAGTCCCCTGGGGAACCCAGCCCTGCCCCTGGTCTCCGCCGTCAGCAACAGCAGCCAGGGCACGACGGCAGCTGCGGGGCCCGAGGAGAAGTTCGAGAGCCGCCTGGAGGACTCCTGTGTGGAGAAGCTGAAGACCAGGAGCAGCGACATGTCGGACGGCAGTGACTTTGAGGACGTCAACACCACCACGGGGACCGACCTGGACACGACCACGGGGACGGGCTCGGACCTGGACAGCGACGTGGACAGCGACCCTGACAAGGACAAGGGCAAGGGCAAGTCCGCCGAGGGCCAGCCCAAGTTTGGGGGCGGCTTGGCGCCCCCGGGGGCCCCGAACAGCGTGGCCGAGGTGCCTGTCTTCTATTCCCAGCACTCATTCTTCCCGCCACCCGACGAGCAGCTGCTGACTGCAACGGGCGCCGCCGGGGACTCCATCAAGGCCATCGCATCCATTGCCGAGAAGTACTTTGGCCCCGGCTTCATGGGGATGCAGGAGAAGAAGCTGGGCTCGCTCCCCTACCACTCGGCGTTCCCCTTCCAGTTCCTGCCCAACTTCCCCCACTCCCTTTACCCCTTCACGGACCGAGCCCTCGCCCACAACTTGCTGGTCAAGGCCGAGCCAAAGTCACCCCGGGACGCCCTCAAGGTGGGCGGCCCCAGTGCCGAGTGCCCCTTTGATCTCACCACCAAGCCCAAAGACGTGAAGCCCATCCTGCCCATGCCCAAGGGCCCCTCGGCCCCCGCATCCGGCGAGGAGCAGCCGCTGGACCTGAGCATCGGCAGCCGGGCCCGTGCCAGCCAAAACGGCGGCGGGCGGGAGCCCCGCAAGAACCACGTCTATGGGGAACGCAAGCTGGGCGCCGGCGAGGGGCTGCCCCAGGTGTGCCCGGCGCGGATGCCCCAGCAGCCCCCGCTCCACTACGCCAAGCCCTCGCCCTTCTTCATGGACCCCATCTACAGGGTAGAAAAGCGGAAGGTCACAGACCCCGTGGGAGCCCTGAAGGAGAAGTACCTGCGGCCGTCCCCGCTGCTCTTCCACCCCCAGATGTCAGCCATAGAGACCATGACAGAGAAGCTGGAGAGCTTTGCAGCCATGAAGGCGGACTCGGGCAGCTCCCTGCAGCCCCTCCCCCACCACCCCTTCAACTTCCGGTCCCCACCCCCAACGCTCTCCGACCCCATCCTCAGGAAGGGCAAGGAGCGATACACGTGCAGGTACTGTGGGAAGATCTTCCCCAGATCAGCCAATCTCACCAGACACCTGAGGACGCACACTGGGGAGCAGCCGTACAGGTGTAAGTACTGCGACCGCTCCTTCAGCATCTCTTCGAACCTCCAGCGGCACGTCCGGAACATCCACAACAAGGAGAAGCCTTTCAAGTGCCACCTGTGCAACCGCTGCTTCGGGCAGCAGACCAACCTGGACCGGCACCTCAAGAAGCACGAGCACGAGAACGCACCAGTGAGCCAGCACCCCGGGGTCCTCACGAACCACCTGGGGACCAGCGCGTCCTCTCCCACCTCAGAGTCGGACAACCACGCACTTTTAGACGAGAAAGAAGACTCTTATTTCTCGGAAATCAGAAACTTTATTGCCAATAGTGAGATGAACCAAGCATCAACGCGAACAGAGAAACGGGCGGACATGCAGATCGTGGACGGCAGTGCCCAGTGTCCAGGCCTAGCCAGTGAGAAGCAGGAGGACGTGGAGGAGGAGGACGACGATGACCTGGAGGAGGACGATGAGGACAGCCTGGCCGGGAAGTCGCAGGATGACACCGTGTCCCCCGCACCCGAGCCCCAGGCCGCCTACGAGGATGAGGAGGATGAGGAGCCAGCCGCCTCCCTGGCCGTGGGCTTTGACCACACCCGAAGGCATATGCAATGATGCTGTCCCTTTCCGAAGACACTCCTCTCCACACCCCCTCCCAGGGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCTCCCCACCCACCATGGTTCATTCCGACTTTTCCAATGGAAACTCAGATCCCAAAAGTCCCTAAAGCAGTCGTAGAGTCTCACCATCTCCAAGGATTGGTCTTGAGAACACTGTTCAGTGACGGCCATGCAGGTGGCCGTCCAAAGACAGCCAACGGAGCTGCCTCGCAGAATCAGCCAGTGGGCAGGTGGACGCTCTGCTGAGACAGAAGCTGGTGGCCACTGCCGGGTGCCCGCGTGGGGTCGCGGAAGGGAATGGATAGACTGGTGTGCTCAAAAGAGAGAGATCACTCAAATGATTTTTATAATGAAATGACAAGAATAACCCTTTTGGTAACCGTATTGACTGCAGAGTCTATTTAAGCATGTGGTTTTAAAAATAGACAGTATTTTTTAAAAATCAAAAAATGACTTGCAAAT +>ENST00000270722 +GCTGCTTCTGGACTCAAGGAGGAGGAGAGAGATTCCGCGAGCCGACACCATGCGATCCAAGGCGAGGGCGAGGAAGCTAGCCAAAAGTGACGGTGACGTTGTAAATAATATGTATGAGCCCAACCGGGACCTGCTGGCCAGCCACAGCGCGGAGGACGAGGCCGAGGACAGTGCCATGTCGCCCATCCCCGTGGGGCCACCGTCCCCCTTCCCCACCAGCGAGGACTTCACCCCCAAGGAGGGCTCGCCGTACGAGGCCCCTGTCTACATTCCTGAAGACATTCCGATCCCAGCAGACTTCGAGCTCCGAGAGTCCTCCATCCCAGGGGCTGGCCTGGGGGTCTGGGCCAAGAGGAAGATGGAAGCCGGGGAGAGGCTGGGCCCCTGCGTGGTGGTGCCCCGGGCGGCGGCAAAGGAGACAGACTTCGGATGGGAGCAAATACTGACGGACGTGGAAGTGTCGCCCCAGGAAGGCTGCATCACAAAGATCTCCGAAGACCTGGGCAGTGAGAAGTTCTGCGTGGATGCAAATCAGGCGGGGGCTGGCAGCTGGCTCAAGTACATCCGTGTGGCGTGCTCCTGCGATGACCAGAACCTCACCATGTGTCAGATCAGTGAGCAGATTTACTATAAAGTCATTAAGGACATTGAGCCAGGTGAGGAGCTGCTGGTGCACGTGAAGGAAGGCGTCTACCCCCTGGGCACAGTGCCGCCCGGCCTGGACGAGGAGCCCACGTTCCGCTGTGACGAGTGTGACGAACTCTTCCAGTCCAAGCTGGACCTGCGGCGCCATAAGAAGTACACGTGTGGCTCAGTGGGGGCTGCGCTCTACGAGGGCCTGGCTGAGGAGCTCAAGCCCGAGGGCCTTGGCGGTGGCAGCGGCCAAGCCCACGAGTGCAAGGACTGCGAGCGGATGTTCCCCAACAAGTACAGCCTGGAGCAGCACATGGTCATCCACACGGAGGAGCGCGAGTACAAATGCGACCAGTGTCCCAAGGCCTTCAACTGGAAGTCCAACCTCATCCGCCACCAGATGTCCCACGACAGCGGCAAACGCTTCGAATGTGAAAACTGCGTGAAGGTGTTCACGGACCCCAGCAACCTTCAGCGGCACATCCGCTCGCAGCACGTGGGCGCTCGGGCCCACGCCTGCCCCGACTGCGGGAAGACCTTCGCCACGTCCTCCGGCCTCAAGCAGCACAAGCATATCCACAGCACGGTGAAGCCTTTCATATGTGAGGTCTGCCACAAGTCCTACACGCAGTTCTCCAACCTGTGCCGGCACAAGCGGATGCACGCCGACTGCCGCACGCAGATCAAGTGCAAGGACTGTGGCCAGATGTTCAGCACTACCTCCTCCCTCAACAAGCACCGGCGCTTCTGCGAGGGCAAGAACCATTACACGCCGGGCGGCATCTTTGCCCCGGGCCTGCCCTTGACCCCCAGCCCCATGATGGACAAGGCAAAACCCTCCCCCAGCCTCAATCACGCCAGCCTGGGCTTCAACGAGTACTTTCCCTCCAGGCCGCACCCGGGGAGCCTGCCCTTCTCCACGGCGCCTCCCACGTTCCCCGCACTCACCCCCGGCTTCCCGGGCATCTTCCCTCCATCCTTGTACCCCCGGCCGCCTCTGCTACCTCCCACATCGCTGCTCAAGAGCCCCCTGAACCACACCCAGGACGCCAAGCTCCCCAGTCCCCTGGGGAACCCAGCCCTGCCCCTGGTCTCCGCCGTCAGCAACAGCAGCCAGGGCACGACGGCAGCTGCGGGGCCCGAGGAGAAGTTCGAGAGCCGCCTGGAGGACTCCTGTGTGGAGAAGCTGAAGACCAGGAGCAGCGACATGTCGGACGGCAGTGACTTTGAGGACGTCAACACCACCACGGGGACCGACCTGGACACGACCACGGGGACGGGCTCGGACCTGGACAGCGACGTGGACAGCGACCCTGACAAGGACAAGGGCAAGGGCAAGTCCGCCGAGGGCCAGCCCAAGTTTGGGGGCGGCTTGGCGCCCCCGGGGGCCCCGAACAGCGTGGCCGAGGTGCCTGTCTTCTATTCCCAGCACTCATTCTTCCCGCCACCCGACGAGCAGCTGCTGACTGCAACGGGCGCCGCCGGGGACTCCATCAAGGCCATCGCATCCATTGCCGAGAAGTACTTTGGCCCCGGCTTCATGGGGATGCAGGAGAAGAAGCTGGGCTCGCTCCCCTACCACTCGGCGTTCCCCTTCCAGTTCCTGCCCAACTTCCCCCACTCCCTTTACCCCTTCACGGACCGAGCCCTCGCCCACAACTTGCTGGTCAAGGCCGAGCCAAAGTCACCCCGGGACGCCCTCAAGGTGGGCGGCCCCAGTGCCGAGTGCCCCTTTGATCTCACCACCAAGCCCAAAGACGTGAAGCCCATCCTGCCCATGCCCAAGGGCCCCTCGGCCCCCGCATCCGGCGAGGAGCAGCCGCTGGACCTGAGCATCGGCAGCCGGGCCCGTGCCAGCCAAAACGGCGGCGGGCGGGAGCCCCGCAAGAACCACGTCTATGGGGAACGCAAGCTGGGCGCCGGCGAGGGGCTGCCCCAGGTGTGCCCGGCGCGGATGCCCCAGCAGCCCCCGCTCCACTACGCCAAGCCCTCGCCCTTCTTCATGGACCCCATCTACAGCAGGGTAGAAAAGCGGAAGGTCACAGACCCCGTGGGAGCCCTGAAGGAGAAGTACCTGCGGCCGTCCCCGCTGCTCTTCCACCCCCAGATGTCAGCCATAGAGACCATGACAGAGAAGCTGGAGAGCTTTGCAGCCATGAAGGCGGACTCGGGCAGCTCCCTGCAGCCCCTCCCCCACCACCCCTTCAACTTCCGGTCCCCACCCCCAACGCTCTCCGACCCCATCCTCAGGAAGGGCAAGGAGCGATACACGTGCAGGTACTGTGGGAAGATCTTCCCCAGATCAGCCAATCTCACCAGACACCTGAGGACGCACACTGGGGAGCAGCCGTACAGGTGTAAGTACTGCGACCGCTCCTTCAGCATCTCTTCGAACCTCCAGCGGCACGTCCGGAACATCCACAACAAGGAGAAGCCTTTCAAGTGCCACCTGTGCAACCGCTGCTTCGGGCAGCAGACCAACCTGGACCGGCACCTCAAGAAGCACGAGCACGAGAACGCACCAGTGAGCCAGCACCCCGGGGTCCTCACGAACCACCTGGGGACCAGCGCGTCCTCTCCCACCTCAGAGTCGGACAACCACGCACTTTTAGACGAGAAAGAAGACTCTTATTTCTCGGAAATCAGAAACTTTATTGCCAATAGTGAGATGAACCAAGCATCAACGCGAACAGAGAAACGGGCGGACATGCAGATCGTGGACGGCAGTGCCCAGTGTCCAGGCCTAGCCAGTGAGAAGCAGGAGGACGTGGAGGAGGAGGACGACGATGACCTGGAGGAGGACGATGAGGACAGCCTGGCCGGGAAGTCGCAGGATGACACCGTGTCCCCCGCACCCGAGCCCCAGGCCGCCTACGAGGATGAGGAGGATGAGGAGCCAGCCGCCTCCCTGGCCGTGGGCTTTGACCACACCCGAAGGTGTGCTGAGGACCACGAAGGCGGTCTGTTAGCTTTGGAGCCGATGCCGACTTTTGGGAAGGGGCTGGACCTCCGCAGAGCAGCTGAGGAAGCATTTGAAGTTAAAGATGTGCTTAATTCCACCTTAGATTCTGAGGCTTTAAAACATACACTGTGCAGGCAGGCTAAGAACCAGGCATATGCAATGATGCTGTCCCTTTCCGAAGACACTCCTCTCCACACCCCCTCCCAGGGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCTCCCCACCCACCATGGTTCATTCCGACTTTTCCAATGGAAACTCAGATCCCAAAAGTCCCTAAAGCAGTCGTAGAGTCTCACCATCTCCAAGGATTGGTCTTGAGAACACTGTTCAGTGACGGCCATGCAGGTGGCCGTCCAAAGACAGCCAACGGAGCTGCCTCGCAGAATCAGCCAGTGGGCAGGTGGACGCTCTGCTGAGACAGAAGCTGGTGGCCACTGCCGGGTGCCCGCGTGGGGTCGCGGAAGGGAATGGATAGACTGGTGTGCTCAAAAGAGAGAGATCACTCAAATGATTTTTATAATGAAATGACAAGAATAACCCTTTTGGTAACCGTATTGACTGCAGAGTCTATTTAAGCATGTGGTTTTAAAAATAGACAGTATTTTTTAAAAATCAAAAAATGACTTGCAAATTGTTTTTTAAAAGTAATTTTGCATTGCTTTGAAATTTGAGCTCATTTGCAAACCCGAGTCTGCCTGGGAACCCGCACTGTGCCTGGGTGTATTCTTTATACTGTAGATAATGGAGAAATTTTCTATCTCTGTCCCTATTTGTATAAGCCAAGGTGATGCTGGGTGCCCCGAGGCAGAACAAGAGGCGCGGGGCCACACCCGTGAACCATGCAGACGGCCGAAGAAGTCTTAGGCAGGGCGCCCTGGGCTGCAGGCCTGCCCGAGGCTGGGATGGGAAGTGTGCCTGCCCTCGTGTGACATGGAATTGGTGTCAGGACCGCCACGTGGCCTTCAGAGGAATCCACAGGTCCCCACCCAAGATCCCTCAATTATATGGGGAAGTCGAGGGCCTGTGGCTTGGATCCGCCATGCAGAGATGTGGCCGGGCACCCATCTTCCTTCCCTCCTCTGTCCCTGCCTCGGCCACCCCACGCGGGAACCCAGCGCCGTCCTCTGAAGGCAGGGCCTTGGCCACGTCCTGGGTCTCCCACCTCCCACCTGACCCCAGCGGCTCCGGTGTCCTCCACGTGGCTGCCCTGGGGAGCAATCCCAGCGGATCGCTCCGGGCCACCAAGCCGCACCTGTGCCTGAGACTCCGGATGGACGACACAGTCGTCACGTCGCTCTTCCTGCGGGTTCTTGGCGAGACACAGCTTGAGAACAGAAGGGCGTCGGGGGAACCTGCCGCAAGGAGCAGAGACAGCACAGCCCCCCGGGCCCAGCCGCCTCCCTCTCTTGGGACGCAACTTCTTCCCCACTCGGATGGGCTTTAAATTATTCCCATAGGGGCCAATTTCAAATAATAATTTTTTTCCCTGATGGAATTTACCTTAATCTGTATATAACTTGTAATTTTTTCTAATTCATTTCTTTTCTTATTTTATTTCCTCCTTAACAGTATTTTTGGCATTAGACATTCTTATTGTGAAGAAATAATGTTAATATAAGTATCTGGTGAAGGACCAAAACCGTGTGATAAGGTTGTGTGTCGTGTGGGAGTGGGGCGATTTTTTATGTGCCAAATACCCCCGTCCCCCCCATGAATCCTGCTGTCCCTGCTGCCGTTTACCAGACAATCATATGTTTTTGTTAAATTTGCGTTTCAGTTACATTTGCATTTAAGACAAGTGTTCTATTTATTTCTTGTATTGTTTGGAAGAAAAAATGATGATAGAGTCCCAAAAAGAAGAGAAAAAAAATGCCCAAGTTGCCCTTTAAAAAAAAAGAGCGTAAATACAAACAGGAGTGGTGCAAGCCGCCTTGGTGTGGGTTTGTGTCACGTGTGGACATCTCCTCAGGCTTTGTGTCACGCGTGGACATCTCCTCAGGCTGTCCCCAGCGGTGACGGGAGGTGTCCTGGCTGCTCCAGGACAAAAGACAATCGTCTCTGTGGGTGCCGGGTGGTCCAGGCTTGCACTGAAGACGTGCCACGGGGAGGCTCCTGCAGGAGGCTCAACCCGACGGATCACAGTGAAAGGGATTCCTCCCACGCCAGATCTGCACAACGAGGCAAGACAGGACCCACCTGTGCGTGCGCTGGGGCCATGGGGTGGCCCCGCCGGGGCAGCGGGGGAGCTGCCTGCAGAAGAGCCAGCTGGCGTGTCGGGAAGGATCCAGGATCTGCAAACACAACTGCTCAGGCCTTCTCACGCGTTTCCACAACATCCCCTGGGTCAGACCCACCAGGTACCCCGTAGGAATTTCCAGTTTCCCTTGATCTAGATGGGATTCTTATAAAAATTCAACCTCAGACATAAACACCCCATTTCTGTAAACCCAAATTATATGGTTTCTTCTGCGAAAGAGTAAGGTGTGTGCTTTTTTTTTTTTGCAATATGACCCCGTCTCTCTGAAGTGGGACATTCGGACGGATGGAGCCCTCAGCGTGTCTTTTCAGCAGGAGCAGAACCGATGAGAGCCGCCCTTACCGTTGGTCTCCGGATCCCCCAGTCCCATCCCGCCGTTTTCGGCTGTCTTCCTAACCGTCCTGTCTTCTCTTGGCGCTCTTTCCTTCCACCTTTCCCAAGAGTCCTGGTTGCACGTTTTAAGTCATATATTTTCGTCCCCCTGAAAATGATGGCAAGCCCAGTTTCTCCTGAGCATTCAGACCCCCAGGCCCCAGCACTTGGCGTTTTCAGGAGGCCCTGTTCTTAGAGCCCCTGACAAAGGCAGCACTTATTTCCTGGGCTGGTGCGCCCCAAAACACGGCCCCGACACTTAGTGTGGCCCCAGGCCCCAGCGAGCCTCGCCCTCCCAGTTTTGCTCTGCCCAGCAGTGTTGGTGCCCAGAGATGACAAGGGCCAGGGAGCCTGGCCCGGGTGTGAGAATTCAGAGATTCTGGCCTCCAGCTGTCACCACACCGTAACGGGGCCATGTAACTGTGCAGCATGGACAGGGATGCGACGGGGCAGCTGGCTGTGTCCATGGCCAGGTGGCCAGGGTCAGGGCTGCAAGCCAGGGGTCCAGGGCCCTTCCGTTCAGCCCAAATGCTGCCCCAATGCTAACTCCTTGGATTGTCAACCCCCATCCCCCAAATGGAAATTCCGAAGGAGGCCTCCTCGCACCTGCCCTCCGCTGCTCCTCAGACCCCAGCCCCCAGCGAGCCGACGTCCCCACCCGTTCCTGCTCTCATCCCCAGGTTGGGCACGTGGGGTTCCTCCTCTGTGGGCCTGGCAGACCCTTCATGAGTGGGACCCAAGATATCACTGACTTCAACCCAGAGGATCGAGCCCCTGCACCCTGCCTGGGGCCCTGGGGTGTGGAGCAGTGGCTGGGGTGGGCGTGGTGTGGCCTGAGAGACTGCCCAGCTGGAGAGGCCTTCCTTTACAAGGCCACGCGTGCAGCTGTCCCATCCAGACCCCGACTGGCCAAGACCTCCACGTCCCCAGAGTCCAGCCCTGGAAATTCCAAGGGCCCTGGCGTCCTCTGCCTTCCCCGCTTCCCCATGAGCGTCTGCAAAACACTTGCCTGAATACATATCACGTATTTTAGACTCGAAGCCTCAAAGCACTGGATTGTGGTCCCCTGCCCCCTCTGTCCCGTCCCCCTGCCCAAGTGACTGAAACCTACTGAGCTATATTCACTGTGCTGTCCTAGGGGGAGGGAGAGCAGAGCTCGCCCCTGCACTGCAGCCTTGTGGGGGAGGGCAAGGCTCTCCTCCCAGCCAGGGACGCCAGGACATAGCTGCTCCTGGTCAGTGGAGGTCAGCCGGGTATCAAAAGCCATGAAACTGTGTCTCTGTAGCAATGAGTGATACTGTGACAAAACCATCCTTGCATTCTTCCTAGAAGAGTTCCTCTGCTCCTTCCATTCCATTTTTGTGTTTGTTTTGTTCTTTTCTGTCACTGATCCGTATTACCACTTTTGGAAAAAAATAAATAAATAAATAAATAAAAGGCAGCTTGAGTTTCCAAACGTGTGATTCACTTGTGAACAAAAGTCATTCTAACAATTGCCTTCAGCGTCACGTGCATTGCCACTGCGCTTTCGGCACGAGGGATGCTGAGCCCTGGTGTCAGAGTCGTAATTTAAAGCGTGTGTGTATATGGACTTTGTCCCTTAAGGTCGATATAAAGAATCCTCGCAGAATCACAGACCTGTGCCGCCCGCCACCTTCTGCCATTGTTACATTACAGATTTGGTTTAGTTTTGTTTTGTTTTGTTTTTTCTTTTAGAACTGTATAGTATTGAAAAAGAAATCAAATGTAAATGTCTGGTTTTCATATAATGTTTAAAAAGACCATTGAGAAGGAGGCTGGCGCTCGCCCCATGTCCCCCTTGATTGTAAATTGCTTCTGTTCTGTTTATAAGTAAACTGTGCATGACTCCTGCTTAGCGGTCATTATCGTGTCTGTTGGTGAAATTTTTATTAAAAGGAAAATTCTGTAGATGCACTTATTGAATATGTGATTAGGATCTACGTCTGAGACTAGGAGTCCTGAACTGCTGACGCGAAAGAGGCGCAGTTCCCAATTAATACGGAAATCGCTGTGGGAGAAGAATGAAATAAGACGTGAAGTGTAGGAAATCATGAAAAGAACAATTTTGCAAATTGCATTCTGATGCTTGTGATGAACACAAATGTACTTGTGTAGAGACATTTCCTTAAGAGAAAGCCTAGGAGAAGCCGATTTGGAGGTTAATGCTGTAGAATAGGACTGTATACCAAATGTAATCTTTCCAATGCTCCAATGAATTTATACATGAGATTGATATGCAATAAATCTGTGTGCTTTTCTAA +>ENST00000512462 +AAGCACAAGGCCCCATCTCACCAGGTCAGCGGAGATGCTGCCTGCCTGGAGCTCGGGTCCCATGGGGTTGGGGGCGAAGATGCTGCATCCCAGTGCTGTTCCCTGCTCGGGGCCCTGGAAGCAGAGCGGCCTGGCTTCTCTCATTGGCCAAAGAGGGTTTGGAAGCAAATACTGACGGACGTGGAAGTGTCGCCCCAGGAAGGCTGCATCACAAAGATCTCCGAAGACCTGGGCAGTGAGAAGTTCTGCGTGGATGCAAATCAGGCGGGGGCTGGCAGCTGGCTCAAGTACATCCGTGTGGCGTGCTCCTGCGATGACCAGAACCTCACCATGTGTCAGATCAGTGAGCAGATTTACTATAAAGTCATTAAGGACATTGAGCCAGGTGAGGAGCTGCTGGTGCACGTGAAGGAAGGCGTCTACCCCCTGGGCACAGTGCCGCCCGGCCTGGACGAGGAGCCCACGTTCCGCTGTGACGAGTGTGACGAACTCTTCCAGTCCAAGCTGGACCTGCGGCGCCATAAGAAGTACACGTGTGGCTCAGTGGGGGCTGCGCTCTACGAGGGCCTGGCTGAGGAGCTCAAGCCCGAGGGCCTTGGCGGTGGCAGCGGCCAAGCCCACGAGTGCAAGGACTGCGAGCGGATGTTCCCCAACAAGTACAGCCTGGAGCAGCACATGGTCATCCACACGGAGGAGCGCGAGTACAAATGCGACCAGTGTCCCAAGGCCTTCAACTGGAAGTCCAACCTCATCCGCCACCAGATGTCCCACGACAGCGGCAAACGCTTCGAATGTGAAAACTGCGTGAAGGTGTTCACGGACCCCAGCAACCTTCAGCGGCACATCCGCTCGCAGCACGTGGGCGCTCGGGCCCACGCCTGCCCCGACTGCGGGAAGACCTTCGCCACGTCCTCCGGCCTCAAGCAGCACAAGCATATCCACAGCACGGTGAAGCCTTTCATATGTGAGGTCTGCCACAAGTCCTACACGCAGTTCTCCAACCTGTGCCGGCACAAGCGGATGCACGCCGACTGCCGCACGCAGATCAAGTGCAAGGACTGTGGCCAGATGTTCAGCACTACCTCCTCCCTCAACAAGCACCGGCGCTTCTGCGAGGGCAAGAACCATTACACGCCGGGCGGCATCTTTGCCCCGGGCCTGCCCTTGACCCCCAGCCCCATGATGGACAAGGCAAAACCCTCCCCCAGCCTCAATCACGCCAGCCTGGGCTTCAACGAGTACTTTCCCTCCAGGCCGCACCCGGGGAGCCTGCCCTTCTCCACGGCGCCTCCCACGTTCCCCGCACTCACCCCCGGCTTCCCGGGCATCTTCCCTCCATCCTTGTACCCCCGGCCGCCTCTGCTACCTCCCACATCGCTGCTCAAGAGCCCCCTGAACCACACCCAGGACGCCAAGCTCCCCAGTCCCCTGGGGAACCCAGCCCTGCCCCTGGTCTCCGCCGTCAGCAACAGCAGCCAGGGCACGACGGCAGCTGCGGGGCCCGAGGAGAAGTTCGAGAGCCGCCTGGAGGACTCCTGTGTGGAGAAGCTGAAGACCAGGAGCAGCGACATGTCGGACGGCAGTGACTTTGAGGACGTCAACACCACCACGGGGACCGACCTGGACACGACCACGGGGACGGGCTCGGACCTGGACAGCGACGTGGACAGCGACCCTGACAAGGACAAGGGCAAGGGCAAGTCCGCCGAGGGCCAGCCCAAGTTTGGGGGCGGCTTGGCGCCCCCGGGGGCCCCGAACAGCGTGGCCGAGGTGCCTGTCTTCTATTCCCAGCACTCATTCTTCCCGCCACCCGACGAGCAGCTGCTGACTGCAACGGGCGCCGCCGGGGACTCCATCAAGGCCATCGCATCCATTGCCGAGAAGTACTTTGGCCCCGGCTTCATGGGGATGCAGGAGAAGAAGCTGGGCTCGCTCCCCTACCACTCGGCGTTCCCCTTCCAGTTCCTGCCCAACTTCCCCCACTCCCTTTACCCCTTCACGGACCGAGCCCTCGCCCACAACTTGCTGGTCAAGGCCGAGCCAAAGTCACCCCGGGACGCCCTCAAGGTGGGCGGCCCCAGTGCCGAGTGCCCCTTTGATCTCACCACCAAGCCCAAAGACGTGAAGCCCATCCTGCCCATGCCCAAGGGCCCCTCGGCCCCCGCATCCGGCGAGGAGCAGCCGCTGGACCTGAGCATCGGCAGCCGGGCCCGTGCCAGCCAAAACGGCGGCGGGCGGGAGCCCCGCAAGAACCACGTCTATGGGGAACGCAAGCTGGGCGCCGGCGAGGGGCTGCCCCAGGTGTGCCCGGCGCGGATGCCCCAGCAGCCCCCGCTCCACTACGCCAAGCCCTCGCCCTTCTTCATGGACCCCATCTACAGCAGGGTAGAAAAGCGGAAGGTCACAGACCCCGTGGGAGCCCTGAAGGAGAAGTACCTGCGGCCGTCCCCGCTGCTCTTCCACCCCCAGATGTCAGCCATAGAGACCATGACAGAGAAGCTGGAGAGCTTTGCAGCCATGAAGGCGGACTCGGGCAGCTCCCTGCAGCCCCTCCCCCACCACCCCTTCAACTTCCGGTCCCCACCCCCAACGCTCTCCGACCCCATCCTCAGGAAGGGCAAGGAGCGATACACGTGCAGGTACTGTGGGAAGATCTTCCCCAGATCAGCCAATCTCACCAGACACCTGAGGACGCACACTGGGGAGCAGCCGTACAGGTGTAAGTACTGCGACCGCTCCTTCAGCATCTCTTCGAACCTCCAGCGGCACGTCCGGAACATCCACAACAAGGAGAAGCCTTTCAAGTGCCACCTGTGCAACCGCTGCTTCGGGCAGCAGACCAACCTGGACCGGCACCTCAAGAAGCACGAGCACGAGAACGCACCAGTGAGCCAGCACCCCGGGGTCCTCACGAACCACCTGGGGACCAGCGCGTCCTCTCCCACCTCAGAGTCGGACAACCACGCACTTTTAGACGAGAAAGAAGACTCTTATTTCTCGGAAATCAGAAACTTTATTGCCAATAGTGAGATGAACCAAGCATCAACGCGAACAGAGAAACGGGCGGACATGCAGATCGTGGACGGCAGTGCCCAGTGTCCAGGCCTAGCCAGTGAGAAGCAGGAGGACGTGGAGGAGGAGGACGACGATGACCTGGAGGAGGACGATGAGGACAGCCTGGCCGGGAAGTCGCAGGATGACACCGTGTCCCCCGCACCCGAGCCCCAGGCCGCCTACGAGGATGAGGAGGATGAGGAGCCAGCCGCCTCCCTGGCCGTGGGCTTTGACCACACCCGAAGGTGTGCTGAGGACCACGAAGGCGGTCTGTTAGCTTTGGAGCCGATGCCGACTTTTGGGAAGGGGCTGGACCTCCGCAGAGCAGCTGAGGAAGCATTTGAAGTTAAAGATGTGCTTAATTCCACCTTAGATTCTGAGGCTTTAAAACATACACTGTGCAGGCAGGCTAAGAACCAGGCATATGCAATGATGCTGTCCCTTTCCGAAGACACTCCTCTCCACACCCCCTCCCAGGGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCT +>ENST00000463591 +ACAAAGATCTCCGAAGACCTGGGCAGTGAGAAGTTCTGCGTGGATGCAAATCAGGCGGGGGCTGGCAGCTGGCTCAAGTACATCCGTGTGGCGTGCTCCTGCGATGACCAGAACCTCACCATGTGTCAGATCAGTGAGCAGATGAAAGTGAAATTGGAGTGAAGGAAAATTGGGCTTGAGGCGCATAGAAGGACGGTCTTTCCGTCCCCTTCTGGGGCTCAGATTTGCAGAGTGTGTCCTTAGTCGTCCGTTGGGAAGCTGACGGGCAGGGGCACCGCGGGGCTGGGCCAGGGCTGTGCTTTTGTGAGATGCAAACTATAGTAATGAAGGGCCCAGATTTTTTTTATTTAAGAAATAAATGTTTATTAGAACTTTTGAACTAAA +>ENST00000509860 +ATTTACTATAAAGTCATTAAGGACATTGAGCCAGGTGAGGAGCTGCTGGTGCACGTGAAGGAAGGCGTCTACCCCCTGGGCACAGTGCCGCCCGGCCTGGACGAGGAGCCCACGTTCCGCTGTGACGAGTGTGACGAACTCTTCCAGTCCAAGCTGGACCTGCGGCGCCATAAGAAGTACACGTGTGGCTCAGTGGGGGCTGCGCTCTACGAGGGCCTGGCTGAGGAGCTCAAGCCCGAGGGCCTTGGCGGTGGCAGCGGCCAAGCCCACGAGTGCAAGGACTGCGAGCGGATGTTCCCCAACAAGTACAGCCTGGAGCAGCACATGGTCATCCACACGGAGGAGCGCGAGTACAAATGCGACCAGTGTCCCAAGGCCTTCAACTGGAAGTCCAACCTCATCCGCCACCAGATGTCCCACGACAGCGGCAAACGCTTCGAATGTGAAAACTGCGTGAAGGTGTTCACGGACCCCAGCAACCTTCAGCGGCACATCCGCTCGCAGCACGTGGGCGCTCGGGCCCACGCCTGCCCCGACTGCGGGAAGACCTTCGCCACGTCCTCCGGCCTCAAGCAGCACAAGCATATCCACAGCACGGTGAAGCCTTTCATATGTGAGGTCTGCCACAAGTCCTACACGCAGTTCTCCAACCTGTGCCGGCACAAGCGGATGCACGCCGACTGCCGCACGCAGATCAAGTGCAAGGACTGTGGCCAGATGTTCAGCACTACCTCCTCCCTCAACAAGCACCGGCGCTTCTGCGAGGGCAAGAACCATTACACGCCGGGCGGCATCTTTGCCCCGGGCCTGCCCTTGACCCCCAGCCCCATGATGGACAAGGCAAAACCCTCCCCCAGCCTCAATCACGCCAGCCTGGGCTTCAACGAGTACTTTCCCTCCAGGCCGCACCCGGGGAGCCTGCCCTTCTCCACGGCGCCTCCCACGTTCCCCGCACTCACCCCCGGCTTCCCGGGCATCTTCCCTCCATCCTTGTACCCCCGGCCGCCTCTGCTACCTCCCACATCGCTGCTCAAGAGCCCCCTGAACCACACCCAGGACGCCAAGCTCCCCAGTCCCCTGGGGAACCCAGCCCTGCCCCTGGTCTCCGCCGTCAGCAACAGCAGCCAGGGCACGACGGCAGCTGCGGGGCCCGAGGAGAAGTTCGAGAGCCGCCTGGAGGACTCCTGTGTGGAGAAGCTGAAGACCAGGAGCAGCGACATGTCGGACGGCAGTGACTTTGAGGACGTCAACACCACCACGGGGACCGACCTGGACACGACCACGGGGACGGGCTCGGACCTGGACAGCGACGTGGACAGCGACCCTGACAAGGACAAGGGCAAGGGCAAGTCCGCCGAGGGCCAGCCCAAGTTTGGGGGCGGCTTGGCGCCCCCGGGGGCCCCGAACAGCGTGGCCGAGGTGCCTGTCTTCTATTCCCAGCACTCATTCTTCCCGCCACCCGACGAGCAGCTGCTGACTGCAACGGGCGCCGCCGGGGACTCCATCAAGGCCATCGCATCCATTGCCGAGAAGTACTTTGGCCCCGGCTTCATGGGGATGCAGGAGAAGAAGCTGGGCTCGCTCCCCTACCACTCGGCGTTCCCCTTCCAGTTCCTGCCCAACTTCCCCCACTCCCTTTACCCCTTCACGGACCGAGCCCTCGCCCACAACTTGCTGGTCAAGGCCGAGCCAAAGTCACCCCGGGACGCCCTCAAGGTGGGCGGCCCCAGTGCCGAGTGCCCCTTTGATCTCACCACCAAGCCCAAAGACGTGAAGCCCATCCTGCCCATGCCCAAGGGCCCCTCGGCCCCCGCATCCGGCGAGGAGCAGCCGCTGGACCTGAGCATCGGCAGCCGGGCCCGTGCCAGCCAAAACGGCGGCGGGCGGGAGCCCCGCAAGAACCACGTCTATGGGGAACGCAAGCTGGGCGCCGGCGAGGGGCTGCCCCAGGTGTGCCCGGCGCGGATGCCCCAGCAGCCCCCGCTCCACTACGCCAAGCCCTCGCCCTTCTTCATGGACCCCATCTACAGGGTAGAAAAGCGGAAGGTCACAGACCCCGTGGGAGCCCTGAAGGAGAAGTACCTGCGGCCGTCCCCGCTGCTCTTCCACCCCCAGATGTCAGCCATAGAGACCATGACAGAGAAGCTGGAGAGCTTTGCAGCCATGAAGGCGGACTCGGGCAGCTCCCTGCAGCCCCTCCCCCACCACCCCTTCAACTTCCGGTCCCCACCCCCAACGCTCTCCGACCCCATCCTCAGGAAGGGCAAGGAGCGATACACGTGCAGGTACTGTGGGAAGATCTTCCCCAGATCAGCCAATCTCACCAGACACCTGAGGACGCACACTGGGGAGCAGCCGTACAGGTGTAAGTACTGCGACCGCTCCTTCAGCATCTCTTCGAACCTCCAGCGGCACGTCCGGAACATCCACAACAAGGAGAAGCCTTTCAAGTGCCACCTGTGCAACCGCTGCTTCGGGCAGCAGACCAACCTGGACCGGCACCTCAAGAAGCACGAGCACGAGAACGCACCAGTGAGCCAGCACCCCGGGGTCCTCACGAACCACCTGGGGACCAGCGCGTCCTCTCCCACCTCAGAGTCGGACAACCACGCACTTTTAGACGAGAAAGAAGACTCTTATTTCTCGGAAATCAGAAACTTTATTGCCAATAGTGAGATGAACCAAGCATCAACGCGAACAGAGAAACGGGCGGACATGCAGATCGTGGACGGCAGTGCCCAGTGTCCAGGCCTAGCCAGTGAGAAGCAGGAGGACGTGGAGGAGGAGGACGACGATGACCTGGAGGAGGACGATGAGGACAGCCTGGCCGGGAAGTCGCAGGATGACACCGTGTCCCCCGCACCCGAGCCCCAGGCCGCCTACGAGGATGAGGAGGATGAGGAGCCAGCCGCCTCCCTGGCCGTGGGCTTTGACCACACCCGAAGGTGTGCTGAGGACCACGAAGGCGGTCTGTTAGCTTTGGAGCCGATGCCGACTTTTGGGAAGGGGCTGGACCTCCGCAGAGCAGCTGAGGAAGCATTTGAAGTTAAAGATGTGCTTAATTCCACCTTAGATTCTGAGGCTTTAAAACATACACTGTGCAGGCAGGCTAAGAACCAGGCATATGCAATGATGCTGTCCCTTTCCGAAGACACTCCTCTCCACACCCCCTCCCAGGGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCTCCCCACCCACCATGGTTCATTCCGACTTTTCCAATGGAAACTCAGATCCCAAAAGTCCCTAAAGCAGTCGTAGAGTCTCACCATCTCCAAGGATTGGTCTTGAGAACACTGTTCAGTGACGGCCATGCAGGTGGCCGTCCAAAGACAGCCAACGGAGCTGCCTCGCAGAATCAGCCAGTGGGCAGGTGGACGCTCTGCTGAGACAGAAGCTGGTGGCCACTGCCGGGTGCCCGCGTGGGGTCGCGGAAGGGAATGGATAGACTGGTGTGCTCAAAAGAGAGAGATCACTCAAATGATTTTTATAATGAAATGACAAGAATAACCCTTTTGGTAACCGTATTGACTGCAGAGTCTATTTAAGCATGTGG +>ENST00000378389 +TGCCGGCCCCGCGGCCTGGGGGCCAGGGAGACCCAGACAACAGAGGGCAGGAGACGCCGGAGGGTCGGGCGCACCGCCTGCCCAGGGGACACGGGGCACACTCCAGGGGGATCCACCAGCCAGCCACAGAACAGTAGGAGGGTGTAAGTACTGCGACCGCTCCTTCAGCATCTCTTCGAACCTCCAGCGGCACGTCCGGAACATCCACAACAAGGAGAAGCCTTTCAAGTGCCACCTGTGCAACCGCTGCTTCGGGCAGCAGACCAACCTGGACCGGCACCTCAAGAAGCACGAGCACGAGAACGCACCAGTGAGCCAGCACCCCGGGGTCCTCACGAACCACCTGGGGACCAGCGCGTCCTCTCCCACCTCAGAGTCGGACAACCACGCACTTTTAGACGAGAAAGAAGACTCTTATTTCTCGGAAATCAGAAACTTTATTGCCAATAGTGAGATGAACCAAGCATCAACGCGAACAGAGAAACGGGCGGACATGCAGATCGTGGACGGCAGTGCCCAGTGTCCAGGCCTAGCCAGTGAGAAGCAGGAGGACGTGGAGGAGGAGGACGACGATGACCTGGAGGAGGACGATGAGGACAGCCTGGCCGGGAAGTCGCAGGATGACACCGTGTCCCCCGCACCCGAGCCCCAGGCCGCCTACGAGGATGAGGAGGATGAGGAGCCAGCCGCCTCCCTGGCCGTGGGCTTTGACCACACCCGAAGGCATATGCAATGATGCTGTCCCTTTCCGAAGACACTCCTCTCCACACCCCCTCCCAGGGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCTCCCCACCCACCATGGTTCATTCCGACTTTTCCAATGGAAACTCAGATCCCAAAAGTCCCTAAAGCAGTCGTAGAGTCTCACCATCTCCAAGGATTGGTCTTGAGAACACTGTTCAGTGACGGCCATGCAGGTGGCCGTCCAAAGACAGCCAACGGAGCTGCCTCGCAGAA +>ENST00000606170 +TACAGGCGCCCACCACCACGACTGGCTGATTTTTTTGTATTTTTAGTAGAGACGGGGTTTCACCATGTCAGCCAGGATGGTCTCGATCTCCTGACCTCGTGATCCACCCGCCTTGGCCTCCCAAAGTGCTGTGATTATAGGCGTGAACCCCTGCTTCTTGAAGCCGGGGCTGTTTCTAGGGACAGCTTCCCCAGGATGCCTTTGGCTCTGCAGCTGGGAGATCCAGCAACCTCCGGGACACGGCGGGGCAAAGCTGTGCACGGGGCACGGGGCAGGGGCGCGGGCTCCCTTCCCCCCACCCTCTGTGGCCCGGCCTGCCATGCAGAGCCGGGGCCTGCACTGAGGAGCGCGTGTGCCCCTTCCAGGTGTAAGTACTGCGACCGCTCCTTCAGCATCTCTTCGAACCTCCAGCGGCACGTCCGGAACATCCACAACAAGGAGAAGCCTTTCAAGTGCCACCTGTGCAACCGCTGCTTCGGGCAGCAGACCAACCTGGACCGGCACCTCAAGAAGCACGAGCACGAGAACGCACCAGTGAGCCAGCACCCCGGGGTCCT diff --git a/pygtftk/data/mini_real_10M/expected_sequence_plus_exon.fa b/pygtftk/data/mini_real_10M/expected_sequence_plus_exon.fa new file mode 100644 index 00000000..35d6fde5 --- /dev/null +++ b/pygtftk/data/mini_real_10M/expected_sequence_plus_exon.fa @@ -0,0 +1,222 @@ +>ENSE00003759395 +CGGCCTCACGCGTCCGTGCAGCGGAGGCTTCCTGAGCCCCCTGGAGAGCCTGGCCTGGGCCCGGGTGTGGAGACCCTCCCGGGCTTTCAATCCGGGCAGGAGGCAGATGGCAGACTCAGCAGTCACGTAAGAGAACCGAATTAG +>ENSE00003755319 +ACGCGTCCGTGCAGCGGAGGCTTCCTGAGCCCCCTGGAGAGCCTGGCCTGGGCCCGGGTGTGGAGACCCTCCCGGGCTTTCAATCCGGGCAGGAGGCAGATGGCAGACTCAGCAGTCAC +>ENSE00003755395 +GAATCGCTTAATTCTGAAAGTCTGGTGAGAAGACACGGCGAGAATCGGGGTCCAGCACAGATGATGGCGACAGCGGAGAAGGGAAG +>ENSE00001480807 +CGCAGGCTCGGCGGCACGCCCCCTGACGTGTGTGCCTCAGGCTTATAATAGGGCCGGTGCTGCCTGCCGAAGCCGGCGGCTGAGAGGCAGCGAACTCATCTTTGCCAGTACAGGAGCTTGTGCCGTGGCCCACAGCCCACAGCCCACAGCCATG +>ENSE00001480799 +GGCTGGGACCTGACGGTGAAGATGCTGGCGGGCAACGAATTCCAGGTGTCCCTGAGCAGCTCCATGTCGGTGTCAGAGCTGAAGGCGCAGATCACCCAGAAGATCGGCGTGCACGCCTTCCAGCAGCGTCTGGCTGTCCACCCGAGCGGTGTGGCGCTGCAGGACAGGGTCCCCCTTGCCAGCCAGGGCCTGGGCCCCGGCAGCACGGTCCTGCTGGTGGTGGACAAATGCGACGAACCTCTGAGCATCCTGGTGAGGAATAACAAGGGCCGCAGCAGCACCTACGAGGTACGGCTGACGCAGACCGTGGCCCACCTGAAGCAGCAAGTGAGCGGGCTGGAGGGTGTGCAGGACGACCTGTTCTGGCTGACCTTCGAGGGGAAGCCCCTGGAGGACCAGCTCCCGCTGGGGGAGTACGGCCTCAAGCCCCTGAGCACCGTGTTCATGAATCTGCGCCTGCGGGGAGGCGGCACAGAGCCTGGCGGGCGGAGCTAAGGGCCTCCACCAGCATCCGAGCAGGATCAAGGGCCGGAAATAAAGGCTGTTGTAAAGAGAAA +>ENSE00003756535 +GGCTGGGACCTGACGGTGAAGATGCTGGCGGGCAACGAATTCCAGGTGTCCCTGAGCAGCTCCATGTCGGTGTCAGAGCTGAAGGCGCAGATCACCCAGAAGATCGGCGTGCACGCCTTCCAGCAGCGTCTGGCTGTCCACCCGAGCGGTGTGGCGCTGCAGGACAGGGTCCCCCTTGCCAGCCAGGGCCTGGGCCCCGGCAGCACGGTCCTGCTGGTGGTGGACAAATGCGACGAACCTCTGAGCATCCTGGTGAGGAATAACAAGGGCCGCAGCAGCACCTACGAGGTACGGCTGACGCAGACCGTGGCCCACCTGAAGCAGCAAGTGAGCGGGCTGGAGGGTGTGCAGGACGACCTGTTCTGGCTGACCTTCGAGGGGAAGCCCCTGGAGGACCAGCTCCCGCTGGGGGAGTACGGCCTCAAGCCCCTGAGCACCGTGTTCATGAATCT +>ENSE00001648978 +GCCCTTTGCTGCGGCAGCTTTCTGTTCTCCCTGGCTCCCTGCACGGAACTGAGCTTTG +>ENSE00001621165 +GTGTGTGATGCGCTGCTGGCCCAGGCTACACCCCGACAAGGGACACCGGGGGCCCCGGGAGCAGAGAGACCTCAGAGCAGCCTCCTCCTGCCTCCTGTGGACGGCCGGCCCCAGCTGGTGATCCCAGCCAGTCCCAGCTTTCAGTTGCTGCCCCCACCGACAGTCCTCAGTCCCTCCATGATGGCTCCCCCGACAGCCGGCCCCCTTCCTGGCCCAGCTCTTCCGCCTGAGGACCCAGGGCCGGATCCGGAGAGCAGGTGGCTTTTCTTGAGCGCCAACATTCTGCCCGTGG +>ENSE00001780479 +CACGGGCGGGCGCGGCAGGGCAGCGTGTGGGGCTGCGATCGGCATGGGCTCTGCGCGCGGGGTGCCCCTGCTCGGGCTGGGGCTCAGGGGACGCCGGGGGCCAGCACAGGGCCCGGTGTCCCTCGGGCCGTGCCGGTAACTGGGATTGGCACCCGCCGGCCATGGAAGAGCCTGGGCCCCCAGGTGGGCTCAGCCAAGACCAAG +>ENSE00003473982 +GCGGCTGCGTCAGGGATTCCTTGGTGGCCCTGGAGGGTGGATAGGCTGGCCTGGGGGCCATCAGGACAGCAGGTGACGGTCAGGCCAATGCCAGCCGGGCCTGGGCACAGCCCTGTGGGGGCTTCGGAGGGCCCTGAGGAGGAGGAGGAAGAGGCAGAGGAGAGAAGGCCCCACGGAGGTCCTGTCGCCAGCGCTGCCACTGCCTGACCTCCGCTGCCCGAAGGCCGGTGGGCCTCTGTGGCCTCCGTGAAGCAGGCCCGGCTGTCGTCAGGCCATGTCTGGTCCATGGCCCTCCCCCGACAGCCGGACCAAGGGAACGGTGGCCTGGCTGGCGGAGGTACTCCTCTGGGTTGGAGGGAGTGTGGTGCTGTCTTCAGAGTGGCAGCTCGGCCCCCTGG +>ENSE00003499259 +TGGAGCGGTGCATGGGTGCCATGCAAGAGGGGATGCAGATGGTGAAGCTGCGTGGCGGCTCCAAGGGCCTGGTCCGCTTCTACTACCTGGACGAGCACCGCTCCTGCATCCGCTGGAGGCCCTCACGCAAGAACGAGAAGGCCAAGA +>ENSE00001477669 +CACAGGGAACGGGTAGGGTCCCACGGTTTGGGGAGAGACATGGCAGTCCTCAAGGGCTGGGATCAGGGCGCAGCCAGGGTTTCTGATGGCTTTGCTGATGGTCAGGACCCAGGCATGCCAGGCAAGGCCTCAGCCCAGCAGTTGCCAAGCGTGTAGCCACTTTGGGCCCGTGGAGAGAGTCGCGCTGCGGAGCCCCCAGGGGGACCTGAGGTCACAAGAGCCTCGATGCACCTGAGCGCGGAGCTGGGGGTCCCTGGAGCCGCTGTCCCCACCTGCGGCGCTGGAGCCCTGGAGGTGTCCAGGGGCTTCCTTGGAACGTGGAGACGTGCTGGTTAAACGTGGAGCCCCGGGCCAGCCGGGCACTGGGGGCTGCAGGTGGAGGGAGGTGGATGCTCTCCCTCGTGGGGGCGTGTCTTTTCCACAGGAAAGGGAAAGGGGGAGGGACACGGGTCAGCAGTGGGGGGCTGTGCAGTCTCGCAGATCTTCACCCTTGGTTCTTGAACTCTGGACCCTGAGCCCTGCCGAGGGTCCCGCAAAGGTGGGCAAGGAGCTCCCGGCTGCTTGGTCTCCGCAGTGTTGGGGCTGCCAGCAGGGGGACGCTGGGCCCCCGGGGACCTGACCCGTGCTCCCTCCCCACCCCGCAGTCTCCATCGACTCCATCCAGGAGGTGAGTGAGGGGCGGCAGTCGGAGGTCTTCCAGCGCTACCCTGACGGCAGCTTCGACCCCAACTGCTGCTTCAGCATCTACCACGGCAGCCACCGCGAGTCGCTGGACCTGGTCTCCACCAGCAGCGAGGTGGCGCGCACCTGGGTCACTGGCCTGCGCTACCTCATGGCCGGCATCAGCGACGAGGACAGCCTGGCTCGCCGCCAGCGCACCAGGGACCAA +>ENSE00001477672 +TCTCCATCGACTCCATCCAGGAGGTGAGTGAGGGGCGGCAGTCGGAGGTCTTCCAGCGCTACCCTGACGGC +>ENSE00001400676 +TCTCCATCGACTCCATCCAGGAGGTGAGTGAGGGGCGGCAGTCGGAGGTCTTCCAGCGCTACCCTGACGGCAGCTTCGACCCCAACTGCTGCTTCAGCATCTACCACGGCAGCCACCGCGAGTCGCTGGACCTGGTCTCCACCAGCAGCGAGGTGGCGCGCACCTGGGTCACTGGCCTGCGCTACCTCATGGCCGGCATCAGCGACGAGGACAGCCTGGCTCGCCGCCAGCGCACCAGGGACCAA +>ENSE00001477687 +TCTCCATCGACTCCATCCAGGAGGTGAGTGAGGGGCGGCAGTCGGAGGTCTTCCAGCGCTACCCTGACGGCAGCTTCGACCCCAACTGCTGCTTCAGCATCTACCACGGCAGCCACCGCGAGTCGCTGGACCTGGTCTCCACCAGCAGCGAGGTGGCGCGCACCTGGGTCACTGGCCTGCGCTACCTCATGGCCGGCATCAGCGACGAGGACAGCCTGGCTCGCCGCCAGCGCACCAGGGACCA +>ENSE00001376863 +GGCGCGCACCTGGGTCACTGGCCTGCGCTACCTCATGGCCGGCATCAGCGACGAGGACAGCCTGGCTCGCCGCCAGCGCACCAGGGACCAA +>ENSE00001477685 +GTGGCTGAAGCAGACGTTTGACGAGGCCGACAAGAACGGGGATGGCAGCCTGAGCATTGGCGAGGTCCTGCAGCTGCTGCACAAGCTCAACGTGAACCTGCCCCGGCAGAGGGTGAAGCAGATGTTCAGG +>ENSE00003553212 +TGGCTGAAGCAGACGTTTGACGAGGCCGACAAGAACGGGGATGGCAGCCTGAGCATTGGCGAGGTCCTGCAGCTGCTGCACAAGCTCAACGTGAACCTGCCCCGGCAGAGGGTGAAGCAGATGTTCAGG +>ENSE00003470263 +TGGCTGAAGCAGACGTTTGACGAGGCCGACAAGAACGGGGATGGCAGCCTGAGCATTGGCGAGGTCCTGCAGCTGCTGCACAAGCTCAACGTGAACCTGCCCCGGCAGAGGGTGAAGCAGATGTTCAGG +>ENSE00003472793 +GAAGCGGACACGGATGACCACCAAGGGACGCTGGGTTTTGAAGAGTTCTGTGCCTTCTACAAGATGATGTCCACCCGCCGGGACCTCTACCTGCTCATGCTGACCTACAGCAACCACAAGGACCACCTGGATGCCGCCAGCCTGCAGCGCTTCCTGCAGGTGGAGCAGAAG +>ENSE00003647310 +GAAGCGGACACGGATGACCACCAAGGGACGCTGGGTTTTGAAGAGTTCTGTGCCTTCTACAAGATGATGTCCACCCGCCGGGACCTCTACCTGCTCATGCTGACCTACAGCAACCACAAGGACCACCTGGATGCCGCCAGCCTGCAGCGCTTCCTGCAGGTGGAGCAGAAG +>ENSE00003465003 +ATGGCGGGTGTGACCCTCGAGAGCTGCCAGGACATCATCGAGCAGTTTGAGCCATGCCCAGAAAACAAGAGTAAGGGGCTGCTGGGCATTGATG +>ENSE00003649862 +ATGGCGGGTGTGACCCTCGAGAGCTGCCAGGACATCATCGAGCAGTTTGAGCCATGCCCAGAAAACAAGAGTAAGGGGCTGCTGGGCATTGATG +>ENSE00003688902 +GCTTCACCAACTACACCAGGAGCCCTGCTGGTGACATCTTCAACCCTGAGCACCACCATGTGCACCAGGACATGACGCAGCCGCTGAGCCACTACTTCATCACCTCGTCCCACAACACCTACCTCGTGGGTGACCAGCTCATGTCCCAGTCACGGGTGGACATGTATGCTTGGGTCCTGCAGGCTGGCTGCCGCTGCGTGGAGG +>ENSE00003533538 +GCTTCACCAACTACACCAGGAGCCCTGCTGGTGACATCTTCAACCCTGAGCACCACCATGTGCACCAGGACATGACGCAGCCGCTGAGCCACTACTTCATCACCTCGTCCCACAACACCTACCTCGTGGGTGACCAGCTCATGTCCCAGTCACGGGTGGACATGTATGCTTGGGTCCTGCAGGCTGGCTGCCGCTGCGTGGAGG +>ENSE00003546186 +TGGACTGCTGGGATGGGCCCGACGGGGAGCCCATTGTGCACCATGGCTACACTCTGACTTCCAAGATCCTCTTCAAAGACGTCATTGAAACCATCAACAAATATGCCTTCATCAAGAATGA +>ENSE00003552203 +TGGACTGCTGGGATGGGCCCGACGGGGAGCCCATTGTGCACCATGGCTACACTCTGACTTCCAAGATCCTCTTCAAAGACGTCATTGAAACCATCAACAAATATGCCTTCATCAAGAATGA +>ENSE00003472855 +GTACCCAGTGATCCTGTCCATCGAAAACCACTGCAGTGTCATCCAGCAGAAGAAAATGGCCCAGTATCTGACTGACATCCTTGGGGACAAGCTGGACCTGTCATCAGTGAGCAGTGAAGATGCCACCACACTCCCCTCTCCACAGATGCTCAAGGGCAAGATCCTCGTGAAG +>ENSE00003605114 +GTACCCAGTGATCCTGTCCATCGAAAACCACTGCAGTGTCATCCAGCAGAAGAAAATGGCCCAGTATCTGACTGACATCCTTGGGGACAAGCTGGACCTGTCATCAGTGAGCAGTGAAGATGCCACCACACTCCCCTCTCCACAGATGCTCAAGGGCAAGATCCTCGTGAAG +>ENSE00003517403 +GGGAAGAAGCTCCCAGCCAACATCAGCGAGGATGCGGAGGAAGGCGAGGTGTCTGATGAGGACAGTGCTGATGAGATTGACGATGACTGCAAGCTCCTCAATGGGGAT +>ENSE00003655153 +GGGAAGAAGCTCCCAGCCAACATCAGCGAGGATGCGGAGGAAGGCGAGGTGTCTGATGAGGACAGTGCTGATGAGATTGACGATGACTGCAAGCTCCTCAATGGGGAT +>ENSE00003582994 +GCATCCACCAATCGAAAGCGTGTAGAAAACACTGCTAAGAGGAAACTGGATTCCCTCATCAAAGAGTCGAAGATTCGGGACTGTGAGGACCCCAACAACTTCTCCGTCTCCACACTGTCCCCATCTGGAAAGCTCGGACGCAAG +>ENSE00003543912 +GCATCCACCAATCGAAAGCGTGTAGAAAACACTGCTAAGAGGAAACTGGATTCCCTCATCAAAGAGTCGAAGATTCGGGACTGTGAGGACCCCAACAACTTCTCCGTCTCCACACTGTCCCCATCTGGAAAGCTCGGACGCAAG +>ENSE00003684947 +AGCAAGGCTGAAGAGGACGTGGAGTCTGGGGAGGATGCCGGGGCCAGCAGACGCAATGGCCGCCTCGTCGTGGGAAGCTTCTCCAGGCGCAAG +>ENSE00003557083 +AGCAAGGCTGAAGAGGACGTGGAGTCTGGGGAGGATGCCGGGGCCAGCAGACGCAATGGCCGCCTCGTCGTGGGAAGCTTCTCCAGGCGCAAG +>ENSE00003535221 +AAGAAGGGCAGCAAGCTGAAGAAGGCGGCCAGCGTGGAGGAGGGAGATGAGGGTCAGGACTCCCCGGGAGGCCAGAGCCGAGG +>ENSE00003534549 +AAGAAGGGCAGCAAGCTGAAGAAGGCGGCCAGCGTGGAGGAGGGAGATGAGGGTCAGGACTCCCCGGGAGGCCAGAGCCGAGG +>ENSE00003559057 +GGCGACCCGGCAGAAGAAGACCATGAAGCTGTCCCGGGCCCTCTCTGACCTGGTGAAGTACACCAAGTCCGTGGCCACCCACGACATAGAGATGGAGG +>ENSE00003650873 +GGCGACCCGGCAGAAGAAGACCATGAAGCTGTCCCGGGCCCTCTCTGACCTGGTGAAGTACACCAAGTCCGTGGCCACCCACGACATAGAGATGGAGG +>ENSE00003516954 +CGGCGTCCAGCTGGCAGGTGTCGTCCTTCAGCGAGACCAAGGCCCACCAGATTCTGCAGCAGAAGCCGGCGCAGTACCTACGCTTCAACCAGCAGCAGCTCTCCCGCATCTACCCCTCCTCCTACCGTGTGGACTCCAGCAACTACAACCCGCAGCCCTTCTGGAACGCCGGCTGCCAAATGG +>ENSE00003534507 +CGGCGTCCAGCTGGCAGGTGTCGTCCTTCAGCGAGACCAAGGCCCACCAGATTCTGCAGCAGAAGCCGGCGCAGTACCTACGCTTCAACCAGCAGCAGCTCTCCCGCATCTACCCCTCCTCCTACCGTGTGGACTCCAGCAACTACAACCCGCAGCCCTTCTGGAACGCCGGCTGCCAAATGG +>ENSE00003616922 +TTGCCCTGAACTACCAGTCAGAGGGGCGGATGCTGCAGCTGAACCGAGCCAAGTTCAGCGCCAACGGTGGCTGCGGCTACGTACTCAAGCCTGGGTGCATGTGCCAGG +>ENSE00003591218 +TTGCCCTGAACTACCAGTCAGAGGGGCGGATGCTGCAGCTGAACCGAGCCAAGTTCAGCGCCAACGGTGGCTGCGGCTACGTACTCAAGCCTGGGTGCATGTGCCAGG +>ENSE00001940753 +GTGGGGGAACCCTCCTTGCTAGCGTTGCAAAGAAGGGCCCAGCTCCGTCAGGAATCCAGGGATGGAGAACTGGGGAGCCTGGGCCCCACATGAGATTCATGGCAGGACTTGTCTGAGGGGCCCCAGTGCCAGCGACCCAGCCCCCTGTGCCTGGCCCCTCTGTGGGTCTCAGGACCTGGGTCTGGGCTGGGTGTTTGGAGGAACCTCCTCCCGGCTCTCAGACACCTCTGTTTTGTCTGCTGTGGATGACTTCCAGCTTGGTCCCCCTGTGGCCCTGGCAGGAGTATCACCATGGGAGAGGGCAGGACAGGGGCTGGGCGAGCAGGCCTCCCACTAGACCAGGCTACTCCTGCTGTGGACCAGCTACTTCCACCTCTGCCCTTGGCTTGCCCTCCTCAGAGTTCTCAGCCTGAGTGGGCCCTGGGGACACTGTCACCAGAGACCCCACCCCTCATACCCCCAGGGACCCAGACCCACCCCCAGAAGCCATGTGACCTCCTCGGCTCAGCTGTGGGAGGCATGGGCTCTGTCCCACATGCTGCGGTAGCCACAAAGGTGATCCATACTGGGCCAGGTGCACCCCGAGGTGCCCCCCTGGACCACTGCCTCCCTCCCTCCCCCTGGCACCGGCTCCAGTCTCCTATGTGGGGGCTGGGGAGGGGGCTGTTGGCAGCCATGCCCCAGCAAGCAGGGGGCTTGCTGAGGGCTGGGCCACTGACCACCTCCCCGGCATCCCCTCAGGCGTGTTCAACCCCAACTCGGAGGACCCCCTGCCCGGGCAGCTCAAGAAGCAGCTGGTGCTCCGGATCATCAGTGGCCAGCAGCTTCCCAAGCCGCGCGACTCCATGCTGGGGGACCGTGGGGAG +>ENSE00003653363 +GCGTGTTCAACCCCAACTCGGAGGACCCCCTGCCCGGGCAGCTCAAGAAGCAGCTGGTGCTCCGGATCATCAGTGGCCAGCAGCTTCCCAAGCCGCGCGACTCCATGCTGGGGGACCGTGGGGAG +>ENSE00003541907 +GCGTGTTCAACCCCAACTCGGAGGACCCCCTGCCCGGGCAGCTCAAGAAGCAGCTGGTGCTCCGGATCATCAGTGGCCAGCAGCTTCCCAAGCCGCGCGACTCCATGCTGGGGGACCGTGGGGAG +>ENSE00001923708 +GGTGGGGGCCAGCCCCACACAGGCGGGAGGGGTGGGAGTTGGGGGCGGGCCGGGCATCGCGATGGGCCCTGATGCCACCCCCACTCCTGTGTCCCAGATCATCGACCCCTTTGTGGAGGTGGAGATCATTGGGCTCCCTGTGGACTGCAGCAGGGAGCAGACCCGCGTGGTGGACGACAACG +>ENSE00003492751 +ATCATCGACCCCTTTGTGGAGGTGGAGATCATTGGGCTCCCTGTGGACTGCAGCAGGGAGCAGACCCGCGTGGTGGACGACAACG +>ENSE00003466854 +ATCATCGACCCCTTTGTGGAGGTGGAGATCATTGGGCTCCCTGTGGACTGCAGCAGGGAGCAGACCCGCGTGGTGGACGACAACG +>ENSE00003571083 +GGTTCAACCCCACCTGGGAGGAGACCCTGGTTTTCATGGTGCACATGCCGGAGATCGCGCTGGTCCGCTTCCTCGTCTGGGACCACGATCCCATCGGGCGTGACTTCATTGGCCAGAGGACGCTGGCCTTCAGCAGCATGATGCCAG +>ENSE00003685158 +GGTTCAACCCCACCTGGGAGGAGACCCTGGTTTTCATGGTGCACATGCCGGAGATCGCGCTGGTCCGCTTCCTCGTCTGGGACCACGATCCCATCGGGCGTGACTTCATTGGCCAGAGGACGCTGGCCTTCAGCAGCATGATGCCAG +>ENSE00003658295 +GCTACAGACACGTGTACCTAGAAGGGATGGAAGAGGCCTCCATCTTCGTGCATGTGGCTGTCAGTGACATCAGCGGTAAG +>ENSE00001826643 +GCTACAGACACGTGTACCTAGAAGGGATGGAAGAGGCCTCCATCTTCGTGCATGTGGCTGTCAGTGACATCAGCGGTAAGGTGAGTGTCACCCCCTGCCACCAGCCATCATGGGGAGGGGCCACACCAGCCCCTTGTCCCATGCCCCCCCATGTGTCCCCAGTGCTGGGTCCTGAACTCAGGCAGTGAGGCCTAGGGTCCCCTCCCCGGGCCTCTGCTCCTCTATCTCAAGAGGGGCTGCTGTGGGGGCCTGGCTCCTGAGCCACCAGTGCCCACCTCTGATCTCAGGGCTGGCTTTGGGCATCTCGGGCAGGACAGGTCCTGAGTGCTCCGGGCCTTGCCCCGCCCTGTGTCACCCATGCCTGTCTCAGACTCTTGGGGGCCTTGCAGCCTCCACCCCTACAGTGCTGCCATCTGGCTTCTCAGCAGGGACCGAGTGATGCCCCTCTCCCCTCTACTACCCCCCACCCCTCTACTTCCTGGTGTCACGTGGAAGGCAGCTGCCCGGGTTTGCCTGTGACTCCACACCCAGCATGTCTGTCCCCTGCCCCAGGTCAGGGTGGGGCCTCGGCTTCCGCAGGAAGTGGTCTTGGTGCCAGCCCTGCTGCCCTGGCTTTGAGCTGGGGCCCAGTGCCCTCTGGGTCCTGCTGGCTGCAGCTGGCCCTCGGGGAACCCGCACACACAGCAGGAGGGGCCTGCCCAGGCCCAGTGCTGACTCTCTCCTGCCATGCTCTCGGGCCCAGAGGTGCCATCCAGCCCCTGCCGTCTATCCACCCATCTGTTCCTCGTCCCCCAGGCTGCAGGGCTCCCCACGCCACTGCTGTGGCCGCCTCACCTGCTCCCCCTGTCTCTTTGGTCTTGCAGTCGGCTTCTCTATGGCCACAGCCTACTTTTAGAAGTGCAGCTCTGTTAGGAGCCTTGAAGGTACCCGGTGCGCGGGACAGTGCGGCCCGCCGCCCCTGCATGCCCAGGCCGCACCCCATTAGCATCCATGATTCCTGGTAGCATTTGGAGACTGTCGCTCATGTGACGTGGATCATGACATGGCTCCGGGGGCCCTGGCCATCCCCAGCCATAGTGGCATTTACGAGGCAGATCCAGGGTTCAGCTGGGTGGCCGCCTTCTCACTGGCCTCTCCTCCCCTCCCCTCCCTCAGTCCTCCCTCCCCTCCCTCAGTCCTCCCTCCCCTCCCTCAGTCCTCCCTCCCCTCCCTCAGTCCTCCCTCCCCTCCCTCAGCCCCTTCCCTGGCGGGCAGCCCGCTGGAGCCCCCACTGTGCCCCTCCTATCCCCCTCCTTCTCTCTCCTGCCCCCATCTCGGACCCTCAGGCTGTTGGTTCTGAGTTCGCCTCCCACTCCCTCCCTGTCCTTGCCAACCATGCCAGTGCATGGGATGAGGGCACCCCTGAGGCCGGCGCTCCGAGCCAGAATCCCGGATCTGCTTCTAAATGGCTTCCCAGCCACTGTGACCAAATGCGTAGATTTGGGATCTTGAATCAGGAAGCTGATTCAAGTGCTGGCCATCTGAACGCATCTGCCCAGAGGCGCCCCTGCAGGGGGGTGACCCACCTGCCGGGCCTGGGCCGCTCTGTGCACGAGCACGGCTCGTCATGGGGGCGCGGTGGGTGCTGTCTCGGGGGCATCTGGCATGTGAGGGCCCCTCTGGCCTCTGCGCCCTGGAGATGCGGCTGCCTCCCTCTCAGCAGCTGTTCTGCCCAGGCAGGGACCTCCTGGGCCCAGCTGTCCAGGAAGATTGGCTGTGGCCAGGTGCTGGTGGGCTGGGAGTCTGAGCCCATCTTGGCAGGGCTCAGGGGGCAGCAAGCCAGCTGCGGGCCTTGGGGGCTCACATGAGTGGAGGGCAGGGCAAGACCAGAAAAGGCTGCCTGGGGGAATTCAGGAAGGCTTCCTGGAAGAGGTGGTACTTCCTAGGGCACGAGTATCACCATGGGAGTGGGCAGGACACGGGCCGGGCAAGTGGGCCTCCCGCTGCACCTGGCTACTCCTGCTGTGGACCAGCTACTCCTGCCTGAGGGTGGGGCACACACAACCAGGGAGTGCCACGCCAGTGTCCCCTGCTAGCGCCGGGGGCTGCGGGCCTCTGAGCAGGTGCAGGCTGTGGTGGGCCAGGCTGGGGCTCGAGGTCTCTCCTCCGGAGGGAAAGACCTTCTCTCCATGCCCCTCAAGGGCCCCACATGCCCTGGACAGGTCAGGCGAGGGCAGTTTCTGCCGGAAGGGTGGGGTGGGCCATGTGTACTTAGATCTGTAGCAGCTACTGTCCCAGGCAGAGCTGCCCTAGGGACCCTGCTCCTGAAGGCCCTGGTGTGTCCACACACCCCCAGCCTGAGGTGGCCCAGCCCCTCGGACCGAGACACGCATGGCACGTCTGTGGCACGGTCTGGAGAGCTGGCCCTGGGGGAGCAGCTGCAGCTGGGCTGGGACCCCTGGCAACAGCTACATGGGCTCCTTCTCTTGCAGGTCAAGCAGGCTCTGGGCCTAAAAGGCCTCTTCCTCCGAGGCCCAAAGCCCGGCTCGCTGGACAGTCATGCTGCTGGGCGGCCCCCGGCCCGGCCCTCCGTTAGCCAGCGGATCCTGCGGCGCACGGCCAGCGCCCCGACCAAGAGCCAGAAGCCGGGCCGCAGGGGCTTCCCGGAGCTGGTCCTGGGTACACGGGACACAGGCTCCAAGGGGGTGGCAGACGATGTGGTGCCCCCCGGGCCCGGACCTGCTCCGGAAGCCCCAGCCCAGGAGGGGCCCGGCAGCGGCAGCCCCCGAGGTAAGGCGCCAGCTGCGGTGGCAGAGAAGAGCCCTGTGCGAGTGCGGCCCCCGCGTGTCCTGGACGGCCCCGGGCCTGCTGGGATGGCCGCCACATGCATGAAGTGTGTGGTGGGATCCTGCGCCGGCGTGAACACCGGGGGCCTGCAGAGGGAGCGGCCACCCAGCCCGGGGCCTGCAAGCAGGCAGGCAGCCATTCGCCAGCAGCCCCGGGCCCGGGCTGACTCACTGGGGGCCCCCTGCTGTGGCCTGGACCCTCACGCTATCCCGGGGAGAAGCAGAGAGGCCCCCAAGGGTCCTGGGGCCTGGAGGCAGGGTCCAGGCGGTAGCGGCTCCATGTCCTCGGACTCCAGCAGCCCAGACAGCCCGGGCATCCCCGAAAGGTCCCCCCGCTGGCCTGAGGGTGCCTGCAGGCAACCGGGGGCCCTGCAGGGAGAGATGAGTGCCTTGTTTGCTCAAAAGCTGGAGGAGATCAGGAGTAAATCCCCCATGTTCTCCGCCGGTAAGCCCCTCTTGCCCTGCGTGGTCCTCCCGCACGCCCCTGGCATGGCTGGGCCTGGGTCACCTGCTGCTGCTTCTGCGTGGACGGTGTCGCCTCGTGTGCTCGTGCTCGTGGCTCTGTATCCGTGGCACTGTCTCCGTGGCACTCTGCTCCCTTGGCTTGCCTGTGGCCCATAGCCCCAGCCCTCCTGTCTGAGCTTGAGGCCCTGGGACTTGGGTGGAGCTGGTTTGAGGCCCGACAGGCTGGGAAGAACCAGCTGCTCTTGCTGAGGGTCTGGGGCCGGGACTGTGGCCTGACATGCTGGGCCCCTCCGGCTGGGCGCTTCCCCAAACTCACCTCCTGGGCGGCTGGCGACCTGCATGGCCCCTGATGCCTTTCCTGGGACTGGGGGCCACGTACCATCCCATTCCCACCTCCCTCTAGGGCAGGCTCCAGGGGTCCCTACTGGGAAGTCTGATGTGGGCAGGTAGTGCAGCTGCTGGGCGTCTCCTGCGCCCCTGGGACGCCTGGAGCCTGCTGAGTGCTGCGTGGAGTAGATTCCCTGGGCCCCAGGGCTTCGCTGCTTTGGGCTGAAGCACCCCACTAGAAGGGTGTCTCCTTAGCCTGGAGGGAGGGACATACACGGAGCCCGCCCCACACCACCCTGCCCCTCCAGACCCCCCTGACCAAGCTTTCCTTTCTGCCCCCACCCACGCTGCCTCCGTAGTTAGGAACTGAGAGCGGCGAGTGACAGGTAACGGGGCCCAGCCCCGGTGTCCCGTGCTGTCCCAGCCCAAGGAGGGCCCCGTGTGCGGCACAGGGCGTGGACTGGGCCCCAGCAGCAGCAGGGTGGGGACACCGAGTGTGCCGCGCCCGGGGGATGCCTCGGGGTGGGAGCTGGGCCTGGCGACCCTCGGCACAGGGCACCGGGGACACCACCCTGATCCGACTCCTCTCCGCCTCTCTCCCTGCCTCCCTCTCTCTCTTCTGCTTCTCCCTCTGGCTCTCTCTCACTCCCCCACCTCCCCACAGACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGCTCAGGAAACAGGGCAGCCAGGCCCCCAAAACTGTGTCCCCCTGGCTGCCCTGTGTCCCCTCCACCCCTGCCTCCCTCCTGCCCCTGCTCCCGGGGAGGAAAGGCTAAAGCTGCTGGCCCGGGGCCCACAGGAGGGGCTTCGAGGCTGGCCCTGCCAGGCAGTTTTCCCGGCGTTTTAGGATCTGTACATAGAGAAATATTTAAATTTTTAGAAGCAAAACTTATACAACATTAAAATGATACCAAGTCCCTT +>ENSE00003609797 +GCTACAGACACGTGTACCTAGAAGGGATGGAAGAGGCCTCCATCTTCGTGCATGTGGCTGTCAGTGACATCAGCGGTAAG +>ENSE00003596489 +GTCAAGCAGGCTCTGGGCCTAAAAGGCCTCTTCCTCCGAGGCCCAAAGCCCGGCTCGCTGGACAGTCATGCTGCTGGGCGGCCCCCGGCCCGGCCCTCCGTTAGCCAGCGGATCCTGCGGCGCACGGCCAGCGCCCCGACCAAGAGCCAGAAGCCGGGCCGCAGGGGCTTCCCGGAGCTGGTCCTGGGTACACGGGACACAGGCTCCAAGGGGGTGGCAGACGATGTGGTGCCCCCCGGGCCCGGACCTGCTCCGGAAGCCCCAGCCCAGGAGGGGCCCGGCAGCGGCAGCCCCCGAG +>ENSE00001432737 +GTCAAGCAGGCTCTGGGCCTAAAAGGCCTCTTCCTCCGAGGCCCAAAGCCCGGCTCGCTGGACAGTCATGCTGCTGGGCGGCCCCCGGCCCGGCCCTCCGTTAGCCAGCGGATCCTGCGGCGCACGGCCAGCGCCCCGACCAAGAGCCAGAAGCCGGGCCGCAGGGGCTTCCCGGAGCTGGTCCTGGGTACACGGGACACAGGCTCCAAGGGGGTGGCAGACGATGTGGTGCCCCCCGGGCCCGGACCTGCTCCGGAAGCCCCAGCCCAGGAGGGGCCCGGCAGCGGCAGCCCCCGAGGTAAGGCGCCAGCTGCGGTGGCAGAGAAGAGCCCTGTGCGAGTGCGGCCCCCGCGTGTCCTGGACGGCCCCGGGCCTGCTGGGATGGCCGCCACATGCATGAAGTGTGTGGTGGGATCCTGCGCCGGCGTGAACACCGGGGGCCTGCAGAGGGAGCGGCCACCCAGCCCGGGGCCTGCAAGCAGGCAGGCAGCCATTCGCCAGCAGCCCCGGGCCCGGGCTGACTCACTGGGGGCCCCCTGCTGTGGCCTGGACCCTCACGCTATCCCGGGGAGAAGCAGAGAGGCCCCCAAGGGTCCTGGGGCCTGGAGGCAGGGTCCAGGCGGTAGCGGCTCCATGTCCTCGGACTCCAGCAGCCCAGACAGCCCGGGCATCCCCGAAAGGTCCCCCCGCTGGCCTGAGGGTGCCTGCAGGCAACCGGGGGCCCTGCAGGGAGAGATGAGTGCCTTGTTTGCTCAAAAGCTGGAGGAGATCAGGAGTAAATCCCCCATGTTCTCCGCCGGTAAGCCCCTCTTGCCCTGCGTGGTCCTCCCGCACGCCCCTGGCATGGCTGGGCCTGGGTCACCTGCTGCTGCTTCTGCGTGGACGGTGTCGCCTCGTGTGCTCGTGCTCGTGGCTCTGTATCCGTGGCACTGTCTCCGTGGCACTCTGCTCCCTTGGCTTGCCTGTGGCCCATAGCCCCAGCCCTCCTGTCTGAGCTTGAGGCCCTGGGACTTGGGTGGAGCTGGTTTGAGGCCCGACAGGCTGGGAAGAACCAGCTGCTCTTGCTGAGGGTCTGGGGCCGGGACTGTGGCCTGACATGCTGGGCCCCTCCGGCTGGGCGCTTCCCCAAACTCACCTCCTGGGCGGCTGGCGACCTGCATGGCCCCTGATGCCTTTCCTGGGACTGGGGGCCACGTACCATCCCATTCCCACCTCCCTCTAGGGCAGGCTCCAGGGGTCCCTACTGGGAAGTCTGATGTGGGCAGGTAGTGCAGCTGCTGGGCGTCTCCTGCGCCCCTGGGACGCCTGGAGCCTGCTGAGTGCTGCGTGGAGTAGATTCCCTGGGCCCCAGGGCTTCGCTGCTTTGGGCTGAAGCACCCCACTAGAAGGGTGTCTCCTTAGCCTGGAGGGAGGGACATACACGGAGCCCGCCCCACACCACCCTGCCCCTCCAGACCCCCCTGACCAAGCTTTCCTTTCTGCCCCCACCCACGCTGCCTCCGTAGTTAGGAACTGAGAGCGGCGAGTGACAGGTAACGGGGCCCAGCCCCGGTGTCCCGTGCTGTCCCAGCCCAAGGAGGGCCCCGTGTGCGGCACAGGGCGTGGACTGGGCCCCAGCAGCAGCAGGGTGGGGACACCGAGTGTGCCGCGCCCGGGGGATGCCTCGGGGTGGGAGCTGGGCCTGGCGACCCTCGGCACAGGGCACCGGGGACACCACCCTGATCCGACTCCTCTCCGCCTCTCTCCCTGCCTCCCTCTCTCTCTTCTGCTTCTCCCTCTGGCTCTCTCTCACTCCCCCACCTCCCCACAGACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGCTCAGGAAACAGGGCAGCCAGGCCCCCAAAACTGTGTCCCCCTGGCTGCCCTGTGTCCCCTCCACCCCTGCCTCCCTCCTGCCCCTGCTCCCGGGGAGGAAAGGCTAAAGCTGCTGGCCCGGGGCCCACAGGAGGGGCTTCGAGGCTGGCCCTGCCAGGCAGTTTTCCCGGCGTTTTAGGATCTGTACATAGAGAAATATTTAAATTTTTAGAAGCAAAACTTATACAACATTAAAATGATACCAAGTCCCTTTC +>ENSE00001697293 +GTCAAGCAGGCTCTGGGCCTAAAAGGCCTCTTCCTCCGAGGCCCAAAGCCCGGCTCGCTGGACAGTCATGCTGCTGGGCGGCCCCCGGCCCGGCCCTCCGTTAGCCAGCGGATCCTGCGGCGCACGGCCAGCGCCCCGACCAAGAGCCAGAAGCCGGGCCGCAGGGGCTTCCCGGAGCTGGTCCTGGGTACACGGGACACAGGCTCCAAGGGGGTGGCAGACGATGTGGTGCCCCCCGGGCCCGGACCTGCTCCGGAAGCCCCAGCCCAGGAGGGGCCCGGCAGCGGCAGCCCCCGAGGTAAGGCGCCAGCTGCGGTGGCAGAGAAGAGCCCTGTGCGAGTGCGGCCCCCGCGTGTCCTGGACGGCCCCGGGCCTGCTGGGATGGCCGCCACATGCATGAAGTGTGTGGTGGGATCCTGCGCCGGCGTGAACACCGGGGGCCTGCAGAGGGAGCGGCCACCCAGCCCGGGGCCTGCAAGCAGGCAGGCAGCCATTCGCCAGCAGCCCCGGGCCCGGGCTGACTCACTGGGGGCCCCCTGCTGTGGCCTGGACCCTCACGCTATCCCGGGGAGAAGCAGAGAGGCCCCCAAGGGTCCTGGGGCCTGGAGGCAGGGTCCAGGCGGTAGCGGCTCCATGTCCTCGGACTCCAGCAGCCCAGACAGCCCGGGCATCCCCGAAAGGTCCCCCCGCTGGCCTGAGGGTGCCTGCAGGCAACCGGGGGCCCTGCAGGGAGAGATGAGTGCCTTGTTTGCTCAAAAGCTGGAGGAGATCAGGAGTAAATCCCCCATGTTCTCCGCCG +>ENSE00003540997 +GTCAAGCAGGCTCTGGGCCTAAAAGGCCTCTTCCTCCGAGGCCCAAAGCCCGGCTCGCTGGACAGTCATGCTGCTGGGCGGCCCCCGGCCCGGCCCTCCGTTAGCCAGCGGATCCTGCGGCGCACGGCCAGCGCCCCGACCAAGAGCCAGAAGCCGGGCCGCAGGGGCTTCCCGGAGCTGGTCCTGGGTACACGGGACACAGGCTCCAAGGGGGTGGCAGACGATGTGGTGCCCCCCGGGCCCGGACCTGCTCCGGAAGCCCCAGCCCAGGAGGGGCCCGGCAGCGGCAGCCCCCGAG +>ENSE00001701479 +TTAGGAACTGAGAGCGGCGAGTGACAGGTAACGGGGCCCAGCCCCGGTGTCCCGTGCTGTCCCAGCCCAAGGAGGGCCCCGTGTGCGGCACAGGGCGTGGACTGGGCCCCAGCAGCAGCAGGGTGGGGACACCGAGTGTGCCGCGCCCGGGGGATGCCTCGGGGTGGGAGCTGGGCCTGGCGACCCTCGGCACAGGGCACCGGGGACACCACCCTGATCCGACTCCTCTCCGCCTCTCTCCCTGCCTCCCTCTCTCTCTTCTGCTTCTCCCTCTGGCTCTCTCTCACTCCCCCACCTCCCCACAGACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGCTCAGGAAACAGGGCAGCCAGGCCCCCAAAACTGTGTCCCCCTGGCTGCCCTGTGTCCCCTCCACCCCTGCCTCCCTCCTGCCCCTGCTCCCGGGGAGGAAAGGCTAAAGCTGCTGGCCCGGGGCCCACAGGAGGGGCTTCGAGGCTGGCCCTGCCAGGCAGTTTTCCCGGCGTTTTAGGATCTGTACATAGAGAAATATTTAAATTTTTAGAAGCAAAACTTATACAACATTAAAATGATACCAAGTCCC +>ENSE00001834994 +TTAGGAACTGAGAGCGGCGAGTGACAG +>ENSE00001887073 +ACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGCTCAGGAAACAGGGCAGCCAGGCCCCCAAAACTGTGTCCCCCTGGCTGCCCTGTGTCCCCTCCACCCCTGCCTCCCTCCTGCCCCTGCTCCCGGGGAGGAAAGGCTAAAGCTGCTGGCCCGGGGCCCACAGGAGGGGCTTCGAGGCTGGCCCTGCCAGGCAGTTTTCCCGGCGTTTTAGGATCTGTACATAGAGAAATATTTAAATTTTTAGAAGCAAAACTTATACAACATTAAAATGATACCAAGTCCCTT +>ENSE00001783927 +ACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGC +>ENSE00001420069 +ACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGCTCAGGAAACAGGGCAGCCAGGCCCCCAAAACTGTGTCCCCCTGGCTGCCCTGTGTCCCCTCCACCCCTGCCTCCCTCCTGCCCCTGCTCCCGGGGAGGAAAGGCTAAAGCTGCTGGCCCGGGGCCCACAGGAGGGGCTTCGAGGCTGGCCCTGCCAGGCAGTTTTCCCGGCGTTTTAGGATCTGTACATAGAGAAATATTTAAATTTTTAGAAGCAAAACTTATACAACATTAAAATGATACCAAGTCC +>ENSE00002048533 +GGTGTCCAAACTGACAATGCTGGGGAGATGAAGATAGTGTGTGGCTGCTTCTGGACTCAAGGAGGAGGAGAGAGATTCCGCGAGCCGACACCATGCGATCCAAGGCGAGGGCGAGGAAGCTAGCCAAAA +>ENSE00003700259 +AATGCTGGGGAGATGAAGATAGTGTGTGGCTGCTTCTGGACTCAAGGAGGAGGAGAGAGATTCCGCGAGCCGACACCATGCGATCCAAGGCGAGGGCGAGGAAGCTAGCCAAAA +>ENSE00001222906 +GAAGATAGTGTGTGGCTGCTTCTGGACTCAAGGAGGAGGAGAGAGATTCCGCGAGCCGACACCATGCGATCCAAGGCGAGGGCGAGGAAGCTAGCCAAAA +>ENSE00001598723 +GCTGCTTCTGGACTCAAGGAGGAGGAGAGAGATTCCGCGAGCCGACACCATGCGATCCAAGGCGAGGGCGAGGAAGCTAGCCAAAA +>ENSE00003695128 +GTGACGGTGACGTTGTAAATAATATGTATGAGCCCAACCGGGACCTGCTGGCCAGCCACAGCGCGGAGGACGAGGCCGAGGACAGTGCCATGTCGCCCATCCCCGTGGGGCCACCGTCCCCCTTCCCCACCAGCGAGGACTTCACCCCCAAGGAGGGCTCGCCGTACGAGGCCCCTGTCTACATTCCTGAAGACATTCCGATCCCAGCAGACTTCGAGCTCCGAGAGTCCTCCATCCCAGGGGCTGGCCTGGGGGTCTGGGCCAAGAGGAAGATGGAAGCCGGGGAGAGGCTGGGCCCCTGCGTGGTGGTGCCCCGGGCGGCGGCAAAGGAGACAGACTTCGGATGGGAGGTGAGCGATCGCGCCTGAGTATGATTGATCACGGCCATTTATCTTGTGTTCAATCTATTTATAAAGCCGGGCTGAGCAGCCACTGCCCGAGGCGGGAGGCGCGGCCAGAGAGAGCGT +>ENSE00001754112 +GTGACGGTGACGTTGTAAATAATATGTATGAGCCCAACCGGGACCTGCTGGCCAGCCACAGCGCGGAGGACGAGGCCGAGGACAGTGCCATGTCGCCCATCCCCGTGGGGCCACCGTCCCCCTTCCCCACCAGCGAGGACTTCACCCCCAAGGAGGGCTCGCCGTACGAGGCCCCTGTCTACATTCCTGAAGACATTCCGATCCCAGCAGACTTCGAGCTCCGAGAGTCCTCCATCCCAGGGGCTGGCCTGGGGGTCTGGGCCAAGAGGAAGATGGAAGCCGGGGAGAGGCTGGGCCCCTGCGTGGTGGTGCCCCGGGCGGCGGCAAAGGAGACAGACTTCGGATGGGAG +>ENSE00002087812 +AAGCACAAGGCCCCATCTCACCAGGTCAGCGGAGATGCTGCCTGCCTGGAGCTCGGGTCCCATGGGGTTGGGGGCGAAGATGCTGCATCCCAGTGCTGTTCCCTGCTCGGGGCCCTGGAAGCAGAGCGGCCTGGCTTCTCTCATTGGCCAAAGAGGGTTTGGAAG +>ENSE00003480863 +CAAATACTGACGGACGTGGAAGTGTCGCCCCAGGAAGGCTGCATCACAAAG +>ENSE00003516886 +CAAATACTGACGGACGTGGAAGTGTCGCCCCAGGAAGGCTGCATCACAAAG +>ENSE00001882136 +ACAAAG +>ENSE00002034212 +CAGATCTCCGAAGACCTGGGCAGTGAGAAGTTCTGCGTGGATGCAAATCAGGCGGGGGCTGGCAGCTGGCTCAAGTACATCCGTGTGGCGTGCTCCTGCGATGACCAGAACCTCACCATGTGTCAGATCAGTGAGCAG +>ENSE00003695725 +ATCTCCGAAGACCTGGGCAGTGAGAAGTTCTGCGTGGATGCAAATCAGGCGGGGGCTGGCAGCTGGCTCAAGTACATCCGTGTGGCGTGCTCCTGCGATGACCAGAACCTCACCATGTGTCAGATCAGTGAGCAG +>ENSE00003662380 +ATCTCCGAAGACCTGGGCAGTGAGAAGTTCTGCGTGGATGCAAATCAGGCGGGGGCTGGCAGCTGGCTCAAGTACATCCGTGTGGCGTGCTCCTGCGATGACCAGAACCTCACCATGTGTCAGATCAGTGAGCAG +>ENSE00001846205 +ATGAAAGTGAAATTGGAGTGAAGGAAAATTGGGCTTGAGGCGCATAGAAGGACGGTCTTTCCGTCCCCTTCTGGGGCTCAGATTTGCAGAGTGTGTCCTTAGTCGTCCGTTGGGAAGCTGACGGGCAGGGGCACCGCGGGGCTGGGCCAGGGCTGTGCTTTTGTGAGATGCAAACTATAGTAATGAAGGGCCCAGATTTTTTTTATTTAAGAAATAAATGTTTATTAGAACTTTTGAACTAAA +>ENSE00003697266 +ATTTACTATAAAGTCATTAAGGACATTGAGCCAGGTGAGGAGCTGCTGGTGCACGTGAAGGAAGGCGTCTACCCCCTGGGCACAGTGCCGCCCGGCCTGGACG +>ENSE00003700221 +ATTTACTATAAAGTCATTAAGGACATTGAGCCAGGTGAGGAGCTGCTGGTGCACGTGAAGGAAGGCGTCTACCCCCTGGGCACAGTGCCGCCCGGCCTGGACG +>ENSE00003696962 +AGGAGCCCACGTTCCGCTGTGACGAGTGTGACGAACTCTTCCAGTCCAAGCTGGACCTGCGGCGCCATAAGAAGTACACGTGTGGCTCAGTGGGGGCTGCGCTCTACGAGGGCCTGGCTGAGGAGCTCAAGCCCGAGGGCCTTGGCGGTGGCAGCGGCCAAGCCCACGAGTGCAAGGACTGCGAGCGGATGTTCCCCAACAAGTACAG +>ENSE00003701239 +AGGAGCCCACGTTCCGCTGTGACGAGTGTGACGAACTCTTCCAGTCCAAGCTGGACCTGCGGCGCCATAAGAAGTACACGTGTGGCTCAGTGGGGGCTGCGCTCTACGAGGGCCTGGCTGAGGAGCTCAAGCCCGAGGGCCTTGGCGGTGGCAGCGGCCAAGCCCACGAGTGCAAGGACTGCGAGCGGATGTTCCCCAACAAGTACAG +>ENSE00003700688 +CCTGGAGCAGCACATGGTCATCCACACGGAGGAGCGCGAGTACAAATGCGACCAGTGTCCCAAGGCCTTCAACTGGAAGTCCAACCTCATCCGCCACCAGATGTCCCACGACAGCGGCAAACGCTTCGAATGTGAAAACTGCGTGAAG +>ENSE00003700436 +CCTGGAGCAGCACATGGTCATCCACACGGAGGAGCGCGAGTACAAATGCGACCAGTGTCCCAAGGCCTTCAACTGGAAGTCCAACCTCATCCGCCACCAGATGTCCCACGACAGCGGCAAACGCTTCGAATGTGAAAACTGCGTGAAG +>ENSE00003700645 +GTGTTCACGGACCCCAGCAACCTTCAGCGGCACATCCGCTCGCAGCACGTGGGCGCTCGGGCCCACGCCTGCCCCGACTGCGGGAAGACCTTCGCCACGTCCTCCGGCCTCAAGCAGCACAAGCATATCCACAGCACGGTGAAGCCTTTCATAT +>ENSE00003695760 +GTGTTCACGGACCCCAGCAACCTTCAGCGGCACATCCGCTCGCAGCACGTGGGCGCTCGGGCCCACGCCTGCCCCGACTGCGGGAAGACCTTCGCCACGTCCTCCGGCCTCAAGCAGCACAAGCATATCCACAGCACGGTGAAGCCTTTCATAT +>ENSE00003695658 +GTGAGGTCTGCCACAAGTCCTACACGCAGTTCTCCAACCTGTGCCGGCACAAGCGGATGCACGCCGACTGCCGCACGCAGATCAAGTGCAAGGACTGTGGCCAGATGTTCAGCACTACCTCCTCCCTCAACAAGCACCGGCGCTTCTGCGAGGGCAAGAACCATTACACGCCGGGCGGCATCTTTGCCCCGGGCCTGCCCTTGACCCCCAGCCCCATGATGGACAAGGCAAAACCCTCCCCCAGCCTCAATCACGCCAGCCTGGGCTTCAACGAGTACTTTCCCTCCAGGCCGCACCCGGGGAGCCTGCCCTTCTCCACGGCGCCTCCCACGTTCCCCGCACTCACCCCCGGCTTCCCGGGCATCTTCCCTCCATCCTTGTACCCCCGGCCGCCTCTGCTACCTCCCACATCGCTGCTCAAGAGCCCCCTGAACCACACCCAGGACGCCAAGCTCCCCAGTCCCCTGGGGAACCCAGCCCTGCCCCTGGTCTCCGCCGTCAGCAACAGCAGCCAGGGCACGACGGCAGCTGCGGGGCCCGAGGAGAAGTTCGAGAGCCGCCTGGAGGACTCCTGTGTGGAGAAGCTGAAGACCAGGAGCAGCGACATGTCGGACGGCAGTGACTTTGAGGACGTCAACACCACCACGGGGACCGACCTGGACACGACCACGGGGACGGGCTCGGACCTGGACAGCGACGTGGACAGCGACCCTGACAAGGACAAGGGCAAGGGCAAGTCCGCCGAGGGCCAGCCCAAGTTTGGGGGCGGCTTGGCGCCCCCGGGGGCCCCGAACAGCGTGGCCGAGGTGCCTGTCTTCTATTCCCAGCACTCATTCTTCCCGCCACCCGACGAGCAGCTGCTGACTGCAACGGGCGCCGCCGGGGACTCCATCAAGGCCATCGCATCCATTGCCGAGAAGTACTTTGGCCCCGGCTTCATGGGGATGCAGGAGAAGAAGCTGGGCTCGCTCCCCTACCACTCGGCGTTCCCCTTCCAGTTCCTGCCCAACTTCCCCCACTCCCTTTACCCCTTCACGGACCGAGCCCTCGCCCACAACTTGCTGGTCAAGGCCGAGCCAAAGTCACCCCGGGACGCCCTCAAGGTGGGCGGCCCCAGTGCCGAGTGCCCCTTTGATCTCACCACCAAGCCCAAAGACGTGAAGCCCATCCTGCCCATGCCCAAGGGCCCCTCGGCCCCCGCATCCGGCGAGGAGCAGCCGCTGGACCTGAGCATCGGCAGCCGGGCCCGTGCCAGCCAAAACGGCGGCGGGCGGGAGCCCCGCAAGAACCACGTCTATGGGGAACGCAAGCTGGGCGCCGGCGAGGGGCTGCCCCAGGTGTGCCCGGCGCGGATGCCCCAGCAGCCCCCGCTCCACTACGCCAAGCCCTCGCCCTTCTTCATGGACCCCATCTACAG +>ENSE00003699089 +GTGAGGTCTGCCACAAGTCCTACACGCAGTTCTCCAACCTGTGCCGGCACAAGCGGATGCACGCCGACTGCCGCACGCAGATCAAGTGCAAGGACTGTGGCCAGATGTTCAGCACTACCTCCTCCCTCAACAAGCACCGGCGCTTCTGCGAGGGCAAGAACCATTACACGCCGGGCGGCATCTTTGCCCCGGGCCTGCCCTTGACCCCCAGCCCCATGATGGACAAGGCAAAACCCTCCCCCAGCCTCAATCACGCCAGCCTGGGCTTCAACGAGTACTTTCCCTCCAGGCCGCACCCGGGGAGCCTGCCCTTCTCCACGGCGCCTCCCACGTTCCCCGCACTCACCCCCGGCTTCCCGGGCATCTTCCCTCCATCCTTGTACCCCCGGCCGCCTCTGCTACCTCCCACATCGCTGCTCAAGAGCCCCCTGAACCACACCCAGGACGCCAAGCTCCCCAGTCCCCTGGGGAACCCAGCCCTGCCCCTGGTCTCCGCCGTCAGCAACAGCAGCCAGGGCACGACGGCAGCTGCGGGGCCCGAGGAGAAGTTCGAGAGCCGCCTGGAGGACTCCTGTGTGGAGAAGCTGAAGACCAGGAGCAGCGACATGTCGGACGGCAGTGACTTTGAGGACGTCAACACCACCACGGGGACCGACCTGGACACGACCACGGGGACGGGCTCGGACCTGGACAGCGACGTGGACAGCGACCCTGACAAGGACAAGGGCAAGGGCAAGTCCGCCGAGGGCCAGCCCAAGTTTGGGGGCGGCTTGGCGCCCCCGGGGGCCCCGAACAGCGTGGCCGAGGTGCCTGTCTTCTATTCCCAGCACTCATTCTTCCCGCCACCCGACGAGCAGCTGCTGACTGCAACGGGCGCCGCCGGGGACTCCATCAAGGCCATCGCATCCATTGCCGAGAAGTACTTTGGCCCCGGCTTCATGGGGATGCAGGAGAAGAAGCTGGGCTCGCTCCCCTACCACTCGGCGTTCCCCTTCCAGTTCCTGCCCAACTTCCCCCACTCCCTTTACCCCTTCACGGACCGAGCCCTCGCCCACAACTTGCTGGTCAAGGCCGAGCCAAAGTCACCCCGGGACGCCCTCAAGGTGGGCGGCCCCAGTGCCGAGTGCCCCTTTGATCTCACCACCAAGCCCAAAGACGTGAAGCCCATCCTGCCCATGCCCAAGGGCCCCTCGGCCCCCGCATCCGGCGAGGAGCAGCCGCTGGACCTGAGCATCGGCAGCCGGGCCCGTGCCAGCCAAAACGGCGGCGGGCGGGAGCCCCGCAAGAACCACGTCTATGGGGAACGCAAGCTGGGCGCCGGCGAGGGGCTGCCCCAGGTGTGCCCGGCGCGGATGCCCCAGCAGCCCCCGCTCCACTACGCCAAGCCCTCGCCCTTCTTCATGGACCCCATCTACAG +>ENSE00003702178 +CAGGGTAGAAAAGCGGAAGGTCACAGACCCCGTGGGAGCCCTGAAGGAGAAGTACCTGCGGCCGTCCCCGCTGCTCTTCCACCCCCAG +>ENSE00003701451 +CAGGGTAGAAAAGCGGAAGGTCACAGACCCCGTGGGAGCCCTGAAGGAGAAGTACCTGCGGCCGTCCCCGCTGCTCTTCCACCCCCAG +>ENSE00001582537 +GGTAGAAAAGCGGAAGGTCACAGACCCCGTGGGAGCCCTGAAGGAGAAGTACCTGCGGCCGTCCCCGCTGCTCTTCCACCCCCAG +>ENSE00003699052 +ATGTCAGCCATAGAGACCATGACAGAGAAGCTGGAGAGCTTTGCAGCCATGAAGGCGGACTCGGGCAGCTCCCTGCAGCCCCTCCCCCACCACCCCTTCAACTTCCGGTCCCCACCCCCAACGCTCTCCGACCCCATCCTCAGGAAGGGCAAGGAGCGATACACGTGCAG +>ENSE00003701293 +ATGTCAGCCATAGAGACCATGACAGAGAAGCTGGAGAGCTTTGCAGCCATGAAGGCGGACTCGGGCAGCTCCCTGCAGCCCCTCCCCCACCACCCCTTCAACTTCCGGTCCCCACCCCCAACGCTCTCCGACCCCATCCTCAGGAAGGGCAAGGAGCGATACACGTGCAG +>ENSE00003697785 +GTACTGTGGGAAGATCTTCCCCAGATCAGCCAATCTCACCAGACACCTGAGGACGCACACTGGGGAGCAGCCGTACAG +>ENSE00003698430 +GTACTGTGGGAAGATCTTCCCCAGATCAGCCAATCTCACCAGACACCTGAGGACGCACACTGGGGAGCAGCCGTACAG +>ENSE00001905893 +TGCCGGCCCCGCGGCCTGGGGGCCAGGGAGACCCAGACAACAGAGGGCAGGAGACGCCGGAGGGTCGGGCGCACCGCCTGCCCAGGGGACACGGGGCACACTCCAGGGGGATCCACCAGCCAGCCACAGAACAGTAGGAGG +>ENSE00003697875 +TACAGGCGCCCACCACCACGACTGGCTGATTTTTTTGTATTTTTAGTAGAGACGGGGTTTCACCATGTCAGCCAGGATGGTCTCGATCTCCTGACCTCGTGATCCACCCGCCTTGGCCTCCCAAAGTGCTGTGATTATAGGCGTGAACCCCTGCTTCTTGAAGCCGGGGCTGTTTCTAGGGACAGCTTCCCCAGGATGCCTTTGGCTCTGCAGCTGGGAGATCCAGCAACCTCCGGGACACGGCGGGGCAAAGCTGTGCACGGGGCACGGGGCAGGGGCGCGGGCTCCCTTCCCCCCACCCTCTGTGGCCCGGCCTGCCATGCAGAGCCGGGGCCTGCACTGAGGAGCGCGTGTGCCCCTTCCAGGTGTAAGTACTGCGACCGCTCCTTCAGCATCTCTTCGAACCTCCAGCGGCACGTCCGGAACATCCACAACAAGGAGAAGCCTTTCAAGTGCCACCTGTGCAACCGCTGCTTCGGGCAGCAGACCAACCTGGACCGGCACCTCAAGAAGCACGAGCACGAGAACGCACCAG +>ENSE00003699796 +GTGTAAGTACTGCGACCGCTCCTTCAGCATCTCTTCGAACCTCCAGCGGCACGTCCGGAACATCCACAACAAGGAGAAGCCTTTCAAGTGCCACCTGTGCAACCGCTGCTTCGGGCAGCAGACCAACCTGGACCGGCACCTCAAGAAGCACGAGCACGAGAACGCACCAG +>ENSE00003701636 +GTGTAAGTACTGCGACCGCTCCTTCAGCATCTCTTCGAACCTCCAGCGGCACGTCCGGAACATCCACAACAAGGAGAAGCCTTTCAAGTGCCACCTGTGCAACCGCTGCTTCGGGCAGCAGACCAACCTGGACCGGCACCTCAAGAAGCACGAGCACGAGAACGCACCAG +>ENSE00003701891 +TGAGCCAGCACCCCGGGGTCCTCACGAACCACCTGGGGACCAGCGCGTCCTCTCCCACCTCAGAGTCGGACAACCACGCACTTTTAGACGAGAAAGAAGACTCTTATTTCTCGGAAATCAGAAACTTTATTGCCAATAGTGAGATGAACCAAGCATCAACGCGAACAGAGAAACG +>ENSE00003696062 +TGAGCCAGCACCCCGGGGTCCTCACGAACCACCTGGGGACCAGCGCGTCCTCTCCCACCTCAGAGTCGGACAACCACGCACTTTTAGACGAGAAAGAAGACTCTTATTTCTCGGAAATCAGAAACTTTATTGCCAATAGTGAGATGAACCAAGCATCAACGCGAACAGAGAAACG +>ENSE00003700534 +TGAGCCAGCACCCCGGGGTCCT +>ENSE00003698226 +GGCGGACATGCAGATCGTGGACGGCAGTGCCCAGTGTCCAGGCCTAGCCAGTGAGAAGCAGGAGGACGTGGAGGAGGAGGACGACGATGACCTGGAGGAGGACGATGAGGACAGCCTGGCCGGGAAGTCGCAGGATGACACCGTGTCCCCCGCACCCGAGCCCCAGGCCGCCTACGAGGATGAGGAGGATGAGGAGCCAGCCGCCTCCCTGGCCGTGGGCTTTGACCACACCCGAAG +>ENSE00003697832 +GGCGGACATGCAGATCGTGGACGGCAGTGCCCAGTGTCCAGGCCTAGCCAGTGAGAAGCAGGAGGACGTGGAGGAGGAGGACGACGATGACCTGGAGGAGGACGATGAGGACAGCCTGGCCGGGAAGTCGCAGGATGACACCGTGTCCCCCGCACCCGAGCCCCAGGCCGCCTACGAGGATGAGGAGGATGAGGAGCCAGCCGCCTCCCTGGCCGTGGGCTTTGACCACACCCGAAG +>ENSE00003700833 +GTGTGCTGAGGACCACGAAGGCGGTCTGTTAGCTTTGGAGCCGATGCCGACTTTTGGGAAGGGGCTGGACCTCCGCAGAGCAGCTGAGGAAGCATTTGAAGTTAAAGATGTGCTTAATTCCACCTTAGATTCTGAGGCTTTAAAACATACACTGTGCAGGCAGGCTAAGAACCAG +>ENSE00003698886 +GTGTGCTGAGGACCACGAAGGCGGTCTGTTAGCTTTGGAGCCGATGCCGACTTTTGGGAAGGGGCTGGACCTCCGCAGAGCAGCTGAGGAAGCATTTGAAGTTAAAGATGTGCTTAATTCCACCTTAGATTCTGAGGCTTTAAAACATACACTGTGCAGGCAGGCTAAGAACCAG +>ENSE00002081080 +GCATATGCAATGATGCTGTCCCTTTCCGAAGACACTCCTCTCCACACCCCCTCCCAGGGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCTCCCCACCCACCATGGTTCATTCCGACTTTTCCAATGGAAACTCAGATCCCAAAAGTCCCTAAAGCAGTCGTAGAGTCTCACCATCTCCAAGGATTGGTCTTGAGAACACTGTTCAGTGACGGCCATGCAGGTGGCCGTCCAAAGACAGCCAACGGAGCTGCCTCGCAGAATCAGCCAGTGGGCAGGTGGACGCTCTGCTGAGACAGAAGCTGGTGGCCACTGCCGGGTGCCCGCGTGGGGTCGCGGAAGGGAATGGATAGACTGGTGTGCTCAAAAGAGAGAGATCACTCAAATGATTTTTATAATGAAATGACAAGAATAACCCTTTTGGTAACCGTATTGACTGCAGAGTCTATTTAAGCATGTGGTTTTAAAAATAGACAGTATTTTTTAAAAATCAAAAAATGACTTGCAAAT +>ENSE00002068021 +GCATATGCAATGATGCTGTCCCTTTCCGAAGACACTCCTCTCCACACCCCCTCCCAGGGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCT +>ENSE00001759023 +GCATATGCAATGATGCTGTCCCTTTCCGAAGACACTCCTCTCCACACCCCCTCCCAGGGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCTCCCCACCCACCATGGTTCATTCCGACTTTTCCAATGGAAACTCAGATCCCAAAAGTCCCTAAAGCAGTCGTAGAGTCTCACCATCTCCAAGGATTGGTCTTGAGAACACTGTTCAGTGACGGCCATGCAGGTGGCCGTCCAAAGACAGCCAACGGAGCTGCCTCGCAGAATCAGCCAGTGGGCAGGTGGACGCTCTGCTGAGACAGAAGCTGGTGGCCACTGCCGGGTGCCCGCGTGGGGTCGCGGAAGGGAATGGATAGACTGGTGTGCTCAAAAGAGAGAGATCACTCAAATGATTTTTATAATGAAATGACAAGAATAACCCTTTTGGTAACCGTATTGACTGCAGAGTCTATTTAAGCATGTGGTTTTAAAAATAGACAGTATTTTTTAAAAATCAAAAAATGACTTGCAAATTGTTTTTTAAAAGTAATTTTGCATTGCTTTGAAATTTGAGCTCATTTGCAAACCCGAGTCTGCCTGGGAACCCGCACTGTGCCTGGGTGTATTCTTTATACTGTAGATAATGGAGAAATTTTCTATCTCTGTCCCTATTTGTATAAGCCAAGGTGATGCTGGGTGCCCCGAGGCAGAACAAGAGGCGCGGGGCCACACCCGTGAACCATGCAGACGGCCGAAGAAGTCTTAGGCAGGGCGCCCTGGGCTGCAGGCCTGCCCGAGGCTGGGATGGGAAGTGTGCCTGCCCTCGTGTGACATGGAATTGGTGTCAGGACCGCCACGTGGCCTTCAGAGGAATCCACAGGTCCCCACCCAAGATCCCTCAATTATATGGGGAAGTCGAGGGCCTGTGGCTTGGATCCGCCATGCAGAGATGTGGCCGGGCACCCATCTTCCTTCCCTCCTCTGTCCCTGCCTCGGCCACCCCACGCGGGAACCCAGCGCCGTCCTCTGAAGGCAGGGCCTTGGCCACGTCCTGGGTCTCCCACCTCCCACCTGACCCCAGCGGCTCCGGTGTCCTCCACGTGGCTGCCCTGGGGAGCAATCCCAGCGGATCGCTCCGGGCCACCAAGCCGCACCTGTGCCTGAGACTCCGGATGGACGACACAGTCGTCACGTCGCTCTTCCTGCGGGTTCTTGGCGAGACACAGCTTGAGAACAGAAGGGCGTCGGGGGAACCTGCCGCAAGGAGCAGAGACAGCACAGCCCCCCGGGCCCAGCCGCCTCCCTCTCTTGGGACGCAACTTCTTCCCCACTCGGATGGGCTTTAAATTATTCCCATAGGGGCCAATTTCAAATAATAATTTTTTTCCCTGATGGAATTTACCTTAATCTGTATATAACTTGTAATTTTTTCTAATTCATTTCTTTTCTTATTTTATTTCCTCCTTAACAGTATTTTTGGCATTAGACATTCTTATTGTGAAGAAATAATGTTAATATAAGTATCTGGTGAAGGACCAAAACCGTGTGATAAGGTTGTGTGTCGTGTGGGAGTGGGGCGATTTTTTATGTGCCAAATACCCCCGTCCCCCCCATGAATCCTGCTGTCCCTGCTGCCGTTTACCAGACAATCATATGTTTTTGTTAAATTTGCGTTTCAGTTACATTTGCATTTAAGACAAGTGTTCTATTTATTTCTTGTATTGTTTGGAAGAAAAAATGATGATAGAGTCCCAAAAAGAAGAGAAAAAAAATGCCCAAGTTGCCCTTTAAAAAAAAAGAGCGTAAATACAAACAGGAGTGGTGCAAGCCGCCTTGGTGTGGGTTTGTGTCACGTGTGGACATCTCCTCAGGCTTTGTGTCACGCGTGGACATCTCCTCAGGCTGTCCCCAGCGGTGACGGGAGGTGTCCTGGCTGCTCCAGGACAAAAGACAATCGTCTCTGTGGGTGCCGGGTGGTCCAGGCTTGCACTGAAGACGTGCCACGGGGAGGCTCCTGCAGGAGGCTCAACCCGACGGATCACAGTGAAAGGGATTCCTCCCACGCCAGATCTGCACAACGAGGCAAGACAGGACCCACCTGTGCGTGCGCTGGGGCCATGGGGTGGCCCCGCCGGGGCAGCGGGGGAGCTGCCTGCAGAAGAGCCAGCTGGCGTGTCGGGAAGGATCCAGGATCTGCAAACACAACTGCTCAGGCCTTCTCACGCGTTTCCACAACATCCCCTGGGTCAGACCCACCAGGTACCCCGTAGGAATTTCCAGTTTCCCTTGATCTAGATGGGATTCTTATAAAAATTCAACCTCAGACATAAACACCCCATTTCTGTAAACCCAAATTATATGGTTTCTTCTGCGAAAGAGTAAGGTGTGTGCTTTTTTTTTTTTGCAATATGACCCCGTCTCTCTGAAGTGGGACATTCGGACGGATGGAGCCCTCAGCGTGTCTTTTCAGCAGGAGCAGAACCGATGAGAGCCGCCCTTACCGTTGGTCTCCGGATCCCCCAGTCCCATCCCGCCGTTTTCGGCTGTCTTCCTAACCGTCCTGTCTTCTCTTGGCGCTCTTTCCTTCCACCTTTCCCAAGAGTCCTGGTTGCACGTTTTAAGTCATATATTTTCGTCCCCCTGAAAATGATGGCAAGCCCAGTTTCTCCTGAGCATTCAGACCCCCAGGCCCCAGCACTTGGCGTTTTCAGGAGGCCCTGTTCTTAGAGCCCCTGACAAAGGCAGCACTTATTTCCTGGGCTGGTGCGCCCCAAAACACGGCCCCGACACTTAGTGTGGCCCCAGGCCCCAGCGAGCCTCGCCCTCCCAGTTTTGCTCTGCCCAGCAGTGTTGGTGCCCAGAGATGACAAGGGCCAGGGAGCCTGGCCCGGGTGTGAGAATTCAGAGATTCTGGCCTCCAGCTGTCACCACACCGTAACGGGGCCATGTAACTGTGCAGCATGGACAGGGATGCGACGGGGCAGCTGGCTGTGTCCATGGCCAGGTGGCCAGGGTCAGGGCTGCAAGCCAGGGGTCCAGGGCCCTTCCGTTCAGCCCAAATGCTGCCCCAATGCTAACTCCTTGGATTGTCAACCCCCATCCCCCAAATGGAAATTCCGAAGGAGGCCTCCTCGCACCTGCCCTCCGCTGCTCCTCAGACCCCAGCCCCCAGCGAGCCGACGTCCCCACCCGTTCCTGCTCTCATCCCCAGGTTGGGCACGTGGGGTTCCTCCTCTGTGGGCCTGGCAGACCCTTCATGAGTGGGACCCAAGATATCACTGACTTCAACCCAGAGGATCGAGCCCCTGCACCCTGCCTGGGGCCCTGGGGTGTGGAGCAGTGGCTGGGGTGGGCGTGGTGTGGCCTGAGAGACTGCCCAGCTGGAGAGGCCTTCCTTTACAAGGCCACGCGTGCAGCTGTCCCATCCAGACCCCGACTGGCCAAGACCTCCACGTCCCCAGAGTCCAGCCCTGGAAATTCCAAGGGCCCTGGCGTCCTCTGCCTTCCCCGCTTCCCCATGAGCGTCTGCAAAACACTTGCCTGAATACATATCACGTATTTTAGACTCGAAGCCTCAAAGCACTGGATTGTGGTCCCCTGCCCCCTCTGTCCCGTCCCCCTGCCCAAGTGACTGAAACCTACTGAGCTATATTCACTGTGCTGTCCTAGGGGGAGGGAGAGCAGAGCTCGCCCCTGCACTGCAGCCTTGTGGGGGAGGGCAAGGCTCTCCTCCCAGCCAGGGACGCCAGGACATAGCTGCTCCTGGTCAGTGGAGGTCAGCCGGGTATCAAAAGCCATGAAACTGTGTCTCTGTAGCAATGAGTGATACTGTGACAAAACCATCCTTGCATTCTTCCTAGAAGAGTTCCTCTGCTCCTTCCATTCCATTTTTGTGTTTGTTTTGTTCTTTTCTGTCACTGATCCGTATTACCACTTTTGGAAAAAAATAAATAAATAAATAAATAAAAGGCAGCTTGAGTTTCCAAACGTGTGATTCACTTGTGAACAAAAGTCATTCTAACAATTGCCTTCAGCGTCACGTGCATTGCCACTGCGCTTTCGGCACGAGGGATGCTGAGCCCTGGTGTCAGAGTCGTAATTTAAAGCGTGTGTGTATATGGACTTTGTCCCTTAAGGTCGATATAAAGAATCCTCGCAGAATCACAGACCTGTGCCGCCCGCCACCTTCTGCCATTGTTACATTACAGATTTGGTTTAGTTTTGTTTTGTTTTGTTTTTTCTTTTAGAACTGTATAGTATTGAAAAAGAAATCAAATGTAAATGTCTGGTTTTCATATAATGTTTAAAAAGACCATTGAGAAGGAGGCTGGCGCTCGCCCCATGTCCCCCTTGATTGTAAATTGCTTCTGTTCTGTTTATAAGTAAACTGTGCATGACTCCTGCTTAGCGGTCATTATCGTGTCTGTTGGTGAAATTTTTATTAAAAGGAAAATTCTGTAGATGCACTTATTGAATATGTGATTAGGATCTACGTCTGAGACTAGGAGTCCTGAACTGCTGACGCGAAAGAGGCGCAGTTCCCAATTAATACGGAAATCGCTGTGGGAGAAGAATGAAATAAGACGTGAAGTGTAGGAAATCATGAAAAGAACAATTTTGCAAATTGCATTCTGATGCTTGTGATGAACACAAATGTACTTGTGTAGAGACATTTCCTTAAGAGAAAGCCTAGGAGAAGCCGATTTGGAGGTTAATGCTGTAGAATAGGACTGTATACCAAATGTAATCTTTCCAATGCTCCAATGAATTTATACATGAGATTGATATGCAATAAATCTGTGTGCTTTTCTAA +>ENSE00001875784 +GCATATGCAATGATGCTGTCCCTTTCCGAAGACACTCCTCTCCACACCCCCTCCCAGGGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCTCCCCACCCACCATGGTTCATTCCGACTTTTCCAATGGAAACTCAGATCCCAAAAGTCCCTAAAGCAGTCGTAGAGTCTCACCATCTCCAAGGATTGGTCTTGAGAACACTGTTCAGTGACGGCCATGCAGGTGGCCGTCCAAAGACAGCCAACGGAGCTGCCTCGCAGAA +>ENSE00001477317 +GCATATGCAATGATGCTGTCCCTTTCCGAAGACACTCCTCTCCACACCCCCTCCCAGGGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCTCCCCACCCACCATGGTTCATTCCGACTTTTCCAATGGAAACTCAGATCCCAAAAGTCCCTAAAGCAGTCGTAGAGTCTCACCATCTCCAAGGATTGGTCTTGAGAACACTGTTCAGTGACGGCCATGCAGGTGGCCGTCCAAAGACAGCCAACGGAGCTGCCTCGCAGAATCAGCCAGTGGGCAGGTGGACGCTCTGCTGAGACAGAAGCTGGTGGCCACTGCCGGGTGCCCGCGTGGGGTCGCGGAAGGGAATGGATAGACTGGTGTGCTCAAAAGAGAGAGATCACTCAAATGATTTTTATAATGAAATGACAAGAATAACCCTTTTGGTAACCGTATTGACTGCAGAGTCTATTTAAGCATGTGG +>ENSE00001477303 +GGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCTCCCCACCCACCATGGTTCATTCCGACTTTTCCAATGGAAACTCAGATCCCAAAAGTCCCTAAAGCAGTCGTAGAGTCTCACCATCTCCAAGGATTGGTCTTGAGAACACTGTTCAGTGACGGCCATGCAGGTGGCCGTCCAAAGACAGCCAACGGAGCTGCCTCGCAGAATCAGCCAGTGGGCAGGTGGACGCTCTGCTGAGACAGAAGCTGGTGGCCACTGCCGGGTGCCCGCGTGGGGTCGCGGAAGGGAATGGATAGACTGGTGTGCTCAAAAGAGAGAGATCACTCAAATGATTTTTATAATGAAATGACAAGAATAACCCTTTTGGTAACCGTATTGACTGCAGAGTCTATTTAAGCATGTGGTTTTAAAAATAGACAGTATTTTTTAAAAATCAAAAAATGACTTGCAAATTGTTTTTTAAAAGTAATTTTGCATTGCTTTGAAATTTGAGCTCATTTGCAAACCCGAGTCTGCCTGGGAACCCGCACTGTGCCTGGGTGTATTCTTTATACTGTAGATAATGGAGAAATTTTCTATCTCTGTCCCTATTTGTATAAGCCAAGGTGATGCTGGGTGCCCCGAGGCAGAACAAGAGGCGCGGGGCCACACCCGTGAACCATGCAGACGGCCGAAGAAGTCTTAGGCAGGGCGCCCTGGGCTGCAGGCCTGCCCGAGGCTGGGATGGGAAGTGTGCCTGCCCTCGTGTGACATGGAATTGGTGTCAGGACCGCCACGTGGCCTTCAGAGGAATCCACAGGTCCCCACCCAAGATCCCTCAATTATATGGGGAAGTCGAGGGCCTGTGGCTTGGATCCGCCATGCAGAGATGTGGCCGGGCACCCATCTTCCTTCCCTCCTCTGTCCCTGCCTCGGCCACCCCACGCGGGAACCCAGCGCCGTCCTCTGAAGGCAGGGCCTTGGCCACGTCCTGGGTCTCCCACCTCCCACCTGACCCCAGCGGCTCCGGTGTCCTCCACGTGGCTGCCCTGGGGAGCAATCCCAGCGGATCGCTCCGGGCCACCAAGCCGCACCTGTGCCTGAGACTCCGGATGGACGACACAGTCGTCACGTCGCTCTTCCTGCGGGTTCTTGGCGAGACACAGCTTGAGAACAGAAGGGCGTCGGGGGAACCTGCCGCAAGGAGCAGAGACAGCACAGCCCCCCGGGCCCAGCCGCCTCCCTCTCTTGGGACGCAACTTCTTCCCCACTCGGATGGGCTTTAAATTATTCCCATAGGGGCCAATTTCAAATAATAATTTTTTTCCCTGATGGAATTTACCTTAATCTGTATATAACTTGTAATTTTTTCTAATTCATTTCTTTTCTTATTTTATTTCCTCCTTAACAGTATTTTTGGCATTAGACATTCTTATTGTGAAGAAATAATGTTAATATAAGTATCTGGTGAAGGACCAAAACCGTGTGATAAGGTTGTGTGTCGTGTGGGAGTGGGGCGATTTTTTATGTGCCAAATACCCCCGTCCCCCCCA diff --git a/pygtftk/data/mini_real_10M/expected_sequence_rev_comp.fa b/pygtftk/data/mini_real_10M/expected_sequence_rev_comp.fa new file mode 100644 index 00000000..6e4095ff --- /dev/null +++ b/pygtftk/data/mini_real_10M/expected_sequence_rev_comp.fa @@ -0,0 +1,136 @@ +>ENST00000624697 +CGGCCTCACGCGTCCGTGCAGCGGAGGCTTCCTGAGCCCCCTGGAGAGCCTGGCCTGGGCCCGGGTGTGGAGACCCTCCCGGGCTTTCAATCCGGGCAGGAGGCAGATGGCAGACTCAGCAGTCACGTAAGAGAACCGAATTAGGAATCGCTTAATTCTGAAAGTCTGGTGAGAAGACACGGCGAGAATCGGGGTCCAGCACAGATGATGGCGACAGCGGAGAAGGGAAGGGCTGGGACCTGACGGTGAAGATGCTGGCGGGCAACGAATTCCAGGTGTCCCTGAGCAGCTCCATGTCGGTGTCAGAGCTGAAGGCGCAGATCACCCAGAAGATCGGCGTGCACGCCTTCCAGCAGCGTCTGGCTGTCCACCCGAGCGGTGTGGCGCTGCAGGACAGGGTCCCCCTTGCCAGCCAGGGCCTGGGCCCCGGCAGCACGGTCCTGCTGGTGGTGGACAAATGCGACGAACCTCTGAGCATCCTGGTGAGGAATAACAAGGGCCGCAGCAGCACCTACGAGGTACGGCTGACGCAGACCGTGGCCCACCTGAAGCAGCAAGTGAGCGGGCTGGAGGGTGTGCAGGACGACCTGTTCTGGCTGACCTTCGAGGGGAAGCCCCTGGAGGACCAGCTCCCGCTGGGGGAGTACGGCCTCAAGCCCCTGAGCACCGTGTTCATGAATCTGCGCCTGCGGGGAGGCGGCACAGAGCCTGGCGGGCGGAGCTAAGGGCCTCCACCAGCATCCGAGCAGGATCAAGGGCCGGAAATAAAGGCTGTTGTAAAGAGAAA +>ENST00000624652 +ACGCGTCCGTGCAGCGGAGGCTTCCTGAGCCCCCTGGAGAGCCTGGCCTGGGCCCGGGTGTGGAGACCCTCCCGGGCTTTCAATCCGGGCAGGAGGCAGATGGCAGACTCAGCAGTCACGAATCGCTTAATTCTGAAAGTCTGGTGAGAAGACACGGCGAGAATCGGGGTCCAGCACAGATGATGGCGACAGCGGAGAAGGGAAGGGCTGGGACCTGACGGTGAAGATGCTGGCGGGCAACGAATTCCAGGTGTCCCTGAGCAGCTCCATGTCGGTGTCAGAGCTGAAGGCGCAGATCACCCAGAAGATCGGCGTGCACGCCTTCCAGCAGCGTCTGGCTGTCCACCCGAGCGGTGTGGCGCTGCAGGACAGGGTCCCCCTTGCCAGCCAGGGCCTGGGCCCCGGCAGCACGGTCCTGCTGGTGGTGGACAAATGCGACGAACCTCTGAGCATCCTGGTGAGGAATAACAAGGGCCGCAGCAGCACCTACGAGGTACGGCTGACGCAGACCGTGGCCCACCTGAAGCAGCAAGTGAGCGGGCTGGAGGGTGTGCAGGACGACCTGTTCTGGCTGACCTTCGAGGGGAAGCCCCTGGAGGACCAGCTCCCGCTGGGGGAGTACGGCCTCAAGCCCCTGAGCACCGTGTTCATGAATCT +>ENST00000379389 +CGCAGGCTCGGCGGCACGCCCCCTGACGTGTGTGCCTCAGGCTTATAATAGGGCCGGTGCTGCCTGCCGAAGCCGGCGGCTGAGAGGCAGCGAACTCATCTTTGCCAGTACAGGAGCTTGTGCCGTGGCCCACAGCCCACAGCCCACAGCCATGGGCTGGGACCTGACGGTGAAGATGCTGGCGGGCAACGAATTCCAGGTGTCCCTGAGCAGCTCCATGTCGGTGTCAGAGCTGAAGGCGCAGATCACCCAGAAGATCGGCGTGCACGCCTTCCAGCAGCGTCTGGCTGTCCACCCGAGCGGTGTGGCGCTGCAGGACAGGGTCCCCCTTGCCAGCCAGGGCCTGGGCCCCGGCAGCACGGTCCTGCTGGTGGTGGACAAATGCGACGAACCTCTGAGCATCCTGGTGAGGAATAACAAGGGCCGCAGCAGCACCTACGAGGTACGGCTGACGCAGACCGTGGCCCACCTGAAGCAGCAAGTGAGCGGGCTGGAGGGTGTGCAGGACGACCTGTTCTGGCTGACCTTCGAGGGGAAGCCCCTGGAGGACCAGCTCCCGCTGGGGGAGTACGGCCTCAAGCCCCTGAGCACCGTGTTCATGAATCTGCGCCTGCGGGGAGGCGGCACAGAGCCTGGCGGGCGGAGCTAAGGGCCTCCACCAGCATCCGAGCAGGATCAAGGGCCGGAAATAAAGGCTGTTGTAAAGAGAAA +>ENST00000338370 +CGAGGTCGGGCTTGGGAAGGGTCAGCGGGAGGCCTGAGGGCGCCGGGCGCTGCGGCAGGCGGGCCCGGGGTCCAGCCGAGAGGGTCCGGGCGCCAGGCAACGCGATTCGCGCGGGGGTGAACCCGGGGAGGGGGCCGGCCTCCCCGTTCTGGGACCTTTCGGTGCGTCCGAGCGCGACACCGCCCGCGTCGGGGGCTTGGGAGCCTCGGGGCGCGAGCTGTGTTGGAAGCAAAGTCCTCCTTGTGGGTTGGGGTGGCGGAGGGAGAAGGGAAGCGAGGGTCGCGGCGGGACCAGACGCCCCAGTCCCGGCCCGCCCGCGACTACTGAAGGCGCTGCCGCCTGACCTGAACGGGCACTTGTGTTCCAGCTCCCCTGGGACCTGTGGCCGCCGCCCACAGACCATGCTCCTGGGGCGCCTGACTTCCCAGCTGTTGAGGGCCGTTCCTTGGGCAGGCGGCCGCCCGCCTTGGCCCGTCTCTGGAGTGCTGGGCAGCCGGGTCTGCGGGCCCCTTTACAGCACATCGCCGGCCGGCCCAGGTAGGGCGGCCTCTCTCCCTCGCAAGGGGGCCCAGCTGGAGCTGGAGGAGATGCTGGTCCCCAGGAAGATGTCCGTCAGCCCCCTGGAGAGCTGGCTCACGGCCCGCTGCTTCCTGCCCAGACTGGATACCGGGACCGCAGGGACTGTGGCTCCACCGCAATCCTACCAGTGTCCGCCCAGCCAGATAGGGGAAGGGGCCGAGCAGGGGGATGAAGGCGTCGCGGATGCGCCTCAAATTCAGTGCAAAAACGTGCTGAAGATCCGCCGGCGGAAGATGAACCACCACAAGTACCGGAAGCTGGTGAAGAAGACGCGGTTCCTGCGGAGGAAGGTCCAGGAGGGACGCCTGAGACGCAAGCAGATCAAGTTCGAGAAAGACCTGAGGCGCATCTGGCTGAAGGCGGGGCTAAAGGAAGCCCCCGAAGGCTGGCAGACCCCCAAGATCTACCTGCGGGGCAAATGAGTCTGGCGCCGCCCTTCCCGCCCGTTGCTGCTGTGATCCGTAGTAATAAATTCTCAGAGGACTCAGCCTTT +>ENST00000338338 +GGAATCCGGCCCCTGGGTGGTCCGGAAACGATTCTGGACCTGCGGGTATATCCAGGGCCCGCACCCCCTGGGATTGTGGGAAATGTAGTTTTTTGCCTCCGTAAGGGACCAGGCGGAGCTGAGGAACCGCGCGAGGACTGGGACCGTGATTCCACTAACCGGAAACCGTCGCCTTTCGGGCCCGGCGGGGCCTGAGCCAATGCAGAATCGGGGGCCGCGAGGACGCCAGCGGGCGCTGTGCGTAGGAACCGCCGGGTGGCCGCTGCCGATCGGGGCCGACTTGGGGACGGACCGGAAGTGCCCGAGGGCGGCCGCAGAACGGTCAATTTGAGCCGCGTCGAGCTCCCCTGGGACCTGTGGCCGCCGCCCACAGACCATGCTCCTGGGGCGCCTGACTTCCCAGCTGTTGAGGGCCGTTCCTTGGGCAGGCGGCCGCCCGCCTTGGCCCGTCTCTGGAGTGCTGGGCAGCCGGGTCTGCGGGCCCCTTTACAGCACATCGCCGGCCGGCCCAGGTAGGGCGGCCTCTCTCCCTCGCAAGGGGGCCCAGCTGGAGCTGGAGGAGATGCTGGTCCCCAGGAAGATGTCCGTCAGCCCCCTGGAGAGCTGGCTCACGGCCCGCTGCTTCCTGCCCAGACTGGATACCGGGACCGCAGGGACTGTGGCTCCACCGCAATCCTACCAGTGTCCGCCCAGCCAGATAGGGGAAGGGGCCGAGCAGGGGGATGAAGGCGTCGCGGATGCGCCTCAAATTCAGTGCAAAAACGTGCTGAAGATCCGCCGGCGGAAGATGAACCACCACAAGTACCGGAAGCTGGTGAAGAAGACGCGGTTCCTGCGGAGGAAGGTCCAGGAGGGACGCCTGAGACGCAAGCAGATCAAGTTCGAGAAAGACCTGAGGCGCATCTGGCTGAAGGCGGGGCTAAAGGAAGCCCCCGAAGGCTGGCAGACCCCCAAGATCTACCTGCGGGGCAAATGAGTCTGGCGCCGCCCTTCCCGCCCGTTGCTGCTGTGATCCGTAGTAATAAATTCTCAGAGGACTCAGCCTTT +>ENST00000321751 +TTTGAGCCGCGTCGAGGTCGGGCTTGGGAAGGGTCAGCGGGAGGCCTGAGGGCGCCGGGCGCTGCGGCAGGCGGGCCCGGGGTCCAGCCGAGAGGCTCCCCTGGGACCTGTGGCCGCCGCCCACAGACCATGCTCCTGGGGCGCCTGACTTCCCAGCTGTTGAGGGCCGTTCCTTGGGCAGGCGGCCGCCCGCCTTGGCCCGTCTCTGGAGTGCTGGGCAGCCGGGTCTGCGGGCCCCTTTACAGCACATCGCCGGCCGGCCCAGGTAGGGCGGCCTCTCTCCCTCGCAAGGGGGCCCAGCTGGAGCTGGAGGAGATGCTGGTCCCCAGGAAGATGTCCGTCAGCCCCCTGGAGAGCTGGCTCACGGCCCGCTGCTTCCTGCCCAGACTGGATACCGGGACCGCAGGGACTGTGGCTCCACCGCAATCCTACCAGTGTCCGCCCAGCCAGATAGGGGAAGGGGCCGAGCAGGGGGATGAAGGCGTCGCGGATGCGCCTCAAATTCAGTGCAAAAACGTGCTGAAGATCCGCCGGCGGAAGATGAACCACCACAAGTACCGGAAGCTGGTGAAGAAGACGCGGTTCCTGCGGAGGAAGGTCCAGGAGGGACGCCTGAGACGCAAGCAGATCAAGTTCGAGAAAGACCTGAGGCGCATCTGGCTGAAGGCGGGGCTAAAGGAAGCCCCCGAAGGCTGGCAGACCCCCAAGATCTACCTGCGGGGCAAATGAGTCTGGCGCCGCCCTTCCCGCCCGTTGCTGCTGTGATCCGTAGTAATAAATTCTCAGAGGACTCAGCCT +>ENST00000378853 +TCAATTTGAGCCGCGTCGAGGTCGGGCTTGGGAAGGGTCAGCGGGAGGCCTGAGGGCGCCGGGCGCTGCGGCAGGCGGGCCCGGGGTCCAGCCGAGAGGGTCCGGGCGCCAGGCAACGCGATTCGCGCGGGGGTGAACCCGGGGAGGGGGCCGGCCTCCCCGTTCTGGGACCTTTCGCTCCCCTGGGACCTGTGGCCGCCGCCCACAGACCATGCTCCTGGGGCGCCTGACTTCCCAGCTGTTGAGGGCCGTTCCTTGGGCAGGCGGCCGCCCGCCTTGGCCCGTCTCTGGAGTGCTGGGCAGCCGGGTCTGCGGGCCCCTTTACAGCACATCGCCGGCCGGCCCAGGTAGGGCGGCCTCTCTCCCTCGCAAGGGGGCCCAGCTGGAGCTGGAGGAGATGCTGGTCCCCAGGAAGATGTCCGTCAGCCCCCTGGAGAGCTGGCTCACGGCCCGCTGCTTCCTGCCCAGACTGGATACCGGGACCGCAGGGACTGTGGCTCCACCGCAATCCTACCAGTGTCCGCCCAGCCAGATAGGGGAAGGGGCCGAGCAGGGGGATGAAGGCGTCGCGGATGCGCCTCAAATTCAGTGCAAAAACGTGCTGAAGATCCGCCGGCGGAAGATGAACCACCACAAGTACCGGAAGCTGGTGAAGAAGACGCGGTTCCTGCGGAGGAAGGTCCAGGAGGGACGCCTGAGACGCAAGCAGATCAAGTTCGAGAAAGACCTGAGGCGCATCTGGCTGAAGGCGGGGCTAAAGGAAGCCCCCGAAGGCTGGCAGACCCCCAAGATCTACCTGCGGGGCAAATGAGTCTGGCGCCGCCCTTCCCGCCCGTTGCTGCTGTGATCCGTAGTAATAAATTCTCAGAGGACTC +>ENST00000489799 +GGGAAGGGTCAGCGGGAGGCCTGAGGGCGCCGGGCGCTGCGGCAGGCGGGCCCGGGGTCCAGCCGAGAGGGTCCGGGCGCCAGGCAACGCGATTCGCGCGGGGGTGAACCCGGGGAGGGGGCCGGCCTCCCCGTTCTGGGACCTTTCGCTCCCCTGGGACCTGTGGCCGCCGCCCACAGACCATGCTCCTGGGGCGCCTGACTTCCCAGCTGTTGAGGGCCGTTCCTTGGGCAGGTAGGAAGCCGCGCGGGGGCGGATGGGAGGATGCACACCTGGTTAGGAGTGCGGGTCTCAGCAGCTCCGCTGGGGCAGGGCCGGTGGCCACACACACACTCTTTCCCCTCTAAGCTTCCGATGCTCACAGAGGGAACCTCAGGGGTTCAGGCCAGGAATGAGGTGCGGGGGATCCTCGCTGGGACGAACCTGCTGCTCCTCAACCCGACGGGCCTGTGTGGTCTCGCGAGCGGTGACCGTGGCGTCTGGTTTTCTGCAGGCGGCCGCCCGCCTTGGCCCGTCTCTGGAGTGCTGGGCAGCCGGGTCTGCGGGCCCCTTTACAGCACATCGCCGGCCGGCCCAGGTAGGGCGGCCTCTCTCCCTCGCAAGGGGGCCCAGCTGGAGCTGGAGGAGATGCTGGTCCCCAGGAAGATGTCCGTCAGCCCCCTGGAGAGCTGGCTCACGGCCCGCTGCTTCCTGCC +>ENST00000496905 +GTCGAGGTCGGGCTTGGGAAGGGTCAGCGGGAGGCCTGAGGGCGCCGGGCGCTGCGGCAGGCGGGCCCGGGGTCCAGCCGAGAGGGTCCGGGCGCCAGGCAACGCGATTCGCGCGGGGGTGAACCCGGGGAGGGGGCCGGCCTCCCCGTTCTGGGACCTTTCGGTGCGTCCGAGCGCGACACCGCCCGCGTCGGGGGCTTGGGAGCCTCGGGGCGCGAGCTGTGTTGGAAGCAAAGTCCTCCTTGTGGGTTGGGGTGGCGGAGGGAGAAGGGAAGCGAGGGTCGCGGCGGGACCAGACGCCCCAGTCCCGGCCCGCCCGCGACTACTGAAGGCGCTGCCGCCTGACCTGAACGGGCACTTGTGTTCCAGCTCCCCTGGGACCTGTGGCCGCCGCCCACAGACCATGCTCCTGGGGCGCCTGACTTCCCAGCTGTTGAGGGCCGTTCCTTGGGCAGCTTCCGATGCTCACAGAGGGAACCTCAGGGGTTCAGGCCAGGAATGAGGTGCGGGGGATCCTCGCTGGGACGAACCTGCTGCTCCTCAACCCGACGGGCCTGTGTGGTCTCGCGAGCGGTGACCGTGGCGTCTGGTTTTCTGCAGGCGGCCGC +>ENST00000378602 +TCCGCTGTCGCCCAGTCCCGGCCGCTGGCGGGAACTGACCTGGAGCAAGCAGGACCTTCCCTCCCACCTCTCCCGCCTGGCCTCCGCGGGAGTCCCCTACGATCCCGCTCAGCAGTGGGGCACTCGCTGAGGACAGCGAGTCCTGGGAGTGAGCCCAAGGCCACCCCTGGCCAGCCCAGGAGAGATAGCCAGGGCAGGCCCAGCAGCCCGAGGCCAGGCTCTGGCCACGGCGGTCTCCGACATGGAGAGACATTGTCTGCTTTTTATCCTGTTAACCTGTCTTCGGTGGTTGTGCCACGACATTCCCCAGGGTGCAGGTGCCCGGTGGCCGAGGGTCAGTCCAGTGGTAGAGCCTTGCTCTCCTAGGCTCATCCTGCTGGCGGTCCTCCTGCTTCTGCTGTGTGGTGTCACAGCTGGTTGTGTCCGGTTCTGCTGCCTCCGGAAGCAGGCACAGGCCCAGCCACATCTGCCACCAGCACGGCAGCCCTGCGACGTGGCAGTCATCCCTATGGACAGTGACAGCCCTGTACACAGCACTGTGACCTCCTACAGCTCCGTGCAGTACCCACTGGGCATGCGGTTGCCCCTGCCCTTTGGGGAGCTGGACCTGGACTCCATGGCTCCTCCTGCCTACAGCCTGTACACCCCGGAGCCTCCACCCTCCTACGATGAAGCTGTCAAGATGGCCAAGCCCAGAGAGGAAGGACCAGCACTCTCCCAGAAACCCAGCCCTCTCCTTGGGGCCTCGGGCCTAGAGACCACTCCAGTGCCCCAGGAGTCGGGCCCCAATACTCAACTACCACCTTGTAGCCCTGGTGCCCCTTGAAGGAGGTAGGAGAACGGACCAGAGCTTGGAGAACTAATGCTTGGAGCCAAGGGCCCCAGCCCACCCCACCGTCCCACACATTGCTGTGGCCCCAACCTCGGTGCCATGTTACACCGGCCCCTGGCGTCACCCACTAGGCAGGCTGCTGCTTTCAGCCTCAGCCCCTGGCCCAGCCCCAGCAGGCCCTCAGCCTGGAAGAGGCCCCTTGGGCCTAAGCCTCGGGTGGGAGCTCAGGGCCACCTGTGACGTCTGCATCTTCTTGGAGAGAGAATAAAGTTTGTATTTAAGTGGT +>ENST00000310991 +CTCAGAGCATGGCCCGGGGGCCGCTGGCCGCCCGCGGACTGCGGCTGCTGCTGCCGCTCCTGCCGCTCCTGCCGCTCCTGCCGCTGCCGCAGGTGGCGCTGGGCTTCGCGGACGGCAGCTGCGACCCCTCGGACCAGTGCCCGCCCCAGGCCCGCTGGAGCAGCCTGTGGCACGTGGGGCTCATCCTGCTGGCGGTCCTCCTGCTTCTGCTGTGTGGTGTCACAGCTGGTTGTGTCCGGTTCTGCTGCCTCCGGAAGCAGGCACAGGCCCAGCCACATCTGCCACCAGCACGGCAGCCCTGCGACGTGGCAGTCATCCCTATGGACAGTGACAGCCCTGTACACAGCACTGTGACCTCCTACAGCTCCGTGCAGTACCCACTGGGCATGCGGTTGCCCCTGCCCTTTGGGGAGCTGGACCTGGACTCCATGGCTCCTCCTGCCTACAGCCTGTACACCCCGGAGCCTCCACCCTCCTACGATGAAGCTGTCAAGATGGCCAAGCCCAGAGAGGAAGGACCAGCACTCTCCCAGAAACCCAGCCCTCTCCTTGGGGCCTCGGGCCTAGAGACCACTCCAGTGCCCCAGGAGTCGGGCCCCAATACTCAACTACCACCTTGTAGCCCTGGTGCCCCTTGAAGGAGGTAGGAGAACGGACCAGAGCTTGGAGAACTAATGCTTGGAGCCAAGGGCCCCAGCCCACCCCACCGTCCCACACATTGCTGTGGCCCCAACCTCGGTGCCATGTTACACCGGCCCCTGGCGTCACCCACTAGGCAGGCTGCTGCTTTCAGCCTCAGCCCCTGGCCCAGCCCCAGCAGGCCCTCAGCCTGGAAGAGGCCCCTTGGGCCTAAGCCTCGGGTGGGAGCTCAGGGCCACCTGTGACGTCTGCATCTTCTTGGAGAGAGAATAAAGTTTGTATTTAAGTGG +>ENST00000378598 +GGGGGCCGCTGGCCGCCCGCGGACTGCGGCTGCTGCTGCCGCTCCTGCCGCTCCTGCCGCTCCTGCCGCTGCCGCAGGTGGGTCGGGCGGCGTTCTCTCTCGGTTCGGCCACCGCGGGGCGGGTCCCTGCTCGGACCACGCCCCTCCCGGGCTCACCCTTGTCCCCACAGGTGGCGCTGGGCTTCGCGGACGGCAGCTGCGACCCCTCGGACCAGTGCCCGCCCCAGGCCCGCTGGAGCAGCCTGTGGCACGTGGGCCTGTACACCCCGGAGCCTCCACCCTCCTACGATGAAGCTGTCAAGATGGCCAAGCCCAGAGAGGAAGGACCAGCACTCTCCCAGAAACCCAGCCCTCTCCTTGGGGCCTCGGGCCTAGAGACCACTCCAGTGCCCCAGGAGTCGGGCCCCAATACTCAACTACCACCTTGTAGCCCTGGTGCCCCTTGAAGGAGGTAGGAGAACGGACCAGAGCTTGGAGAACTAA +>ENST00000470931 +AGAGCATGGCCCGGGGGCCGCTGGCCGCCCGCGGACTGCGGCTGCTGCTGCCGCTCCTGCCGCTCCTGCCGCTCCTGCCGCTGCCGCAGGTGGCGCTGGGCTTCGCGGACGGCAGCTGCGACCCCTCGGACCAGTAAGTCGGGGGGGAGGGAGCCGGGGCCTGGCCCCGCCCTATGGGGAGGCACGGGTGGCGAGGTCGGCCGTCCCATGCCCCGCCTGCTCCAGGTGCCGCCGTCCCCACAGGTGCCCGCCCCAGGCCCGCTGGAGCAGCCTGTGGCACGTGGGGCTCATCCTGCTGGCGGTCCTCCTGCTTCTGCTGTGTGGTGTCACAGCTGGTTGTGTCCGGTTCTGCTGCCTCCGGAAGCAGGCACAGGCCCAGCCACATCTGCCACCAGCACGGCAGCCCTGCGACGTGGCAGTCATCCCTATGGACAGTGACAGCCCTGTACACAGCACTGTGACCTCCTACAGCTCCGTGCAGTACCCACTGGGCATGCGGTTGCCCCTGCCCTTTGGGGAGCTGGACCTGGACTCCATGGCTCCTCCTGCCTACAGCCTGTACACCCCGGAGCCTCCACCCTCCTACGATGAAGCTGTCAAGATGGCCAAGCCCAGAGAGGAAGGACCAGCACTCTCCCAGAAACCCAGCCCTCTCCTTGGGGCCTCGGGCCTAGAGACCACTCCAGTGCC +>ENST00000602604 +GAGCATGGCCCGGGGGCCGCTGGCCGCCCGCGGACTGCGGCTGCTGCTGCCGCTCCTGCCGCTCCTGCCGCTCCTGCCGCTGCCGCAGGTGGCGCTGGGCTTCGCGGACGGCAGCTGCGACCCCTCGGACCAGTGCCCGCCCCAGGCCCGCTGGAGCAGCCTGTGGCACGTGGGGTAAGTGGAGGCCGCGGCGGAGCCGTGCGTCCGACGGTTCTGGGGCGGGGGTCACCGGGGCCAGGCCCGCCAGGCCCTTACCTCACCAGGCCGCCTCCGCTGTCGCCCAGTCCCGGCCGCTGGCGGGAACTGACCTGGAGCAAGCAGGACCTTCCCTCCCACCTCTCCCGCCTGGCCTCCGCGGGAGTCCCCTACGATCCCGCTCAGCAGTGGGGCACTCGCTGAGGACAGCGAGTCCTGGGAGTGAGCCCAAGGCCACCCCTGGCCAGCCCAGGAGAGATAGCCAGGGCAGGCCCAGCAGCCCGAGGCCAGGCTCTGGCCACGGCGGTCTCCGACATGGAGAGACATTGTCTGCTTTTTATCCTGTTAACCTGTCTTCGGTGGTTGTGCCACGACATTCCCCAGGGTGCAGGTGCCCGGTGGCCGAGGGTCAGTCCAGTGGTAGAGCCTTGCTCTCCTAGGCTCATCCTGCTGGCGGTCCTCCTGCTTCTGCTGTGTGGTGTCACAGCTGGTTGTGTCCGGTTCTGCTGCCTCCGGAAGCAGGCACAGGCCCAGCCACATCTGCCACCAGCACGGCAGCCCTGCGACGTGGCAGTCATCCCTATGGACAGTGACAGCCCTGTACACAGCACTGTGACCTCCTACAGCTCCGTGCAGTACCCACTGGGCATGCGGTTGCCCCTGCCCTTTGGGGAGCTGGACCT +>ENST00000416272 +GAGCATGGCCCGGGGGCCGCTGGCCGCCCGCGGACTGCGGCTGCTGCTGCCGCTCCTGCCGCTCCTGCCGCTCCTGCCGCTGCCGCAGGTGGGTCGGGCGGCGTTCTCTCTCGGTTCGGCCACCGCGGGGCGGGTCCCTGCTCGGACCACGCCCCTCCCGGGCTCACCCTTGTCCCCACAGGTGGCGCTGGGCTTCGCGGACGGCAGCTGCGACCCCTCGGACCAGTGCCCGCCCCAGGCCCGCTGGAGCAGCCTGTGGCACGTGGGGCTCATCCTGCTGGCGGTCCTCCTGCTTCTGCTGTGTGGTGTCACA +>ENST00000400919 +CTCACTTCCGCCCGGCGCGGGCTTGGATGGAGGCGGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGTACTTCAACTCCCGCCCCCACCTGTGTCCCGCTGGCTCCTAAGCTGCCCCCCTACGTGTGGGTTGCGTCTGAGATGTGGGGCAGGCGCCACTCACGGAAAAAAGGCATCAGAGGAGCTTCCACATCATCGGAACATTTTATTCCTCAGGACGCTACACGCTCACTTTCCTGGCGGAGCAGGTCAGTGCATCGAGTTCTGTTTCCGTGGAAAATGTGCACCTTGGAAACCGCATGACAGCCCCCTCGGCAGGGTCCCCGCGGATCCGCCGCGACGCAGGCACAGCAGCAAGTTCCTCCAGCACGAAGCTGGCCTGCCCGGGCCCAGGTGTGAGGGACTGTTCTGCTCCCAGCAGCGCCCGCTGACGCTTCCCTCTGCGGTCTCGGCGCAAGCGTCTGTCCCTGGCCGCCCTCGGAGCCGTGCCCAGCCTGGCATGCATATGCGGTGGTTAAGGATACAGTTAAAGGGTCAATCACGCGTGTCCACGACAGAGACGCACGCGGCCTCACACCGACTCCTCGGTGGACAGCAATAATGGGTTGATATACTCAAAGCCTTCGAACTCTGACTGGTCGATCCTCTTTATGGCATCCCTGTGGGCAAAGGTGGCAGGGGGGAGGGGGGTGACCGTGTGTTCATTCCCTTGGGGGAAGCGGAGTCACGTTCGCATAAGAATCCTCCCCCAACGCCCACTGGAGAGATGACACCAGGCGGGTGGGACTCAAGGGCAGGCTGGGTCACCAGCTGCCCAAGGTGCCGGCCTGCCATGGGGCTGCCCGAGGGGTGCTCCAGGGACCCGCACCCAGTGGGACTCACTCATCGTCTGGGGTCAGCTGCACGGGCTCGCTGGTGAACTGTGTGTCAAAGTTGTCCAGACCGTAGTCGTCTGTGATCTGTGGCTGGAATGGAGGGAGCGCCTGCTTCTTCTCCAGCTTGGAAAAACAATAGGAGAAGGGTCAGCTCCGCGCGGGCATCATCCCTACCAGATTGAGTGTTTTGCACGCACTTCAATCACAAAATGAAACAGTGAGAAAGTCAGCATTTCAATCTGCCT +>ENST00000469733 +CTTTTGTGGGGTCAGTGCCCACAGGGTTGAGCACCACGTGCCTGGCTGGGCAGTGCTCCTGCCAGGGTCCCCTTCTCCACTGTAGGAAACACGGCTGCTCCTGCAGCCGCGTCTGCTCTGCTGCATCTCCAGCTCCTGCCAGGCATGGTGTGCGCGGCCCCAAGACAGGGAGTTTCCATAGAGACAGGGTTTCACCGTGTTAGCCAGGATGGTCTCGATCTCCTGACCTCGTGATCCGCCCGCCTCGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACCACGCCCGGCCCCCAGAGCCTTAGTCTCAGAATCACACCCACCCCACGCCCAGGGCGTCTGTCACAGCTTTCCAATCCATGAGCCCATCAATCGGACTGGACACAGATAAACTGGGACAGGACGCCGGGTGGCAAAGGCCGGGAGAGCTGGGCCACTCCCTCCAAAAGGCCCCAGACGCAGCTGCATCCTGGAGTCCTTCTGAGAAATGTGGGACCTGCCCCAGCTCCACCCCAGGTGAGGGGCACCAGCCAGCTCCAGAGCTGCCTACCTTCCCTGTCAGGTGCACAGGTCAGCGCCAGGCCAACCCCAGAGCGAGAACACCTGTGCTGGACTGAGCTGGAGCAGCAGGGTGGCCTGCACCGGGGCAGCGAGGGAGGCGTTGGATGGAGCCACCCCACGGCTCCTCTGTGAAGGTCTGCACGTCACTCAGAAAGTTGAAGCAAACCAAGCAGGGTTGGAGCCCACAGTTCACAGCCGGCTGCACAGGGGATGCACCAAGCACAGTTTCCTATGACAAGTGGAAACCTGTGCGCCACAGCAAAACTCCGTCACCACAGCAGCAGATGGCTCCGAAGAAGTGGAGCGTTTTCATCAGGTTCAACTTTGAAACCTCCACCATCACCATCACCAGCACCGCTGTGTCATGCTGATAACTTGAGGACAGGCAGGACAAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGTACTTCAACTCCCGCCCCCACCTGTGTCCCGCTGGCTCCTAAGCTGCCCCCCTACGTGTGGGTTGCGTCTGAGATGTGGGGCAGGCGCCACTCACGGAAAAAAGGCATCAGAGGAGCTTCCACATCATCGGAACATTTTATTCCTCAGGACGCTACACGCTCACTTTCCTGGCGGAGCAGGTCAGTGCATCGAGTTCTGTTTCCGTGGAAAATGTGCACCTTGGAAACCGCATGACAGCCCCCTCGGCAGGGTCCCCGCGGATCCGCCGCGACGCAGGCACAGCAGCAAGTTCCTCCAGCACGAAGCTGGCCTGCCCGGGCCCAGGTGTGAGGGACTGTTCTGCTCCCAGCAGCGCCCGCTGACGCTTCCCTCTGCGGTCTCGGCGCAAGCGTCTGTCCCTGGCCGCCCTCGGAGCCGTGCCCAGCCTGGCATGCATATGCGGTGGTTAAGGATACAGTTAAAGGGTCAATCACGCGTGTCCACGACAGAGACGCACGCGGCCTCACACCGACTCCTCGGTGGACAGCAATAATGGGTTGATATACTCAAAGCCTTCGAACTCTGACTGGTCGATCCTCTTTATGGCATCCCTGTGGGCAAAGGTGGCAGGGGGGAGGGGGGTGACCGTGTGTTCATTCCCTTGGGGGAAGCGGAGTCACGTTCGCATAAGAATCCTCCCCCAACGCCCACTGGAGAGATGACACCAGGCGGGTGGGACTCAAGGGCAGGCTGGGTCACCAGCTGCCCAAGGTGCCGGCCTGCCATGGGGCTGCCCGAGGGGTGCTCCAGGGACCCGCACCCAGTGGGACTCACTCATCGTCTGGGGTCAGCTGCACGGGCTCGCTGGTGAACTGTGTGTCAAAGTTGTCCAGACCGTAGTCGTCTGTGATCTGTGGCTGGAATGGAGGGAGCGCCTGCTTCTTCTCCAGCTTGGAAAAACAATAGGAGAAGGGTCAGCTCCGCGCGGGCATCATCCCTACCAGATTGAGTGTTTTGCACGCACTTCAATCACAAAATGAAACAGTGAGAAAGTCAGCATTTCAATCTG +>ENST00000414253 +CTCACTTCCGCCCGGCGCGGGCTTGGATGGAGGCGGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGGGCCTTCTGGCGGCCGCCCCTGGTTTCTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGTCTTTCATGGATGTGCAAGACTTTGAATGACCCTGGCAGTCAAGGGTGAGTGTCATCCACAGGAGAGCCGGCCAGCCACGGGCTCCATGGGCAGTTGCCCCGCACCACGCCCACGCAGGCCCACTGTGCAGCCCCCAAGTCACCAGAGTTTTCGAGAACCACTTCCAAAAGACACCGTCGTGACCGGAGCCATTAGCAAATATCAGGATTTTTCAAACCACACTTCAATACATCCTTCACTTTAATTTATAAAACAAATTACTGAATATAAAAGTCTCCCCTCTGATGAGCACAGCATTACTCACATATTGTGTACAAGAACGGCCAAACTGGTAACCGGCACGCTACTGGCAACACGGCAGTATTTAGCCACCAGCCGCACAATGGGGTGGAGCGGCCCCTGAGTCATGGAGGCCTGGGGTCTCTGCGCCTGGCCAAGAGGGCTGCGTGGCAATTTCCACACCTGTGCACCAGGCCTCACTCAGAGGCATGAGGTGGCGCGACCCCCTCTCCCAGGGAGCTCAGAAGACGGCTCTGCCACACCTGACACCTGGCAGCTGGCAGCCCTGCCTCTAGGAAGCCTCAGCTCTGGACAGCTGTGCCTTCACCTGAGGGGTACTTCAACTCCCGCCCCCACCTGTGTCCCGCTGGCTCCTAAGCTGCCCCCCTACGTGTGGGTTGCGTCTGAGATGTGGGGCAGGCGCCACTCACGGAAAAAAGGCATCAGAGGAGCTTCCACATCATCGGAACATTTTATTCCTCAGGACGCTACACGCTCACTTTCCTGGCGGAGCAGGTCAGTGCATCGAGTTCTGTTTCCGTGGAAAATGTGCACCTTGGAAACCGCATGACAGCCCCCTCGGCAGGGTCCCCGCGGATCCGCCGCGACGCAGGCACAGCAGCAAGTTCCTCCAGCACGAAGCTGGCCTGCCCGGGCCCAGGTGTGAGGGACTGTTCTGCTCCCAGCAGCGCCCGCTGACGCTTCCCTCTGCGGTCTCGGCGCAAGCGTCTGTCCCTGGCCGCCCTCGGAGCCGTGCCCAGCCTGGCATGCATATGCGGTGGTTAAGGATACAGTTAAAGGGTCAATCACGCGTGTCCACGACAGAGACGCACGCGGCCTCACACCGACTCCTCGGTGGACAGCAATAATGGGTTGATATACTCAAAGCCTTCGAACTCTGACTGGTCGATCCTCTTTATGGCATCCCTGTGGGCAAAGGTGGCAGGGGGGAGGGGGGTGACCGTGTGTTCATTCCCTTGGGGGAAGCGGAGTCACGTTCGCATAAGAATCCTCCCCCAACGCCCACTGGAGAGATGACACCAGGCGGGTGGGACTCAAGGGCAGGCTGGGTCACCAGCTGCCCAAGGTGCCGGCCTGCCATGGGGCTGCCCGAGGGGTGCTCCAGGGACCCGCACCCAGTGGGACTCACTCATCGTCTGGGGTCAGCTGCACGGGCTCGCTGGTGAACTGTGTGTCAAAGTTGTCCAGACCGTAGTCGTCTGTGATCTGTGGCTGGAATGGAGGGAGCGCCTGCTTCTTCTCCAGCTTGGAAAAACAATAGGAGAAGGGTCAGCTCCGCGCGGGCATCATCCCTACCAGATTGAGTGTTTTGCACGCACTTCAATCACAAAATGAAACAGTGAGAAAGTC +>ENST00000428120 +GGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGGGCCTTCTGGCGGCCGCCCCTGGTTTCTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGAAGCAAAAACAGCTCGGGAATGCGAAGGCACCGGAGTCCAAAGTTGGCAGCCAACAACAACAACAACAAAAGAAAAGGCCGGGCACGGTGGCTCACGCCTGTAATCCCAGCCCTTTGAGAGGCTGAGGCAGGCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGTCTTTCATGGATGTGCAAGACTTTGAATGACCCTGGCAGTCAAGGGTGAGTGTCATCCACAGGAGAGCCGGCCAGCCACGGGCTCCATGGGCAGTTGCCCCGCACCACGCCCACGCAGGCCCACTGTGCAGCCCCCAAGTCACCAGAGTTTTCGAGAACCACTTCCAAAAGACACCGTCGTGACCGGAGCCATTAGCAAATATCAGGATTTTTCAAACCACACTTCAATACATCCTTCACTTTAATTTATAAAACAAATTACTGAATATAAAAGTCTCCCCTCTGATGAGCACAGCATTACTCACATATTGTGTACAAGAACGGCCAAACTGGTAACCGGCACGCTACTGGCAACACGGCAGTATTTAGCCACCAGCCGCACAATGGGGTGGAGCGGCCCCTGAGTCATGGAGGCCTGGGGTCTCTGCGCCTGGCCAAGAGGGCTGCGTGGCAATTTCCACACCTGTGCACCAGGCCTCACTCAGAGGCATGAGGTGGCGCGACCCCCTCTCCCAGGGAGCTCAGAAGACGGCTCTGCCACACCTGACACCTGGCAGCTGGCAGCCCTGCCTCTAGGAAGCCTCAGCTCTGGACAGCTGTGCCTTCACCTGAGGGGTACTTCAACTCCCGCCCCCACCTGTGTCCCGCTGGCTCCTAAGCTGCCCCCCTACGTGTGGGTTGCGTCTGAGATGTGGGGCAGGCGCCACTCACGGAAAAAAGGCATCAGAGGAGCTTCCACATCATCGGAACATTTTATTCCTCAGGACGCTACACGCTCACTTTCCTGGCGGAGCAGGTCAGTGCATCGAGTTCTGTTTCCGTGGAAAATGTGCACCTTGGAAACCGCATGACAGCCCCCTCGGCAGGGTCCCCGCGGATCCGCCGCGACGCAGGCACAGCAGCAAGTTCCTCCAGCACGAAGCTGGCCTGCCCGGGCCCAGGTGTGAGGGACTGTTCTGCTCCCAGCAGCGCCCGCTGACGCTTCCCTCTGCGGTCTCGGCGCAAGCGTCTGTCCCTGGCCGCCCTCGGAGCCGTGCCCAGCCTGGCATGCATATGCGGTGGTTAAGGATACAGTTAAAGGGTCAATCACGCGTGTCCACGACAGAGACGCACGCGGCCTCACACCGACTCCTCGGTGGACAGCAATAATGGGTTGATATACTCAAAGCCTTCGAACTCTGACTGGTCGATCCTCTTTATGGCATCCCTGTGGGCAAAGGTGGCAGGGGGGAGGGGGGTGACCGTGTGTTCATTCCCTTGGGGGAAGCGGAGTCACGTTCGCATAAGAATCCTCCCCCAACGCCCACTGGAGAGATGACACCAGGCGGGTGGGACTCAAGGGCAGGCTGGGTCACCAGCTGCCCAAGGTGCCGGCCTGCCATGGGGCTGCCCGAGGGGTGCTCCAGGGACCCGCACCCAGTGGGACTCACTCATCGTCTGGGGTCAGCTGCACGGGCTCGCTGGTGAACTGTGTGTCAAAGTTGTCCAGACCGTAGTCGTCTGTGATCTGTGGCTGGAATGGAGGGAGCGCCTGCTTCTTCTCCAGCTTGGAAAAACAATAGGAGAAGGGTCAGCTCCGCGCGGGCATCATCCCTACCAGATTGAGTGTTTTGCACGCACTTCAATCACAAAATGAAACAGTGAGAAAGTC +>ENST00000400918 +GGATGGAGGCGGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGGGCCTTCTGGCGGCCGCCCCTGGTTTCTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGTACTTCAACTCCCGCCCCCACCTGTGTCCCGCTGGCTCCTAAGCTGCCCCCCTACGTGTGGGTTGCGTCTGAGATGTGGGGCAGGCGCCACTCACGGAAAAAAGGCATCAGAGGAGCTTCCACATCATCGGAACATTTTATTCCTCAGGACGCTACACGCTCACTTTCCTGGCGGAGCAGGTCAGTGCATCGAGTTCTGTTTCCGTGGAAAATGTGCACCTTGGAAACCGCATGACAGCCCCCTCGGCAGGGTCCCCGCGGATCCGCCGCGACGCAGGCACAGCAGCAAGTTCCTCCAGCACGAAGCTGGCCTGCCCGGGCCCAGGTGTGAGGGACTG +>ENST00000497675 +CTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGTGAGTAGGCCACCCCTGCGCCCGGCCCGGTTATCCATCCGTGTTTGGAAACCACAGCCGTTCAGAAGGTCAAGAGGTGGCCGAGCTCAGCGCTGGCTTTTAAAGCCCTGTTTCACACTGGAAAGGTGGCCCAGTGCTGTGGCCTGGCATGTCCAGGTGGCTCTCTGTCACGGGTCTGGGGTCCACCTGCTTGCCGTGCTCTGTGGGCAGGGCAGGCTGGGGGCCCACAGAACAGCACAGAAGGAAGGCTGGGAGCACTGGCCCCGGGTCCACCTGGCCATCCTGGAATCTGGTGGCACCAGCGTCCCCAGGCCCAGAGCACAGGAACACCTTCCCGAGAGTGCGTCATGGGTTTTAAAAATGAAGATCGTCTTTTTTGTCTGGAGATGCTTTTTCTTATTTTTGAAACCCAACGTATATTTTTATGTATTTTTTAAGTAAAGGGGAATGGAACCCAGTTTTGCTAACAAGATAACCCAAACTGCCCAGTGCCTGGCCTTGTGTCTGGCGACCTCTGGGCCCTTGGCCTCCGGAGCAGGTCCTGGGGCTGGGGTGGTGTGAATGATGCTGGTTCGTAACTTTTGGTTGAGTTAATGGGCGGCAGGTTTCAGAGCTTATGGAGACCAGGTCCTTCAGTCATGCCTGATGCCCCTGGTCTTCCAGAAGCAAAAACAGCTCGGGAATGCGAAGGCACCGGAGTCCAAAGTTGGCAGCCAACAACAACAACAACAAAAGAAAAGGCCGGGCACGGTGGCTCACGCCTGTAATCCCAGCCCTTTGAGAGGCTGAGGCAGGTGGGTTGCTGGAGCCCAGGAGTTTGAGACCAGCCTGGGCAACATGGCAAGATCCCATCTTTACATGCCTGGGCGTGGTGGCGCGTGCCTGTGGTCCTAGCTACTCTGGAGGCTGAAGTGGGAGGATTCCCTTGAGCCAGGAATTGGAGGCTGTAGTGAAGTATGATTGCACCACTGCACTCCAGCCTGGGTGACAGAGTAAGACCCTGAATCACGGACAGAGGGTACTGTTGGGAGCCCTGGGGAGAAATCCATGCTCTTGGCTGAAGCTCTGAGATCCTTGTTGCTGTCAGGGTGCTGCCCCCCGCCCCCCGGGGAGGGGCTTTTGTCTTTGCATCGCCTGCTTTTCCAGATAGTCTAAAAAAAGACTTCTGAAGACAAGGACGTTCACGAGGAAAAACTTGCCATTTTGAGCTTTTTAAGCAGTTGCTGAAAGCTTGGCAGACTGCCTCAATTTTTCCTAAGTAGGCGTCAATGAAGTCAGGTCCAGGCCTTGGTGTGTCTGGAATGCTTCAAGCACATTCGAACACTTGATCGTAAGGGAGAGCCGGTACTTTGGAACCGGAACTCACCCGAGGCTGTGGCCACCGCATGGGCAGGCTAGCTGGGGGACAAGCCCCATATCTTTGGGAACAAGGGTTTGCACAGCCACCCTGGGATGCCCTGGGACTCCTGACCGCACAGGACCCCAGCAGGGAGGCCGCCTGGATTGGAGGGTCTGGTCTAACAGCCGGACTTGGTCTTGAACCGTCGCCCTGTCCCGCACAGGCGCCTGCTGAGCCTGGAGCCCTGGCAGAGGCGGGTCTGGGGAGTGGAGCTGCCAGGAGGCCTCCCATTTCTCACAGCCTTGGTGTTCTCCGGGTCACCCAGAGGACCGTCAAATGCTGGATTTGACAAACTATGTAGAATGTTCTTTGTGTCTTTAAGATCTTCTTGTGGTCCTATTTGGACATTTTGTGCATTTTCAGACACCTGCGGGTCACGTGGGTGGATGGGAAGCTGGGCACCTGGTGAGGGGTGAGGATGTTGAGAGCCAGAGCTGCGTTTTGTCTCTGTTGATGTGGCGAGGCCCTGGGTTGGTCACTGGGATTTTTTTTTTTTTTTGAGACGGTGTCTCGCTCTGTCGCCCAGGCTGGAGTGCAGTGGCATGATCTCGGCTCACTGCAACATCTGCCTCCCGGGTTCAAGCGATTCTCCTGCCTCAGTCTCCTGAGTAGCTGGGATTACAGGCGTCACCACACCTGGCTAATTTTTGTATTTTTAGTAGAGACAGGGTTTCACCATGTTGGTCAGGCTGGTCTTGAACTGATCTCAGGTGATCCGCCCGTCTCGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACCGCGCCCGGCCGGTCGTTGGGATTTTAACAGCCCTGAGGCCCCTCACGCTGCCAGGTGCCAGCCCACCCTGCAGCCCTGCTCCCCTGCCCACACGCAGAAGCCACCAGAGGCTTCTGGACTGAGCCCCCACTGTCCTGCAGCCGGGCTGGCCTGTCCACACCACAGGGCGTGCTCAGCTACTGAGCAGAAGCGTCACGGACAGGGCAGATCAGGCCAGGACAAAGCTCTTCCGCCACAGGCGGGGGTCTGAAGGCATCTCAGAGGGCCCCCAAACAAGGGACGCTGCCTGGAAACCCCGGGACAAGATGACCTCGGTTCAGATCTTAGCACCTTCTGGCAACCTTAGAGAAAGCTTCTGGAGGGAGGGGCTGGTTCCCAGGATGGGCAGAAGCCGGAAAGTCTCAGACTGAGTGACCCTCGGGGGCTTCAGAAGGCACTGGGTGGGCTCTGCCAGAGTGAGAAGGCAGCTGATGGCTGCTGGAGCCAGCCCCGGGAGTGGGGGTCCAGCTATGGTCTGGAGAGGGGGACTTGAGGGTTGCAGTGGCCACACAGACGGGGCACAGGAGCCAAAGGAAGGGACACAGCAAAGCCCAAGGGTAAAACGGCGCGCCGTGGACTGGTCTGAGGGCAGAGGCTGTAGGGGAGCGAGGGGCGGTGTGGCTGACAGGTGGACACAGGGACACGTGTCCTGTGGACTTGGCCGCTCAGTGGGGGTGTGTCCCCCAGCAGTGGCGTGTGAGGGATGGTCACTCTGATGGGACACTGACCACTTGGCCTCCAGCAAGATCTAGGCCCAAGTCTAGGCTGAAGCCGCCCACTCAGCCCCGGGACATCGTCCCCGGCAGCTCTGCTGAGCACGCCAGCTCCGGCACTCTCCGGGAGTCATGGCCGGAAGTCAACTGTCCTGGCTTCCAGGGCCACACCTTGGCCAGGCCTGGTGATGGTCATTTCCAGCCGCTCCAGTTGGGCTGATGGGGCCACATGAGGCCGGGGATAGAAGGTGGCTGCGCTCAGACACCCCTCCCGGCCCCACTGGATGCCCAGGGCGCTGACCTGCAGGACTCGGATGGGTTTTCTCCTGCCACCCCTGCCTGGCCGGCCACCATCCCAGCGCCAGCGCCCTCCTGAGAGGTGCAGGGGCCGCGTGGGGCCTCCCAGAGTGGCAGGTTGGCAGCCTGCACGCCGGTGACGGCGTCCTTCTCCGTGGTGAGGCTTGGTCCCTCCTCGCCAGAAACACCAATTCTCTGACGTGAGCTGCACATCCACTGCCCAGCCATGTTTACTCTTCTGCCTCCTGTAGACGCAGCCGCGGCGGCTCTCCCTGGCAGGCCACCCGCCGTCCTGCCTTTTCTCCGGGTCAGGCCGCCTGTCTGCCGGGCTCCACGATGAGCGCGTTCTCAAGCTGAGCAGGCGCCAGAATCCCATAGAGAGGCTTGTTGAGACACAGCTTCCCCACCCCCAGCTCGGACGCAGGGGCCTGGCGTGGCCTCCTCACGGGCACGGTGTGGAAACACCACTGGCGGTTACCGTGGTCTGCCGGGTGCATGAGCCCCTGGGGTGGCCCCGTCCCTTGTTTCTGACCAGCCGGATCCTCTCCAGCGGCAGGAGCAGAGAGGGCCCGGAGGTCCAGACGGTGCTCTCTGCGGCCAGCATGCCGCGGAGGTGGCCGAGTGAGTGTGGCCCCTCCCTTGCAGGCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGCGGGCTCCTGTCTGTCTCTGTGTTGTGATGAAACGTC +>ENST00000378546 +TCACTTCCGCCCGGCGCGGGCTTGGATGGAGGCGGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGGGCCTTCTGGCGGCCGCCCCTGGTTTCTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGCGGGCTCCTGTCTGTCTCTGTGTTGTGATGAAA +>ENST00000378543 +GATGGAGGCGGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGCGGGCTCCTGTCTGTCTCTGTGTTGTGATGAAA +>ENST00000401813 +CGGGGTTTCACTATGTTGGCCAGGCTGGTCTAGAACTCCTGACCTCAAGTGATCTGCCCGCCTCGGCCTCCCAAAGTGCTGGGATTGCAGGCGTGAGACACTGCACCCGGACAATTTTCCTTTTCTTACAAGAACACTGCTCACACTGCATTCAGGGCCAACCCTAACCCAGTATCGCCTCATCCTGGTTTGATTATATCGGCACAGACCTTGCTTCCGAGCGAGGCCACTTTCTCAGGTACTGGTGGACATGAGTCTTCGGAGACGCTGCTCAACCCACAGTGCTCCTCCAGCTTGGTTTCTGTGACTTGCCTTCCCCAGAGGAGGGGTGCCCTGAGAGGTCTCCACTCCCTGACCGGCTCCTTGGTGCCGCGCACTCTGAGAGGCTTCCCAGGGAACAGAGCACACAGGACCGCCCTCCTGGGTAGACCAATCAGCATCTGAGCTCACAATTTCCCAGCAGGGCAGTGGGGTGGAGAGAGAAGCCTGGGCTGGGCTGGGCTGGGCTGGGCTGGGGAAGCTTCTCCGGGCGGGGGGACGTCAGAGCAGGATCTGGGGCTGATAAAAGCCCGCCCCTGGGTGGGGGCTGAGTGGTGCGGAAGCTGAGCCCGACACGTGGGGATGGAGGACAGGCTGTGGGAGGGTGTGAACCGGATACTGCTTGAAGGGGTGCTGGGGACTTTGAGAGAGGGCGGCTGGCCCTGTCTGGTCGGGGATGCTGGCCCAGACACAGGCCATGGCTGGGATGGGGTTCAGAAACAGGACCGCTGTCTCTCCCGGGCCAGGGCCCTCCCCAGCTGCTCCTGGCTTTCTGGTTCTTGGGGTCAGGGGCAGGCCTGTGCCATGACCCCGCCACTGAGGCTGTGAGGAGGCTGTCGGTGCCCAAGGGCACCAAGGCACACCCCTACTCTTGCACCCCATGTGTGGGCCCGAGCACCTGCTCTGCTGCCCCAAAGATCTGGCGATGTTTCCCAGGCAACTGTCTCTCACAGCCTGTCTGCCTGGCACTCCCGTATCCCATAAATGCCACCACATCTGGCTATGGGTGGGCGTGCCTGCCTGGCATCCACGGGCCAGCAGGTGTGGTGGAGCACAGCCCAGTTCCTGGCTGCGTCAGAAGGCTGCCCGGGCCTTTTGGCTGTCCTTGCCAGCAGGTGAGCACTGCCAGGGCACCGTGTGTGGGTGCTGGGCCATTTAGCCACATGGGAAGGGGTGGAGGCAGCCCAGTGCCTTCAGCATGTGCCCAGGGTGCCTGTCGGCCACAGGTCTCATTTGGAAATTGGGAGGGTGCACGGCCACCGGGCTGCTTAGGCCTGCCAGCCTCAGGGCCCGTCACCGCTGTCTTAGCCTGATTTGCAGGGTGTCAGCGCTGGGCAGAGATGAACATTTGGGTGACTCTGAGGATGCCAGTGGCTGGGACACTTGTTCTTCCGCGGTGGAAGGAGTTGGAGAGGCCTGGCTCCCTGACCTACGGCCAGCCTGGCTTCTGAAACCAGCTCAGTGGGCTGGGGCCTGATTCATCATCCATAAATGTGTCCTTTTTTGCCACAGAGGGTAAGGGGCCTCCTAGCCCACCGGTCTGCAGGTGCGGGAGTAGGAGATGGGTGGCTCTGATGCCCCCACCCACTCGATCACCTTCTGCTCTGCCTGGGATGCAAACTCCCACAGCTGAAACGTTCTTTTGTAAACATGAATTTTGGCTTAGAAAAAACTCATTTCCACTGTGCACGTGTCAGTCCCAACCAGAAATTATTTTCCAATAAAGCAAAACTCCGTCACCACAGCAGCAGATGGCTCCGAAGAAGTGGAGCGTTTTCATCAGGTTCAACTTTGAAACCTCCACCATCACCATCACCAGCACCGCTGTGTCATGCTGATAACTTGAGGACAGGCAGGACAAGGCCTTCTGGCGGCCGCCCCTGGTTTCTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGCGGGCTCCTGTCTGTCTCTGTGTTGTGATGAAA +>ENST00000487186 +GAACATGGATGCCTCGCTTTTCAGAGACTCGCGTTCTTGGAACTTACACCCTTTTGGGTTTGCTATTTTTACCCACCCTGAGCCTTCCGGTCTCCATGGCGACGCCTCCAAACAGCAGATTCCAGGCGGCAATGACGTCATCTCTCCCTTTCCTGCCGCCCAGGCCTTGGAGAGATCCAAGGCCTGTGGGCCACGGCTGCGCCTCTCCTGACTCCAGCTTGCCCGTCTGTCCTTGGGGGCAGCGTCCTTCCTTCTCTCGGCCCCAGACGCAGCTGCATCCTGGAGTCCTTCTGAGAAATGTGGGACCTGCCCCAGCTCCACCCCAGGGGCAGCGAGGGAGGCGTTGGATGGAGCCACCCCACGGCTCCTCTGTGAAGGTCTGCACGTCACTCAGAAAGTTGAAGCAAACCAAGCAGGGTTGGAGCCCACAGTTCACAGCCGGCTGCACAGGGGATGCACCAAGCACAGTTTCCTATGACAAGTGGAAACCTGTGCGCCACAGGTGAGCTGGGTCCTGGAAGGTGCAGGGACCAGGCAGCATCTCATCTCAGGACATCAAGGGCTGTCCCCAGCCAGCAGATTTCCCATAAAAACGTGCTGAACTGGGGACAAAGCTGATTCTACAGAGCCGAGAAGCCAGACCTTCCCTGGGGACTCCCGAGGGGGTCCCAGCCACCCTCTCCACCTGCAGAGGTTTCCTGGCCCACTTGGAGGACCTTGGGGGATCCTCCAAGGGCCCCCTTCCAGCTCTTGGCCCATGGGGGAGCCTCTTCCTCAGCTCCGGGTGTGGTGGACAGGAGACCGAGGGCTCCCCGCACCCAGCTGGGCTCAGCGTTTTCAAGCTGAACTTGGTGCGTGGCGGCTTGGAAAGCCGGGAGCCTGCTGCGTGTCTCCTGGGGCTGCTGTGAAAAAATGACCACACACTGGGAGCCTAAAACGAGTGACATGTATATTCTCACAGTTCAGGCAGCTGGTGTCCAAAATCAGTGGTTGGGAGGGTGGAGCTCCGCCTAAAGGCTCTGGGTGGCTGCTGCCTGCCCCTTCCAGCCCCGGGCCCCCGGCATTCCCTGGCGTGCAGCTGCTCCACCCCCAACCCCAAAGCCTCCTTCCTGTGTCTCTGTGTCCAAATTTTCCTTACCTTTTTTTTTTTTTTTTTGAGATAGAGTTTTGCTCTTGTCGCCCAGGCTGGAGTGCAACAGCACGATCTCGGCCTATCGCAACCTCCGCCTCCTGGGTTCAAGCGATTCTCCTGCCTCAGCCTCCTAAGTAGCTGGGATTACAGGTGCCCACCACCACACCCAGCTAATTTTGTATCTTTAGTAGAGATGGGGTTTCACGATGTCTTTCAGGCTGGTCTCGAACTCCTGACCTCACATGATCCACCTGCCTCGGCCTCCCAAAGTGCTGAAATTACAGGCATGAGCCACAGCACCTGGCCAATTTTCCTTTTCTTTCTCTCTCTCTTTTTTTTTTGAGACGGAGTCTTGCTCTGTTGCCCAGGCTGGAGTAAAATGGCACAATCTTGGCTCACTGCAACCTCTGCCTTCTGGGTTCAAGCGATTCTCCTGCCTCAGCCTCCCGAGTAGCTGAGACTACAGGCGCCCACCACCACACCCAGCTAATTTTTGTGTTTTTTAGTAGAGACGGGGTTTCACTATGTTGGCCAGGCTGGTCTAGAACTCCTGACCTCAAGTGATCTGCCCGCCTCGGCCTCCCAAAGTGCTGGGATTGCAGGCGTGAGACACTGCACCCGGACAATTTTCCTTTTCTTACAAGAACACTGCTCACACTGCATTCAGGGCCAACCCTAACCCAGTATCGCCTCATCCTGGTTTGATTATATCGGCACAGACCTTGCTTCCGAGCGAGGCCACTTTCTCAGGTACTGGTGGACATGAGTCTTCGGAGACGCTGCTCAACCCACAGTGCTCCTCCAGCTTGGTTTCTGTGACTTGCCTTCCCCAGAGGAGGGGTGCCCTGAGAGGTCTCCACTCCCTGACCGGCTCCTTGGTGCCGCGCACTCTGAGAGGCTTCCCAGGGAACAGAGCACACAGGACCGCCCTCCTGGGTAGACCAATCAGCATCTGAGCTCACAATTTCCCAGCAGGGCAGTGGGGTGGAGAGAGAAGCCTGGGCTGGGCTGGGCTGGGCTGGGCTGGGGAAGCTTCTCCGGGCGGGGGGACGTCAGAGCAGGATCTGGGGCTGATAAAAGCCCGCCCCTGGGTGGGGGCTGAGTGGTGCGGAAGCTGAGCCCGACACGTGGGGATGGAGGACAGGCTGTGGGAGGGTGTGAACCGGATACTGCTTGAAGGGGTGCTGGGGACTTTGAGAGAGGGCGGCTGGCCCTGTCTGGTCGGGGATGCTGGCCCAGACACAGGCCATGGCTGGGATGGGGTTCAGAAACAGGACCGCTGTCTCTCCCGGGCCAGGGCCCTCCCCAGCTGCTCCTGGCTTTCTGGTTCTTGGGGTCAGGGGCAGGCCTGTGCCATGACCCCGCCACTGAGGCTGTGAGGAGGCTGTCGGTGCCCAAGGGCACCAAGGCACACCCCTACTCTTGCACCCCATGTGTGGGCCCGAGCACCTGCTCTGCTGCCCCAAAGATCTGGCGATGTTTCCCAGGCAACTGTCTCTCACAGCCTGTCTGCCTGGCACTCCCGTATCCCATAAATGCCACCACATCTGGCTATGGGTGGGCGTGCCTGCCTGGCATCCACGGGCCAGCAGGTGTGGTGGAGCACAGCCCAGTTCCTGGCTGCGTCAGAAGGCTGCCCGGGCCTTTTGGCTGTCCTTGCCAGCAGCAAAACTCCGTCACCACAGCAGCAGATGGCTCCGAAGAAGTGGAGCGTTTTCATCAGGTTCAACTTTGAAACCTCCACCATCACCATCACCAGCACCGCTGTGTCATGCTGATAACTTGAGGACAGGCAGGACAAGGCCTTCTGGCGGCCGCCCCTGGTTTCTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGCGGGCTCCTGTCTGTCTCTGTGTTGTGATGAAA +>ENST00000476803 +GCCCCAGGCCCTCCCGGGTCTCCCCACCATAGCGTTTCCGCTACTGAGTACCCCCTGTCTGCCCTCTCTGTCTGCCCCAGGCCTTCTGGCGGCCGCCCCTGGTTTCTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGGCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGCGGGCTCCTGTC +>ENST00000440825 +CGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGAAGCAAAAACAGCTCGGGAATGCGAAGGCACCGGAGTCCAAAGTTGGCAGCCAACAACAACAACAACAAAAGAAAAGGCCGGGCACGGTGGCTCACGCCTGTAATCCCAGCCCTTTGAGAGGCTGAGGCAGGTGGGTTGCTGGAGCCCAGGAGTTTGAGACCAGCCTGGGCAACATGGCAAGATCCCATCTTTACATGCCTGGGCGTGGTGGCGCGTGCCTGTGGTCCTAGCTACTCTGGAGGCTGAAGTGGGAGGATTCCCTTGAGCCAGGAATTGGAGGCTGTAGTGAAGTATGATTGCACCACTGCACTCCAGCCTGGGTGACAGAGCTGACCCAGCTGGATGTTGACAGCCACCTGGCCCAGTGCTTGGCCGAAAGCACAGAAGACGTGACGTGGTGAGCGCCATCCAAGAGCCCTGCGCAGAGTGCGGCGCCCGGACACGCTCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCCAGCAGCCCCGCCTCTCGGCTCCCCCGCATGCGCATTAAAGCAGGGC +>ENST00000420515 +TGGAGGCGGCGCGGAGGCCGCGGCTGGGGTTGAGCCGCCGGAGGCCGCGCCCGGCGGGCGGGCCTTCTGGCGGCCGCCCCTGGTTTCTCCTGGGGGGTGATGAGCGGGAGCGGCTCTGGGCCGAGCTACTGCGCACGGTGAGCCCGGAGCTGATCCTGGATCACGAGGTGCCTTCACTGCCCGCCTTCCCAGGACAGGAGCCCAGGTGCGGCCCGGAGCCCACTGAAGTCTTCACTGTCGGACCCAAGACCTTTTCCTGGACACCCTTTCCGCCGGACCTGTGGGGCCCGGGCCGTTCCTACCGGCTGCTTCACGGGGCAGGAGGGCACCTGGAATCCCCCGCCAGGTCCCTGCCCCAGCGCCCGGCACCTGATCCCTGCAGGGCCCCCAGGGTGGAGCAGCAGCCGTCTGTGGAGGGTGCCGCGGCCCTGCGCAGCTGCCCCATGTGCCAGAAGGAGTTCGCCCCCAGAAGCAAAAACAGCTCGGGAATGCGAAGGCACCGGAGTCCAAAGTTGGCAGCCAACAACAACAACAACAAAAGAAAAGGCCGGGCACGGTGGCTCACGCCTGTAATCCCAGCCCTTTGAGAGGCTGAGGCAGGTGGGTTGCTGGAGCCCAGGAGTTTGAGACCAGCCTGGGCAACATGGCAAGATCCCATCTTTACATGCCTGGGCGTGGTGGCGCGTGCCTGTGGTCCTAGCTACTCTGGAGGCTGAAGTGGGAGGATTCCCTTGAGCCAGGAATTGGAGGCTGTAGTGAAGTATGATTGCACCACTGCACTCCAGCCTGGGTGACAGAGTAAGACCCTGAATCACGGACAGAGGGTACTGTTGGGAGCCCTGGGGAGAAATCCATGCTCTTGGCTGAAGCTCTGAGATCCTTGTTGCTGTCAGGGTGCTGCCCCCCGCCCCCCGGGGAGGGGCTTTTGTCTTTGCATCGCCTGCTTTTCCAGATAGTCTAAAAAAAGACTTCTGAAGACAAGGACGTTCACGAGGAAAAACTTGCCATTTTGAGCTTTTTAAGCAGTTGCTGAAAGCTTGGCAGACTGCCTCAATTTTTCCTAAGTAGGCGTCAATGAAGTCAGGTCCAGGCCTTGGTGTGTCTGGAATGCTTCAAGCACATTCGAACACTTGATCGTAAGGGAGAGCCGGTACTTTGGAACCGGAACTCACCCGAGGCTGTGGCCACCGCATGGGCAGGCTAGCTGGGGGACAAGCCCCATATCTTTGGGAACAAGGGTTTGCACAGCCACCCTGGGATGCCCTGGGACTCCTGACCGCACAGGACCCCAGCAGGGAGGCCGCCTGGATTGGAGGGTCTGGTCTAACAGCCGGACTTGGTCTTGAACCGTCGCCCTGTCCCGCACAGGCGCCTGCTGAGCCTGGAGCCCTGGCAGAGGCGGGTCTGGGGAGTGGAGCTGCCAGGAGGCCTCCCATTTCTCACAGCCTTGGTGTTCTCCGGGTCACCCAGAGGACCGTCAAATGCTGGATTTGACAAACTATGTAGAATGTTCTTTGTGTCTTTAAGATCTTCTTGTGGTCCTA +>ENST00000514625 +CCGCTCACTGTCATGACAAGTGGACAGATGCCCCGGGCCTCAGTTGACCCATCTGTAAGTGGGGCCACGCGACAGCACCTCTGTCACAGGGCTGGGTGTGGGGTGAACAGGCTGGTCCCTGGAGGCAAGTAGTGTGGTGCCCTGAGGCCTGAGGCCAGGCTCCAGGACCGCTCAAGGAACAGGGGATTTGAGGCAACTCAGAGAGGACAGGCCCAGCAGCCGGCCCCAGCCTGATATCTTCCCTCCGCTCAGGCCCCAGACGCAGCTGCATCCTGGAGTCCTTCTGAGAAATGTGGGACCTGCCCCAGCTCCACCCCAGGTGAGGGGCACCAGCCAGCTCCAGAGCTGCCTACCTTCCCTGTCAGGTGCACAGGTCAGCGCCAGGCCAACCCCAGAGCGAGAACACCTGTGCTGGACTGAGCTGGAGCAGCAGGGTGGCCTGCACCGGGGCAGCGAGGGAGGCGTTGGATGGAGCCACCCCACGGCTCCTCTGTGAAGGTCTGCACGTCACTCAGAAAGTTGAAGCAAACCAAGCAGGGTTGGAGCCCACAGTTCACAGCCGGCTGCACAGGGGATGCACCAAGCACAGTTTCCTATGACAAGTGGAAACCTGTGCGCCACAGCAAAACTCCGTCACCACAGCAGCAGATGGCTCCGAAGAAGTGGAGCGTTTTCATCAGGTTCAACTTTGAAACCTCCACCA +>ENST00000420964 +CCTTTCCTGCCGCCCAGGCCTTGGAGAGATCCAAGGCCTGTGGGCCACGGCTGCGCCTCTCCTGACTCCAGCTTGCCCGTCTGTCCTTGGGGGCAGCGTCCTTCCTTCTCTCGGCCCCTTGGAGCAGCTCTGCGGGAACCCCACAGCAGCCCAGCGGATTGAACGCAAAAGACAGCCACCCTCCTGCTCCGGATCCTGGGAGGAGGCTACACGCTGGCGCTGAGACAGCAACCTGCCTGGCCTGGGAAGCCCCCCGCAGCCCCTACATCAGAAGCTTGCTCTTGGCGCAGTGGCTCACGCCTGTAATCCCAGCA +>ENST00000609981 +GCCCTTTGCTGCGGCAGCTTTCTGTTCTCCCTGGCTCCCTGCACGGAACTGAGCTTTGGTGTGTGATGCGCTGCTGGCCCAGGCTACACCCCGACAAGGGACACCGGGGGCCCCGGGAGCAGAGAGACCTCAGAGCAGCCTCCTCCTGCCTCCTGTGGACGGCCGGCCCCAGCTGGTGATCCCAGCCAGTCCCAGCTTTCAGTTGCTGCCCCCACCGACAGTCCTCAGTCCCTCCATGATGGCTCCCCCGACAGCCGGCCCCCTTCCTGGCCCAGCTCTTCCGCCTGAGGACCCAGGGCCGGATCCGGAGAGCAGGTGGCTTTTCTTGAGCGCCAACATTCTGCCCGTGGTGGAGCGGTGCATGGGTGCCATGCAAGAGGGGATGCAGATGGTGAAGCTGCGTGGCGGCTCCAAGGGCCTGGTCCGCTTCTACTACCTGGACGAGCACCGCTCCTGCATCCGCTGGAGGCCCTCACGCAAGAACGAGAAGGCCAAGATCTCCATCGACTCCATCCAGGAGGTGAGTGAGGGGCGGCAGTCGGAGGTCTTCCAGCGCTACCCTGACGGC +>ENST00000449969 +CACGGGCGGGCGCGGCAGGGCAGCGTGTGGGGCTGCGATCGGCATGGGCTCTGCGCGCGGGGTGCCCCTGCTCGGGCTGGGGCTCAGGGGACGCCGGGGGCCAGCACAGGGCCCGGTGTCCCTCGGGCCGTGCCGGTAACTGGGATTGGCACCCGCCGGCCATGGAAGAGCCTGGGCCCCCAGGTGGGCTCAGCCAAGACCAAGTGGAGCGGTGCATGGGTGCCATGCAAGAGGGGATGCAGATGGTGAAGCTGCGTGGCGGCTCCAAGGGCCTGGTCCGCTTCTACTACCTGGACGAGCACCGCTCCTGCATCCGCTGGAGGCCCTCACGCAAGAACGAGAAGGCCAAGATCTCCATCGACTCCATCCAGGAGGTGAGTGAGGGGCGGCAGTCGGAGGTCTTCCAGCGCTACCCTGACGGCAGCTTCGACCCCAACTGCTGCTTCAGCATCTACCACGGCAGCCACCGCGAGTCGCTGGACCTGGTCTCCACCAGCAGCGAGGTGGCGCGCACCTGGGTCACTGGCCTGCGCTACCTCATGGCCGGCATCAGCGACGAGGACAGCCTGGCTCGCCGCCAGCGCACCAGGGACCAATGGCTGAAGCAGACGTTTGACGAGGCCGACAAGAACGGGGATGGCAGCCTGAGCATTGGCGAGGTCCTGCAGCTGCTGCACAAGCTCAACGTGAACCTGCCCCGGCAGAGGGTGAAGCAGATGTTCAGGGAAGCGGACACGGATGACCACCAAGGGACGCTGGGTTTTGAAGAGTTCTGTGCCTTCTACAAGATGATGTCCACCCGCCGGGACCTCTACCTGCTCATGCTGACCTACAGCAACCACAAGGACCACCTGGATGCCGCCAGCCTGCAGCGCTTCCTGCAGGTGGAGCAGAAGATGGCGGGTGTGACCCTCGAGAGCTGCCAGGACATCATCGAGCAGTTTGAGCCATGCCCAGAAAACAAGAGTAAGGGGCTGCTGGGCATTGATGGCTTCACCAACTACACCAGGAGCCCTGCTGGTGACATCTTCAACCCTGAGCACCACCATGTGCACCAGGACATGACGCAGCCGCTGAGCCACTACTTCATCACCTCGTCCCACAACACCTACCTCGTGGGTGACCAGCTCATGTCCCAGTCACGGGTGGACATGTATGCTTGGGTCCTGCAGGCTGGCTGCCGCTGCGTGGAGGTGGACTGCTGGGATGGGCCCGACGGGGAGCCCATTGTGCACCATGGCTACACTCTGACTTCCAAGATCCTCTTCAAAGACGTCATTGAAACCATCAACAAATATGCCTTCATCAAGAATGAGTACCCAGTGATCCTGTCCATCGAAAACCACTGCAGTGTCATCCAGCAGAAGAAAATGGCCCAGTATCTGACTGACATCCTTGGGGACAAGCTGGACCTGTCATCAGTGAGCAGTGAAGATGCCACCACACTCCCCTCTCCACAGATGCTCAAGGGCAAGATCCTCGTGAAGGGGAAGAAGCTCCCAGCCAACATCAGCGAGGATGCGGAGGAAGGCGAGGTGTCTGATGAGGACAGTGCTGATGAGATTGACGATGACTGCAAGCTCCTCAATGGGGATGCATCCACCAATCGAAAGCGTGTAGAAAACACTGCTAAGAGGAAACTGGATTCCCTCATCAAAGAGTCGAAGATTCGGGACTGTGAGGACCCCAACAACTTCTCCGTCTCCACACTGTCCCCATCTGGAAAGCTCGGACGCAAGAGCAAGGCTGAAGAGGACGTGGAGTCTGGGGAGGATGCCGGGGCCAGCAGACGCAATGGCCGCCTCGTCGTGGGAAGCTTCTCCAGGCGCAAGAAGAAGGGCAGCAAGCTGAAGAAGGCGGCCAGCGTGGAGGAGGGAGATGAGGGTCAGGACTCCCCGGGAGGCCAGAGCCGAGGGGCGACCCGGCAGAAGAAGACCATGAAGCTGTCCCGGGCCCTCTCTGACCTGGTGAAGTACACCAAGTCCGTGGCCACCCACGACATAGAGATGGAGGCGGCGTCCAGCTGGCAGGTGTCGTCCTTCAGCGAGACCAAGGCCCACCAGATTCTGCAGCAGAAGCCGGCGCAGTACCTACGCTTCAACCAGCAGCAGCTCTCCCGCATCTACCCCTCCTCCTACCGTGTGGACTCCAGCAACTACAACCCGCAGCCCTTCTGGAACGCCGGCTGCCAAATGGTTGCCCTGAACTACCAGTCAGAGGGGCGGATGCTGCAGCTGAACCGAGCCAAGTTCAGCGCCAACGGTGGCTGCGGCTACGTACTCAAGCCTGGGTGCATGTGCCAGGGCGTGTTCAACCCCAACTCGGAGGACCCCCTGCCCGGGCAGCTCAAGAAGCAGCTGGTGCTCCGGATCATCAGTGGCCAGCAGCTTCCCAAGCCGCGCGACTCCATGCTGGGGGACCGTGGGGAGATCATCGACCCCTTTGTGGAGGTGGAGATCATTGGGCTCCCTGTGGACTGCAGCAGGGAGCAGACCCGCGTGGTGGACGACAACGGGTTCAACCCCACCTGGGAGGAGACCCTGGTTTTCATGGTGCACATGCCGGAGATCGCGCTGGTCCGCTTCCTCGTCTGGGACCACGATCCCATCGGGCGTGACTTCATTGGCCAGAGGACGCTGGCCTTCAGCAGCATGATGCCAGGCTACAGACACGTGTACCTAGAAGGGATGGAAGAGGCCTCCATCTTCGTGCATGTGGCTGTCAGTGACATCAGCGGTAAGGTCAAGCAGGCTCTGGGCCTAAAAGGCCTCTTCCTCCGAGGCCCAAAGCCCGGCTCGCTGGACAGTCATGCTGCTGGGCGGCCCCCGGCCCGGCCCTCCGTTAGCCAGCGGATCCTGCGGCGCACGGCCAGCGCCCCGACCAAGAGCCAGAAGCCGGGCCGCAGGGGCTTCCCGGAGCTGGTCCTGGGTACACGGGACACAGGCTCCAAGGGGGTGGCAGACGATGTGGTGCCCCCCGGGCCCGGACCTGCTCCGGAAGCCCCAGCCCAGGAGGGGCCCGGCAGCGGCAGCCCCCGAGGTAAGGCGCCAGCTGCGGTGGCAGAGAAGAGCCCTGTGCGAGTGCGGCCCCCGCGTGTCCTGGACGGCCCCGGGCCTGCTGGGATGGCCGCCACATGCATGAAGTGTGTGGTGGGATCCTGCGCCGGCGTGAACACCGGGGGCCTGCAGAGGGAGCGGCCACCCAGCCCGGGGCCTGCAAGCAGGCAGGCAGCCATTCGCCAGCAGCCCCGGGCCCGGGCTGACTCACTGGGGGCCCCCTGCTGTGGCCTGGACCCTCACGCTATCCCGGGGAGAAGCAGAGAGGCCCCCAAGGGTCCTGGGGCCTGGAGGCAGGGTCCAGGCGGTAGCGGCTCCATGTCCTCGGACTCCAGCAGCCCAGACAGCCCGGGCATCCCCGAAAGGTCCCCCCGCTGGCCTGAGGGTGCCTGCAGGCAACCGGGGGCCCTGCAGGGAGAGATGAGTGCCTTGTTTGCTCAAAAGCTGGAGGAGATCAGGAGTAAATCCCCCATGTTCTCCGCCGTTAGGAACTGAGAGCGGCGAGTGACAGGTAACGGGGCCCAGCCCCGGTGTCCCGTGCTGTCCCAGCCCAAGGAGGGCCCCGTGTGCGGCACAGGGCGTGGACTGGGCCCCAGCAGCAGCAGGGTGGGGACACCGAGTGTGCCGCGCCCGGGGGATGCCTCGGGGTGGGAGCTGGGCCTGGCGACCCTCGGCACAGGGCACCGGGGACACCACCCTGATCCGACTCCTCTCCGCCTCTCTCCCTGCCTCCCTCTCTCTCTTCTGCTTCTCCCTCTGGCTCTCTCTCACTCCCCCACCTCCCCACAGACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGCTCAGGAAACAGGGCAGCCAGGCCCCCAAAACTGTGTCCCCCTGGCTGCCCTGTGTCCCCTCCACCCCTGCCTCCCTCCTGCCCCTGCTCCCGGGGAGGAAAGGCTAAAGCTGCTGGCCCGGGGCCCACAGGAGGGGCTTCGAGGCTGGCCCTGCCAGGCAGTTTTCCCGGCGTTTTAGGATCTGTACATAGAGAAATATTTAAATTTTTAGAAGCAAAACTTATACAACATTAAAATGATACCAAGTCCC +>ENST00000419816 +GCGGCTGCGTCAGGGATTCCTTGGTGGCCCTGGAGGGTGGATAGGCTGGCCTGGGGGCCATCAGGACAGCAGGTGACGGTCAGGCCAATGCCAGCCGGGCCTGGGCACAGCCCTGTGGGGGCTTCGGAGGGCCCTGAGGAGGAGGAGGAAGAGGCAGAGGAGAGAAGGCCCCACGGAGGTCCTGTCGCCAGCGCTGCCACTGCCTGACCTCCGCTGCCCGAAGGCCGGTGGGCCTCTGTGGCCTCCGTGAAGCAGGCCCGGCTGTCGTCAGGCCATGTCTGGTCCATGGCCCTCCCCCGACAGCCGGACCAAGGGAACGGTGGCCTGGCTGGCGGAGGTACTCCTCTGGGTTGGAGGGAGTGTGGTGCTGTCTTCAGAGTGGCAGCTCGGCCCCCTGGTGGAGCGGTGCATGGGTGCCATGCAAGAGGGGATGCAGATGGTGAAGCTGCGTGGCGGCTCCAAGGGCCTGGTCCGCTTCTACTACCTGGACGAGCACCGCTCCTGCATCCGCTGGAGGCCCTCACGCAAGAACGAGAAGGCCAAGATCTCCATCGACTCCATCCAGGAGGTGAGTGAGGGGCGGCAGTCGGAGGTCTTCCAGCGCTACCCTGACGGCAGCTTCGACCCCAACTGCTGCTTCAGCATCTACCACGGCAGCCACCGCGAGTCGCTGGACCTGGTCTCCACCAGCAGCGAGGTGGCGCGCACCTGGGTCACTGGCCTGCGCTACCTCATGGCCGGCATCAGCGACGAGGACAGCCTGGCTCGCCGCCAGCGCACCAGGGACCAATGGCTGAAGCAGACGTTTGACGAGGCCGACAAGAACGGGGATGGCAGCCTGAGCATTGGCGAGGTCCTGCAGCTGCTGCACAAGCTCAACGTGAACCTGCCCCGGCAGAGGGTGAAGCAGATGTTCAGGGAAGCGGACACGGATGACCACCAAGGGACGCTGGGTTTTGAAGAGTTCTGTGCCTTCTACAAGATGATGTCCACCCGCCGGGACCTCTACCTGCTCATGCTGACCTACAGCAACCACAAGGACCACCTGGATGCCGCCAGCCTGCAGCGCTTCCTGCAGGTGGAGCAGAAGATGGCGGGTGTGACCCTCGAGAGCTGCCAGGACATCATCGAGCAGTTTGAGCCATGCCCAGAAAACAAGAGTAAGGGGCTGCTGGGCATTGATGGCTTCACCAACTACACCAGGAGCCCTGCTGGTGACATCTTCAACCCTGAGCACCACCATGTGCACCAGGACATGACGCAGCCGCTGAGCCACTACTTCATCACCTCGTCCCACAACACCTACCTCGTGGGTGACCAGCTCATGTCCCAGTCACGGGTGGACATGTATGCTTGGGTCCTGCAGGCTGGCTGCCGCTGCGTGGAGGTGGACTGCTGGGATGGGCCCGACGGGGAGCCCATTGTGCACCATGGCTACACTCTGACTTCCAAGATCCTCTTCAAAGACGTCATTGAAACCATCAACAAATATGCCTTCATCAAGAATGAGTACCCAGTGATCCTGTCCATCGAAAACCACTGCAGTGTCATCCAGCAGAAGAAAATGGCCCAGTATCTGACTGACATCCTTGGGGACAAGCTGGACCTGTCATCAGTGAGCAGTGAAGATGCCACCACACTCCCCTCTCCACAGATGCTCAAGGGCAAGATCCTCGTGAAGGGGAAGAAGCTCCCAGCCAACATCAGCGAGGATGCGGAGGAAGGCGAGGTGTCTGATGAGGACAGTGCTGATGAGATTGACGATGACTGCAAGCTCCTCAATGGGGATGCATCCACCAATCGAAAGCGTGTAGAAAACACTGCTAAGAGGAAACTGGATTCCCTCATCAAAGAGTCGAAGATTCGGGACTGTGAGGACCCCAACAACTTCTCCGTCTCCACACTGTCCCCATCTGGAAAGCTCGGACGCAAGAGCAAGGCTGAAGAGGACGTGGAGTCTGGGGAGGATGCCGGGGCCAGCAGACGCAATGGCCGCCTCGTCGTGGGAAGCTTCTCCAGGCGCAAGAAGAAGGGCAGCAAGCTGAAGAAGGCGGCCAGCGTGGAGGAGGGAGATGAGGGTCAGGACTCCCCGGGAGGCCAGAGCCGAGGGGCGACCCGGCAGAAGAAGACCATGAAGCTGTCCCGGGCCCTCTCTGACCTGGTGAAGTACACCAAGTCCGTGGCCACCCACGACATAGAGATGGAGGCGGCGTCCAGCTGGCAGGTGTCGTCCTTCAGCGAGACCAAGGCCCACCAGATTCTGCAGCAGAAGCCGGCGCAGTACCTACGCTTCAACCAGCAGCAGCTCTCCCGCATCTACCCCTCCTCCTACCGTGTGGACTCCAGCAACTACAACCCGCAGCCCTTCTGGAACGCCGGCTGCCAAATGGTTGCCCTGAACTACCAGTCAGAGGGGCGGATGCTGCAGCTGAACCGAGCCAAGTTCAGCGCCAACGGTGGCTGCGGCTACGTACTCAAGCCTGGGTGCATGTGCCAGGGCGTGTTCAACCCCAACTCGGAGGACCCCCTGCCCGGGCAGCTCAAGAAGCAGCTGGTGCTCCGGATCATCAGTGGCCAGCAGCTTCCCAAGCCGCGCGACTCCATGCTGGGGGACCGTGGGGAGATCATCGACCCCTTTGTGGAGGTGGAGATCATTGGGCTCCCTGTGGACTGCAGCAGGGAGCAGACCCGCGTGGTGGACGACAACGGGTTCAACCCCACCTGGGAGGAGACCCTGGTTTTCATGGTGCACATGCCGGAGATCGCGCTGGTCCGCTTCCTCGTCTGGGACCACGATCCCATCGGGCGTGACTTCATTGGCCAGAGGACGCTGGCCTTCAGCAGCATGATGCCAGGCTACAGACACGTGTACCTAGAAGGGATGGAAGAGGCCTCCATCTTCGTGCATGTGGCTGTCAGTGACATCAGCGGTAAGGTCAAGCAGGCTCTGGGCCTAAAAGGCCTCTTCCTCCGAGGCCCAAAGCCCGGCTCGCTGGACAGTCATGCTGCTGGGCGGCCCCCGGCCCGGCCCTCCGTTAGCCAGCGGATCCTGCGGCGCACGGCCAGCGCCCCGACCAAGAGCCAGAAGCCGGGCCGCAGGGGCTTCCCGGAGCTGGTCCTGGGTACACGGGACACAGGCTCCAAGGGGGTGGCAGACGATGTGGTGCCCCCCGGGCCCGGACCTGCTCCGGAAGCCCCAGCCCAGGAGGGGCCCGGCAGCGGCAGCCCCCGAGACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGCTCAGGAAACAGGGCAGCCAGGCCCCCAAAACTGTGTCCCCCTGGCTGCCCTGTGTCCCCTCCACCCCTGCCTCCCTCCTGCCCCTGCTCCCGGGGAGGAAAGGCTAAAGCTGCTGGCCCGGGGCCCACAGGAGGGGCTTCGAGGCTGGCCCTGCCAGGCAGTTTTCCCGGCGTTTTAGGATCTGTACATAGAGAAATATTTAAATTTTTAGAAGCAAAACTTATACAACATTAAAATGATACCAAGTCC +>ENST00000378486 +GCGGCTGCGTCAGGGATTCCTTGGTGGCCCTGGAGGGTGGATAGGCTGGCCTGGGGGCCATCAGGACAGCAGGTGACGGTCAGGCCAATGCCAGCCGGGCCTGGGCACAGCCCTGTGGGGGCTTCGGAGGGCCCTGAGGAGGAGGAGGAAGAGGCAGAGGAGAGAAGGCCCCACGGAGGTCCTGTCGCCAGCGCTGCCACTGCCTGACCTCCGCTGCCCGAAGGCCGGTGGGCCTCTGTGGCCTCCGTGAAGCAGGCCCGGCTGTCGTCAGGCCATGTCTGGTCCATGGCCCTCCCCCGACAGCCGGACCAAGGGAACGGTGGCCTGGCTGGCGGAGGTACTCCTCTGGGTTGGAGGGAGTGTGGTGCTGTCTTCAGAGTGGCAGCTCGGCCCCCTGGTGGAGCGGTGCATGGGTGCCATGCAAGAGGGGATGCAGATGGTGAAGCTGCGTGGCGGCTCCAAGGGCCTGGTCCGCTTCTACTACCTGGACGAGCACCGCTCCTGCATCCGCTGGAGGCCCTCACGCAAGAACGAGAAGGCCAAGATCTCCATCGACTCCATCCAGGAGGTGAGTGAGGGGCGGCAGTCGGAGGTCTTCCAGCGCTACCCTGACGGCAGCTTCGACCCCAACTGCTGCTTCAGCATCTACCACGGCAGCCACCGCGAGTCGCTGGACCTGGTCTCCACCAGCAGCGAGGTGGCGCGCACCTGGGTCACTGGCCTGCGCTACCTCATGGCCGGCATCAGCGACGAGGACAGCCTGGCTCGCCGCCAGCGCACCAGGGACCAGTGGCTGAAGCAGACGTTTGACGAGGCCGACAAGAACGGGGATGGCAGCCTGAGCATTGGCGAGGTCCTGCAGCTGCTGCACAAGCTCAACGTGAACCTGCCCCGGCAGAGGGTGAAGCAGATGTTCAGGGAAGCGGACACGGATGACCACCAAGGGACGCTGGGTTTTGAAGAGTTCTGTGCCTTCTACAAGATGATGTCCACCCGCCGGGACCTCTACCTGCTCATGCTGACCTACAGCAACCACAAGGACCACCTGGATGCCGCCAGCCTGCAGCGCTTCCTGCAGGTGGAGCAGAAGATGGCGGGTGTGACCCTCGAGAGCTGCCAGGACATCATCGAGCAGTTTGAGCCATGCCCAGAAAACAAGAGTAAGGGGCTGCTGGGCATTGATGGCTTCACCAACTACACCAGGAGCCCTGCTGGTGACATCTTCAACCCTGAGCACCACCATGTGCACCAGGACATGACGCAGCCGCTGAGCCACTACTTCATCACCTCGTCCCACAACACCTACCTCGTGGGTGACCAGCTCATGTCCCAGTCACGGGTGGACATGTATGCTTGGGTCCTGCAGGCTGGCTGCCGCTGCGTGGAGGTGGACTGCTGGGATGGGCCCGACGGGGAGCCCATTGTGCACCATGGCTACACTCTGACTTCCAAGATCCTCTTCAAAGACGTCATTGAAACCATCAACAAATATGCCTTCATCAAGAATGAGTACCCAGTGATCCTGTCCATCGAAAACCACTGCAGTGTCATCCAGCAGAAGAAAATGGCCCAGTATCTGACTGACATCCTTGGGGACAAGCTGGACCTGTCATCAGTGAGCAGTGAAGATGCCACCACACTCCCCTCTCCACAGATGCTCAAGGGCAAGATCCTCGTGAAGGGGAAGAAGCTCCCAGCCAACATCAGCGAGGATGCGGAGGAAGGCGAGGTGTCTGATGAGGACAGTGCTGATGAGATTGACGATGACTGCAAGCTCCTCAATGGGGATGCATCCACCAATCGAAAGCGTGTAGAAAACACTGCTAAGAGGAAACTGGATTCCCTCATCAAAGAGTCGAAGATTCGGGACTGTGAGGACCCCAACAACTTCTCCGTCTCCACACTGTCCCCATCTGGAAAGCTCGGACGCAAGAGCAAGGCTGAAGAGGACGTGGAGTCTGGGGAGGATGCCGGGGCCAGCAGACGCAATGGCCGCCTCGTCGTGGGAAGCTTCTCCAGGCGCAAGAAGAAGGGCAGCAAGCTGAAGAAGGCGGCCAGCGTGGAGGAGGGAGATGAGGGTCAGGACTCCCCGGGAGGCCAGAGCCGAGGGGCGACCCGGCAGAAGAAGACCATGAAGCTGTCCCGGGCCCTCTCTGACCTGGTGAAGTACACCAAGTCCGTGGCCACCCACGACATAGAGATGGAGGCGGCGTCCAGCTGGCAGGTGTCGTCCTTCAGCGAGACCAAGGCCCACCAGATTCTGCAGCAGAAGCCGGCGCAGTACCTACGCTTCAACCAGCAGCAGCTCTCCCGCATCTACCCCTCCTCCTACCGTGTGGACTCCAGCAACTACAACCCGCAGCCCTTCTGGAACGCCGGCTGCCAAATGGTTGCCCTGAACTACCAGTCAGAGGGGCGGATGCTGCAGCTGAACCGAGCCAAGTTCAGCGCCAACGGTGGCTGCGGCTACGTACTCAAGCCTGGGTGCATGTGCCAGGGCGTGTTCAACCCCAACTCGGAGGACCCCCTGCCCGGGCAGCTCAAGAAGCAGCTGGTGCTCCGGATCATCAGTGGCCAGCAGCTTCCCAAGCCGCGCGACTCCATGCTGGGGGACCGTGGGGAGATCATCGACCCCTTTGTGGAGGTGGAGATCATTGGGCTCCCTGTGGACTGCAGCAGGGAGCAGACCCGCGTGGTGGACGACAACGGGTTCAACCCCACCTGGGAGGAGACCCTGGTTTTCATGGTGCACATGCCGGAGATCGCGCTGGTCCGCTTCCTCGTCTGGGACCACGATCCCATCGGGCGTGACTTCATTGGCCAGAGGACGCTGGCCTTCAGCAGCATGATGCCAGGCTACAGACACGTGTACCTAGAAGGGATGGAAGAGGCCTCCATCTTCGTGCATGTGGCTGTCAGTGACATCAGCGGTAAGGTCAAGCAGGCTCTGGGCCTAAAAGGCCTCTTCCTCCGAGGCCCAAAGCCCGGCTCGCTGGACAGTCATGCTGCTGGGCGGCCCCCGGCCCGGCCCTCCGTTAGCCAGCGGATCCTGCGGCGCACGGCCAGCGCCCCGACCAAGAGCCAGAAGCCGGGCCGCAGGGGCTTCCCGGAGCTGGTCCTGGGTACACGGGACACAGGCTCCAAGGGGGTGGCAGACGATGTGGTGCCCCCCGGGCCCGGACCTGCTCCGGAAGCCCCAGCCCAGGAGGGGCCCGGCAGCGGCAGCCCCCGAGACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGCTCAGGAAACAGGGCAGCCAGGCCCCCAAAACTGTGTCCCCCTGGCTGCCCTGTGTCCCCTCCACCCCTGCCTCCCTCCTGCCCCTGCTCCCGGGGAGGAAAGGCTAAAGCTGCTGGCCCGGGGCCCACAGGAGGGGCTTCGAGGCTGGCCCTGCCAGGCAGTTTTCCCGGCGTTTTAGGATCTGTACATAGAGAAATATTTAAATTTTTAGAAGCAAAACTTATACAACATTAAAATGATACCAAGTCC +>ENST00000343889 +CACAGGGAACGGGTAGGGTCCCACGGTTTGGGGAGAGACATGGCAGTCCTCAAGGGCTGGGATCAGGGCGCAGCCAGGGTTTCTGATGGCTTTGCTGATGGTCAGGACCCAGGCATGCCAGGCAAGGCCTCAGCCCAGCAGTTGCCAAGCGTGTAGCCACTTTGGGCCCGTGGAGAGAGTCGCGCTGCGGAGCCCCCAGGGGGACCTGAGGTCACAAGAGCCTCGATGCACCTGAGCGCGGAGCTGGGGGTCCCTGGAGCCGCTGTCCCCACCTGCGGCGCTGGAGCCCTGGAGGTGTCCAGGGGCTTCCTTGGAACGTGGAGACGTGCTGGTTAAACGTGGAGCCCCGGGCCAGCCGGGCACTGGGGGCTGCAGGTGGAGGGAGGTGGATGCTCTCCCTCGTGGGGGCGTGTCTTTTCCACAGGAAAGGGAAAGGGGGAGGGACACGGGTCAGCAGTGGGGGGCTGTGCAGTCTCGCAGATCTTCACCCTTGGTTCTTGAACTCTGGACCCTGAGCCCTGCCGAGGGTCCCGCAAAGGTGGGCAAGGAGCTCCCGGCTGCTTGGTCTCCGCAGTGTTGGGGCTGCCAGCAGGGGGACGCTGGGCCCCCGGGGACCTGACCCGTGCTCCCTCCCCACCCCGCAGTCTCCATCGACTCCATCCAGGAGGTGAGTGAGGGGCGGCAGTCGGAGGTCTTCCAGCGCTACCCTGACGGCAGCTTCGACCCCAACTGCTGCTTCAGCATCTACCACGGCAGCCACCGCGAGTCGCTGGACCTGGTCTCCACCAGCAGCGAGGTGGCGCGCACCTGGGTCACTGGCCTGCGCTACCTCATGGCCGGCATCAGCGACGAGGACAGCCTGGCTCGCCGCCAGCGCACCAGGGACCAATGGCTGAAGCAGACGTTTGACGAGGCCGACAAGAACGGGGATGGCAGCCTGAGCATTGGCGAGGTCCTGCAGCTGCTGCACAAGCTCAACGTGAACCTGCCCCGGCAGAGGGTGAAGCAGATGTTCAGGGAAGCGGACACGGATGACCACCAAGGGACGCTGGGTTTTGAAGAGTTCTGTGCCTTCTACAAGATGATGTCCACCCGCCGGGACCTCTACCTGCTCATGCTGACCTACAGCAACCACAAGGACCACCTGGATGCCGCCAGCCTGCAGCGCTTCCTGCAGGTGGAGCAGAAGATGGCGGGTGTGACCCTCGAGAGCTGCCAGGACATCATCGAGCAGTTTGAGCCATGCCCAGAAAACAAGAGTAAGGGGCTGCTGGGCATTGATGGCTTCACCAACTACACCAGGAGCCCTGCTGGTGACATCTTCAACCCTGAGCACCACCATGTGCACCAGGACATGACGCAGCCGCTGAGCCACTACTTCATCACCTCGTCCCACAACACCTACCTCGTGGGTGACCAGCTCATGTCCCAGTCACGGGTGGACATGTATGCTTGGGTCCTGCAGGCTGGCTGCCGCTGCGTGGAGGTGGACTGCTGGGATGGGCCCGACGGGGAGCCCATTGTGCACCATGGCTACACTCTGACTTCCAAGATCCTCTTCAAAGACGTCATTGAAACCATCAACAAATATGCCTTCATCAAGAATGAGTACCCAGTGATCCTGTCCATCGAAAACCACTGCAGTGTCATCCAGCAGAAGAAAATGGCCCAGTATCTGACTGACATCCTTGGGGACAAGCTGGACCTGTCATCAGTGAGCAGTGAAGATGCCACCACACTCCCCTCTCCACAGATGCTCAAGGGCAAGATCCTCGTGAAGGGGAAGAAGCTCCCAGCCAACATCAGCGAGGATGCGGAGGAAGGCGAGGTGTCTGATGAGGACAGTGCTGATGAGATTGACGATGACTGCAAGCTCCTCAATGGGGATGCATCCACCAATCGAAAGCGTGTAGAAAACACTGCTAAGAGGAAACTGGATTCCCTCATCAAAGAGTCGAAGATTCGGGACTGTGAGGACCCCAACAACTTCTCCGTCTCCACACTGTCCCCATCTGGAAAGCTCGGACGCAAGAGCAAGGCTGAAGAGGACGTGGAGTCTGGGGAGGATGCCGGGGCCAGCAGACGCAATGGCCGCCTCGTCGTGGGAAGCTTCTCCAGGCGCAAGAAGAAGGGCAGCAAGCTGAAGAAGGCGGCCAGCGTGGAGGAGGGAGATGAGGGTCAGGACTCCCCGGGAGGCCAGAGCCGAGGGGCGACCCGGCAGAAGAAGACCATGAAGCTGTCCCGGGCCCTCTCTGACCTGGTGAAGTACACCAAGTCCGTGGCCACCCACGACATAGAGATGGAGGCGGCGTCCAGCTGGCAGGTGTCGTCCTTCAGCGAGACCAAGGCCCACCAGATTCTGCAGCAGAAGCCGGCGCAGTACCTACGCTTCAACCAGCAGCAGCTCTCCCGCATCTACCCCTCCTCCTACCGTGTGGACTCCAGCAACTACAACCCGCAGCCCTTCTGGAACGCCGGCTGCCAAATGGTTGCCCTGAACTACCAGTCAGAGGGGCGGATGCTGCAGCTGAACCGAGCCAAGTTCAGCGCCAACGGTGGCTGCGGCTACGTACTCAAGCCTGGGTGCATGTGCCAGGGCGTGTTCAACCCCAACTCGGAGGACCCCCTGCCCGGGCAGCTCAAGAAGCAGCTGGTGCTCCGGATCATCAGTGGCCAGCAGCTTCCCAAGCCGCGCGACTCCATGCTGGGGGACCGTGGGGAGATCATCGACCCCTTTGTGGAGGTGGAGATCATTGGGCTCCCTGTGGACTGCAGCAGGGAGCAGACCCGCGTGGTGGACGACAACGGGTTCAACCCCACCTGGGAGGAGACCCTGGTTTTCATGGTGCACATGCCGGAGATCGCGCTGGTCCGCTTCCTCGTCTGGGACCACGATCCCATCGGGCGTGACTTCATTGGCCAGAGGACGCTGGCCTTCAGCAGCATGATGCCAGGCTACAGACACGTGTACCTAGAAGGGATGGAAGAGGCCTCCATCTTCGTGCATGTGGCTGTCAGTGACATCAGCGGTAAGGTCAAGCAGGCTCTGGGCCTAAAAGGCCTCTTCCTCCGAGGCCCAAAGCCCGGCTCGCTGGACAGTCATGCTGCTGGGCGGCCCCCGGCCCGGCCCTCCGTTAGCCAGCGGATCCTGCGGCGCACGGCCAGCGCCCCGACCAAGAGCCAGAAGCCGGGCCGCAGGGGCTTCCCGGAGCTGGTCCTGGGTACACGGGACACAGGCTCCAAGGGGGTGGCAGACGATGTGGTGCCCCCCGGGCCCGGACCTGCTCCGGAAGCCCCAGCCCAGGAGGGGCCCGGCAGCGGCAGCCCCCGAGGTAAGGCGCCAGCTGCGGTGGCAGAGAAGAGCCCTGTGCGAGTGCGGCCCCCGCGTGTCCTGGACGGCCCCGGGCCTGCTGGGATGGCCGCCACATGCATGAAGTGTGTGGTGGGATCCTGCGCCGGCGTGAACACCGGGGGCCTGCAGAGGGAGCGGCCACCCAGCCCGGGGCCTGCAAGCAGGCAGGCAGCCATTCGCCAGCAGCCCCGGGCCCGGGCTGACTCACTGGGGGCCCCCTGCTGTGGCCTGGACCCTCACGCTATCCCGGGGAGAAGCAGAGAGGCCCCCAAGGGTCCTGGGGCCTGGAGGCAGGGTCCAGGCGGTAGCGGCTCCATGTCCTCGGACTCCAGCAGCCCAGACAGCCCGGGCATCCCCGAAAGGTCCCCCCGCTGGCCTGAGGGTGCCTGCAGGCAACCGGGGGCCCTGCAGGGAGAGATGAGTGCCTTGTTTGCTCAAAAGCTGGAGGAGATCAGGAGTAAATCCCCCATGTTCTCCGCCGGTAAGCCCCTCTTGCCCTGCGTGGTCCTCCCGCACGCCCCTGGCATGGCTGGGCCTGGGTCACCTGCTGCTGCTTCTGCGTGGACGGTGTCGCCTCGTGTGCTCGTGCTCGTGGCTCTGTATCCGTGGCACTGTCTCCGTGGCACTCTGCTCCCTTGGCTTGCCTGTGGCCCATAGCCCCAGCCCTCCTGTCTGAGCTTGAGGCCCTGGGACTTGGGTGGAGCTGGTTTGAGGCCCGACAGGCTGGGAAGAACCAGCTGCTCTTGCTGAGGGTCTGGGGCCGGGACTGTGGCCTGACATGCTGGGCCCCTCCGGCTGGGCGCTTCCCCAAACTCACCTCCTGGGCGGCTGGCGACCTGCATGGCCCCTGATGCCTTTCCTGGGACTGGGGGCCACGTACCATCCCATTCCCACCTCCCTCTAGGGCAGGCTCCAGGGGTCCCTACTGGGAAGTCTGATGTGGGCAGGTAGTGCAGCTGCTGGGCGTCTCCTGCGCCCCTGGGACGCCTGGAGCCTGCTGAGTGCTGCGTGGAGTAGATTCCCTGGGCCCCAGGGCTTCGCTGCTTTGGGCTGAAGCACCCCACTAGAAGGGTGTCTCCTTAGCCTGGAGGGAGGGACATACACGGAGCCCGCCCCACACCACCCTGCCCCTCCAGACCCCCCTGACCAAGCTTTCCTTTCTGCCCCCACCCACGCTGCCTCCGTAGTTAGGAACTGAGAGCGGCGAGTGACAGGTAACGGGGCCCAGCCCCGGTGTCCCGTGCTGTCCCAGCCCAAGGAGGGCCCCGTGTGCGGCACAGGGCGTGGACTGGGCCCCAGCAGCAGCAGGGTGGGGACACCGAGTGTGCCGCGCCCGGGGGATGCCTCGGGGTGGGAGCTGGGCCTGGCGACCCTCGGCACAGGGCACCGGGGACACCACCCTGATCCGACTCCTCTCCGCCTCTCTCCCTGCCTCCCTCTCTCTCTTCTGCTTCTCCCTCTGGCTCTCTCTCACTCCCCCACCTCCCCACAGACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGCTCAGGAAACAGGGCAGCCAGGCCCCCAAAACTGTGTCCCCCTGGCTGCCCTGTGTCCCCTCCACCCCTGCCTCCCTCCTGCCCCTGCTCCCGGGGAGGAAAGGCTAAAGCTGCTGGCCCGGGGCCCACAGGAGGGGCTTCGAGGCTGGCCCTGCCAGGCAGTTTTCCCGGCGTTTTAGGATCTGTACATAGAGAAATATTTAAATTTTTAGAAGCAAAACTTATACAACATTAAAATGATACCAAGTCCCTTTC +>ENST00000278878 +GGCGCGCACCTGGGTCACTGGCCTGCGCTACCTCATGGCCGGCATCAGCGACGAGGACAGCCTGGCTCGCCGCCAGCGCACCAGGGACCAATGGCTGAAGCAGACGTTTGACGAGGCCGACAAGAACGGGGATGGCAGCCTGAGCATTGGCGAGGTCCTGCAGCTGCTGCACAAGCTCAACGTGAACCTGCCCCGGCAGAGGGTGAAGCAGATGTTCAGGGAAGCGGACACGGATGACCACCAAGGGACGCTGGGTTTTGAAGAGTTCTGTGCCTTCTACAAGATGATGTCCACCCGCCGGGACCTCTACCTGCTCATGCTGACCTACAGCAACCACAAGGACCACCTGGATGCCGCCAGCCTGCAGCGCTTCCTGCAGGTGGAGCAGAAGATGGCGGGTGTGACCCTCGAGAGCTGCCAGGACATCATCGAGCAGTTTGAGCCATGCCCAGAAAACAAGAGTAAGGGGCTGCTGGGCATTGATGGCTTCACCAACTACACCAGGAGCCCTGCTGGTGACATCTTCAACCCTGAGCACCACCATGTGCACCAGGACATGACGCAGCCGCTGAGCCACTACTTCATCACCTCGTCCCACAACACCTACCTCGTGGGTGACCAGCTCATGTCCCAGTCACGGGTGGACATGTATGCTTGGGTCCTGCAGGCTGGCTGCCGCTGCGTGGAGGTGGACTGCTGGGATGGGCCCGACGGGGAGCCCATTGTGCACCATGGCTACACTCTGACTTCCAAGATCCTCTTCAAAGACGTCATTGAAACCATCAACAAATATGCCTTCATCAAGAATGAGTACCCAGTGATCCTGTCCATCGAAAACCACTGCAGTGTCATCCAGCAGAAGAAAATGGCCCAGTATCTGACTGACATCCTTGGGGACAAGCTGGACCTGTCATCAGTGAGCAGTGAAGATGCCACCACACTCCCCTCTCCACAGATGCTCAAGGGCAAGATCCTCGTGAAGGGGAAGAAGCTCCCAGCCAACATCAGCGAGGATGCGGAGGAAGGCGAGGTGTCTGATGAGGACAGTGCTGATGAGATTGACGATGACTGCAAGCTCCTCAATGGGGATGCATCCACCAATCGAAAGCGTGTAGAAAACACTGCTAAGAGGAAACTGGATTCCCTCATCAAAGAGTCGAAGATTCGGGACTGTGAGGACCCCAACAACTTCTCCGTCTCCACACTGTCCCCATCTGGAAAGCTCGGACGCAAGAGCAAGGCTGAAGAGGACGTGGAGTCTGGGGAGGATGCCGGGGCCAGCAGACGCAATGGCCGCCTCGTCGTGGGAAGCTTCTCCAGGCGCAAGAAGAAGGGCAGCAAGCTGAAGAAGGCGGCCAGCGTGGAGGAGGGAGATGAGGGTCAGGACTCCCCGGGAGGCCAGAGCCGAGGGGCGACCCGGCAGAAGAAGACCATGAAGCTGTCCCGGGCCCTCTCTGACCTGGTGAAGTACACCAAGTCCGTGGCCACCCACGACATAGAGATGGAGGCGGCGTCCAGCTGGCAGGTGTCGTCCTTCAGCGAGACCAAGGCCCACCAGATTCTGCAGCAGAAGCCGGCGCAGTACCTACGCTTCAACCAGCAGCAGCTCTCCCGCATCTACCCCTCCTCCTACCGTGTGGACTCCAGCAACTACAACCCGCAGCCCTTCTGGAACGCCGGCTGCCAAATGGGCGTGTTCAACCCCAACTCGGAGGACCCCCTGCCCGGGCAGCTCAAGAAGCAGCTGGTGCTCCGGATCATCAGTGGCCAGCAGCTTCCCAAGCCGCGCGACTCCATGCTGGGGGACCGTGGGGAGATCATCGACCCCTTTGTGGAGGTGGAGATCATTGGGCTCCCTGTGGACTGCAGCAGGGAGCAGACCCGCGTGGTGGACGACAACGGGTTCAACCCCACCTGGGAGGAGACCCTGGTTTTCATGGTGCACATGCCGGAGATCGCGCTGGTCCGCTTCCTCGTCTGGGACCACGATCCCATCGGGCGTGACTTCATTGGCCAGAGGACGCTGGCCTTCAGCAGCATGATGCCAGGCTACAGACACGTGTACCTAGAAGGGATGGAAGAGGCCTCCATCTTCGTGCATGTGGCTGTCAGTGACATCAGCGGTAAGGTCAAGCAGGCTCTGGGCCTAAAAGGCCTCTTCCTCCGAGGCCCAAAGCCCGGCTCGCTGGACAGTCATGCTGCTGGGCGGCCCCCGGCCCGGCCCTCCGTTAGCCAGCGGATCCTGCGGCGCACGGCCAGCGCCCCGACCAAGAGCCAGAAGCCGGGCCGCAGGGGCTTCCCGGAGCTGGTCCTGGGTACACGGGACACAGGCTCCAAGGGGGTGGCAGACGATGTGGTGCCCCCCGGGCCCGGACCTGCTCCGGAAGCCCCAGCCCAGGAGGGGCCCGGCAGCGGCAGCCCCCGAGACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGC +>ENST00000473964 +GTGGGGGAACCCTCCTTGCTAGCGTTGCAAAGAAGGGCCCAGCTCCGTCAGGAATCCAGGGATGGAGAACTGGGGAGCCTGGGCCCCACATGAGATTCATGGCAGGACTTGTCTGAGGGGCCCCAGTGCCAGCGACCCAGCCCCCTGTGCCTGGCCCCTCTGTGGGTCTCAGGACCTGGGTCTGGGCTGGGTGTTTGGAGGAACCTCCTCCCGGCTCTCAGACACCTCTGTTTTGTCTGCTGTGGATGACTTCCAGCTTGGTCCCCCTGTGGCCCTGGCAGGAGTATCACCATGGGAGAGGGCAGGACAGGGGCTGGGCGAGCAGGCCTCCCACTAGACCAGGCTACTCCTGCTGTGGACCAGCTACTTCCACCTCTGCCCTTGGCTTGCCCTCCTCAGAGTTCTCAGCCTGAGTGGGCCCTGGGGACACTGTCACCAGAGACCCCACCCCTCATACCCCCAGGGACCCAGACCCACCCCCAGAAGCCATGTGACCTCCTCGGCTCAGCTGTGGGAGGCATGGGCTCTGTCCCACATGCTGCGGTAGCCACAAAGGTGATCCATACTGGGCCAGGTGCACCCCGAGGTGCCCCCCTGGACCACTGCCTCCCTCCCTCCCCCTGGCACCGGCTCCAGTCTCCTATGTGGGGGCTGGGGAGGGGGCTGTTGGCAGCCATGCCCCAGCAAGCAGGGGGCTTGCTGAGGGCTGGGCCACTGACCACCTCCCCGGCATCCCCTCAGGCGTGTTCAACCCCAACTCGGAGGACCCCCTGCCCGGGCAGCTCAAGAAGCAGCTGGTGCTCCGGATCATCAGTGGCCAGCAGCTTCCCAAGCCGCGCGACTCCATGCTGGGGGACCGTGGGGAGATCATCGACCCCTTTGTGGAGGTGGAGATCATTGGGCTCCCTGTGGACTGCAGCAGGGAGCAGACCCGCGTGGTGGACGACAACGGGTTCAACCCCACCTGGGAGGAGACCCTGGTTTTCATGGTGCACATGCCGGAGATCGCGCTGGTCCGCTTCCTCGTCTGGGACCACGATCCCATCGGGCGTGACTTCATTGGCCAGAGGACGCTGGCCTTCAGCAGCATGATGCCAGGCTACAGACACGTGTACCTAGAAGGGATGGAAGAGGCCTCCATCTTCGTGCATGTGGCTGTCAGTGACATCAGCGGTAAGGTGAGTGTCACCCCCTGCCACCAGCCATCATGGGGAGGGGCCACACCAGCCCCTTGTCCCATGCCCCCCCATGTGTCCCCAGTGCTGGGTCCTGAACTCAGGCAGTGAGGCCTAGGGTCCCCTCCCCGGGCCTCTGCTCCTCTATCTCAAGAGGGGCTGCTGTGGGGGCCTGGCTCCTGAGCCACCAGTGCCCACCTCTGATCTCAGGGCTGGCTTTGGGCATCTCGGGCAGGACAGGTCCTGAGTGCTCCGGGCCTTGCCCCGCCCTGTGTCACCCATGCCTGTCTCAGACTCTTGGGGGCCTTGCAGCCTCCACCCCTACAGTGCTGCCATCTGGCTTCTCAGCAGGGACCGAGTGATGCCCCTCTCCCCTCTACTACCCCCCACCCCTCTACTTCCTGGTGTCACGTGGAAGGCAGCTGCCCGGGTTTGCCTGTGACTCCACACCCAGCATGTCTGTCCCCTGCCCCAGGTCAGGGTGGGGCCTCGGCTTCCGCAGGAAGTGGTCTTGGTGCCAGCCCTGCTGCCCTGGCTTTGAGCTGGGGCCCAGTGCCCTCTGGGTCCTGCTGGCTGCAGCTGGCCCTCGGGGAACCCGCACACACAGCAGGAGGGGCCTGCCCAGGCCCAGTGCTGACTCTCTCCTGCCATGCTCTCGGGCCCAGAGGTGCCATCCAGCCCCTGCCGTCTATCCACCCATCTGTTCCTCGTCCCCCAGGCTGCAGGGCTCCCCACGCCACTGCTGTGGCCGCCTCACCTGCTCCCCCTGTCTCTTTGGTCTTGCAGTCGGCTTCTCTATGGCCACAGCCTACTTTTAGAAGTGCAGCTCTGTTAGGAGCCTTGAAGGTACCCGGTGCGCGGGACAGTGCGGCCCGCCGCCCCTGCATGCCCAGGCCGCACCCCATTAGCATCCATGATTCCTGGTAGCATTTGGAGACTGTCGCTCATGTGACGTGGATCATGACATGGCTCCGGGGGCCCTGGCCATCCCCAGCCATAGTGGCATTTACGAGGCAGATCCAGGGTTCAGCTGGGTGGCCGCCTTCTCACTGGCCTCTCCTCCCCTCCCCTCCCTCAGTCCTCCCTCCCCTCCCTCAGTCCTCCCTCCCCTCCCTCAGTCCTCCCTCCCCTCCCTCAGTCCTCCCTCCCCTCCCTCAGCCCCTTCCCTGGCGGGCAGCCCGCTGGAGCCCCCACTGTGCCCCTCCTATCCCCCTCCTTCTCTCTCCTGCCCCCATCTCGGACCCTCAGGCTGTTGGTTCTGAGTTCGCCTCCCACTCCCTCCCTGTCCTTGCCAACCATGCCAGTGCATGGGATGAGGGCACCCCTGAGGCCGGCGCTCCGAGCCAGAATCCCGGATCTGCTTCTAAATGGCTTCCCAGCCACTGTGACCAAATGCGTAGATTTGGGATCTTGAATCAGGAAGCTGATTCAAGTGCTGGCCATCTGAACGCATCTGCCCAGAGGCGCCCCTGCAGGGGGGTGACCCACCTGCCGGGCCTGGGCCGCTCTGTGCACGAGCACGGCTCGTCATGGGGGCGCGGTGGGTGCTGTCTCGGGGGCATCTGGCATGTGAGGGCCCCTCTGGCCTCTGCGCCCTGGAGATGCGGCTGCCTCCCTCTCAGCAGCTGTTCTGCCCAGGCAGGGACCTCCTGGGCCCAGCTGTCCAGGAAGATTGGCTGTGGCCAGGTGCTGGTGGGCTGGGAGTCTGAGCCCATCTTGGCAGGGCTCAGGGGGCAGCAAGCCAGCTGCGGGCCTTGGGGGCTCACATGAGTGGAGGGCAGGGCAAGACCAGAAAAGGCTGCCTGGGGGAATTCAGGAAGGCTTCCTGGAAGAGGTGGTACTTCCTAGGGCACGAGTATCACCATGGGAGTGGGCAGGACACGGGCCGGGCAAGTGGGCCTCCCGCTGCACCTGGCTACTCCTGCTGTGGACCAGCTACTCCTGCCTGAGGGTGGGGCACACACAACCAGGGAGTGCCACGCCAGTGTCCCCTGCTAGCGCCGGGGGCTGCGGGCCTCTGAGCAGGTGCAGGCTGTGGTGGGCCAGGCTGGGGCTCGAGGTCTCTCCTCCGGAGGGAAAGACCTTCTCTCCATGCCCCTCAAGGGCCCCACATGCCCTGGACAGGTCAGGCGAGGGCAGTTTCTGCCGGAAGGGTGGGGTGGGCCATGTGTACTTAGATCTGTAGCAGCTACTGTCCCAGGCAGAGCTGCCCTAGGGACCCTGCTCCTGAAGGCCCTGGTGTGTCCACACACCCCCAGCCTGAGGTGGCCCAGCCCCTCGGACCGAGACACGCATGGCACGTCTGTGGCACGGTCTGGAGAGCTGGCCCTGGGGGAGCAGCTGCAGCTGGGCTGGGACCCCTGGCAACAGCTACATGGGCTCCTTCTCTTGCAGGTCAAGCAGGCTCTGGGCCTAAAAGGCCTCTTCCTCCGAGGCCCAAAGCCCGGCTCGCTGGACAGTCATGCTGCTGGGCGGCCCCCGGCCCGGCCCTCCGTTAGCCAGCGGATCCTGCGGCGCACGGCCAGCGCCCCGACCAAGAGCCAGAAGCCGGGCCGCAGGGGCTTCCCGGAGCTGGTCCTGGGTACACGGGACACAGGCTCCAAGGGGGTGGCAGACGATGTGGTGCCCCCCGGGCCCGGACCTGCTCCGGAAGCCCCAGCCCAGGAGGGGCCCGGCAGCGGCAGCCCCCGAGGTAAGGCGCCAGCTGCGGTGGCAGAGAAGAGCCCTGTGCGAGTGCGGCCCCCGCGTGTCCTGGACGGCCCCGGGCCTGCTGGGATGGCCGCCACATGCATGAAGTGTGTGGTGGGATCCTGCGCCGGCGTGAACACCGGGGGCCTGCAGAGGGAGCGGCCACCCAGCCCGGGGCCTGCAAGCAGGCAGGCAGCCATTCGCCAGCAGCCCCGGGCCCGGGCTGACTCACTGGGGGCCCCCTGCTGTGGCCTGGACCCTCACGCTATCCCGGGGAGAAGCAGAGAGGCCCCCAAGGGTCCTGGGGCCTGGAGGCAGGGTCCAGGCGGTAGCGGCTCCATGTCCTCGGACTCCAGCAGCCCAGACAGCCCGGGCATCCCCGAAAGGTCCCCCCGCTGGCCTGAGGGTGCCTGCAGGCAACCGGGGGCCCTGCAGGGAGAGATGAGTGCCTTGTTTGCTCAAAAGCTGGAGGAGATCAGGAGTAAATCCCCCATGTTCTCCGCCGGTAAGCCCCTCTTGCCCTGCGTGGTCCTCCCGCACGCCCCTGGCATGGCTGGGCCTGGGTCACCTGCTGCTGCTTCTGCGTGGACGGTGTCGCCTCGTGTGCTCGTGCTCGTGGCTCTGTATCCGTGGCACTGTCTCCGTGGCACTCTGCTCCCTTGGCTTGCCTGTGGCCCATAGCCCCAGCCCTCCTGTCTGAGCTTGAGGCCCTGGGACTTGGGTGGAGCTGGTTTGAGGCCCGACAGGCTGGGAAGAACCAGCTGCTCTTGCTGAGGGTCTGGGGCCGGGACTGTGGCCTGACATGCTGGGCCCCTCCGGCTGGGCGCTTCCCCAAACTCACCTCCTGGGCGGCTGGCGACCTGCATGGCCCCTGATGCCTTTCCTGGGACTGGGGGCCACGTACCATCCCATTCCCACCTCCCTCTAGGGCAGGCTCCAGGGGTCCCTACTGGGAAGTCTGATGTGGGCAGGTAGTGCAGCTGCTGGGCGTCTCCTGCGCCCCTGGGACGCCTGGAGCCTGCTGAGTGCTGCGTGGAGTAGATTCCCTGGGCCCCAGGGCTTCGCTGCTTTGGGCTGAAGCACCCCACTAGAAGGGTGTCTCCTTAGCCTGGAGGGAGGGACATACACGGAGCCCGCCCCACACCACCCTGCCCCTCCAGACCCCCCTGACCAAGCTTTCCTTTCTGCCCCCACCCACGCTGCCTCCGTAGTTAGGAACTGAGAGCGGCGAGTGACAGGTAACGGGGCCCAGCCCCGGTGTCCCGTGCTGTCCCAGCCCAAGGAGGGCCCCGTGTGCGGCACAGGGCGTGGACTGGGCCCCAGCAGCAGCAGGGTGGGGACACCGAGTGTGCCGCGCCCGGGGGATGCCTCGGGGTGGGAGCTGGGCCTGGCGACCCTCGGCACAGGGCACCGGGGACACCACCCTGATCCGACTCCTCTCCGCCTCTCTCCCTGCCTCCCTCTCTCTCTTCTGCTTCTCCCTCTGGCTCTCTCTCACTCCCCCACCTCCCCACAGACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGCTCAGGAAACAGGGCAGCCAGGCCCCCAAAACTGTGTCCCCCTGGCTGCCCTGTGTCCCCTCCACCCCTGCCTCCCTCCTGCCCCTGCTCCCGGGGAGGAAAGGCTAAAGCTGCTGGCCCGGGGCCCACAGGAGGGGCTTCGAGGCTGGCCCTGCCAGGCAGTTTTCCCGGCGTTTTAGGATCTGTACATAGAGAAATATTTAAATTTTTAGAAGCAAAACTTATACAACATTAAAATGATACCAAGTCCCTT +>ENST00000462379 +GGTGGGGGCCAGCCCCACACAGGCGGGAGGGGTGGGAGTTGGGGGCGGGCCGGGCATCGCGATGGGCCCTGATGCCACCCCCACTCCTGTGTCCCAGATCATCGACCCCTTTGTGGAGGTGGAGATCATTGGGCTCCCTGTGGACTGCAGCAGGGAGCAGACCCGCGTGGTGGACGACAACGGGTTCAACCCCACCTGGGAGGAGACCCTGGTTTTCATGGTGCACATGCCGGAGATCGCGCTGGTCCGCTTCCTCGTCTGGGACCACGATCCCATCGGGCGTGACTTCATTGGCCAGAGGACGCTGGCCTTCAGCAGCATGATGCCAGGCTACAGACACGTGTACCTAGAAGGGATGGAAGAGGCCTCCATCTTCGTGCATGTGGCTGTCAGTGACATCAGCGGTAAGGTCAAGCAGGCTCTGGGCCTAAAAGGCCTCTTCCTCCGAGGCCCAAAGCCCGGCTCGCTGGACAGTCATGCTGCTGGGCGGCCCCCGGCCCGGCCCTCCGTTAGCCAGCGGATCCTGCGGCGCACGGCCAGCGCCCCGACCAAGAGCCAGAAGCCGGGCCGCAGGGGCTTCCCGGAGCTGGTCCTGGGTACACGGGACACAGGCTCCAAGGGGGTGGCAGACGATGTGGTGCCCCCCGGGCCCGGACCTGCTCCGGAAGCCCCAGCCCAGGAGGGGCCCGGCAGCGGCAGCCCCCGAGTTAGGAACTGAGAGCGGCGAGTGACAGACACCCGCCCCCTCTCCACGCAGCGGCCACTCCCCCCACTGTGCAGCCTGGAAACCATCGCTGAGGAGCCCGCCCCAGGCCCTGGTCCCCCGCCACCAGCGGCTGTCCCCACCAGCTCTTCTCAGGGACGGCCCCCATACCCCACAGGACCCGGAGCCAATGTGGCAAGCCCCCTAGAGGACACTGAGGAGCCCCGAGACAGCAGGCCTCGGCCGTGCAACGGCGAGGGCGCCGGCGGGGCATACGAGAGGGCCCCCGGCAGCCAGACGGACGGCAGGAGCCAGCCCCGGACCCTGGGCCACCTGCCCGTGATTAGAAGGGTGAAGAGTGAGGGGCAGGTGCCCACGGAGCCCCTGGGAGGGTGGCGGCCCCTGGCCGCTCCCTTTCCAGCTCCTGCCGTGTACTCCGATGCCACGGGCAGTGACCCGCTGTGGCAGCGGCTGGAGCCATGTGGCCACCGAGACAGCGTTTCCTCCTCCTCCAGCATGTCATCCAGCGACACTGTCATTGACCTCTCCCTGCCCAGCCTGGGCCTGGGCCGCAGCCGTGAGAACCTCGCTGGAGCCCACATGGGACGCCTGCCCCCCAGGCCCCACTCGGCTTCGGCTGCCCGCCCAGACCTGCCACCTGTGACCAAGAGCAAATCCAACCCCAACCTTCGGGCTACAGGCCAGCGGCCTCCCATACCTGACGAACTGCAGCCCAGGTCCCTGGCCCCAAGGATGGCTGGCCTCCCCTTCCGGCCTCCCTGGGGCTGCCTTTCCCTGGTGGGCGTGCAGGACTGCCCCGTGGCTGCCAAGTCCAAGAGCCTGGGCGACCTCACTGCTGATGACTTTGCCCCTAGCTTTGAGGGCGGCTCCCGCAGACTGAGCCACAGCCTGGGCCTCCCGGGAGGGACACGGCGGGTGTCGGGGCCAGGGGTGAGACGGGACACCCTGACAGAGCAGCTGCGCTGGCTCACTGTCTTCCAGCAGGCAGGAGACATCACGTCACCCACCAGCCTGGGCCCGGCTGGGGAGGGGGTGGCAGGGGGCCCTGGTTTTGTGCGGCGCTCCTCCTCCCGCAGCCACAGCCGCGTGCGTGCCATTGCCAGCCGGGCCCGCCAGGCCCAGGAGCGGCAGCAGAGACTGCAGGGCCTGGGCCGGCAGGGACCCCCAGAAGAGGAGCGGGGCACCCCCGAGGGCGCCTGCTCCGTGGGCCACGAGGGCAGTGTGGATGCACCAGCACCCTCCAAGGGAGCCCTCGGGCCAGCATCCGCGGCTGCTGAAAACCTGGTCCTGCTCCGCCTCTGACCGTCAGTGGTGGGAACCTGGGCGGCTCTGGAGGCCCAGGGCAGGGGTGGGCGTGTTGTTTGCTCAGGAAACAGGGCAGCCAGGCCCCCAAAACTGTGTCCCCCTGGCTGCCCTGTGTCCCCTCCACCCCTGCCTCCCTCCTGCCCCTGCTCCCGGGGAGGAAAGGCTAAAGCTGCTGGCCCGGGGCCCACAGGAGGGGCTTCGAGGCTGGCCCTGCCAGGCAGTTTTCCCGGCGTTTTAGGATCTGTACATAGAGAAATATTTAAATTTTTAGAAGCAAAACTTATACAACATTAAAATGATACCAAGTCCCTT +>ENST00000511072 +GGTGTCCAAACTGACAATGCTGGGGAGATGAAGATAGTGTGTGGCTGCTTCTGGACTCAAGGAGGAGGAGAGAGATTCCGCGAGCCGACACCATGCGATCCAAGGCGAGGGCGAGGAAGCTAGCCAAAAGTGACGGTGACGTTGTAAATAATATGTATGAGCCCAACCGGGACCTGCTGGCCAGCCACAGCGCGGAGGACGAGGCCGAGGACAGTGCCATGTCGCCCATCCCCGTGGGGCCACCGTCCCCCTTCCCCACCAGCGAGGACTTCACCCCCAAGGAGGGCTCGCCGTACGAGGCCCCTGTCTACATTCCTGAAGACATTCCGATCCCAGCAGACTTCGAGCTCCGAGAGTCCTCCATCCCAGGGGCTGGCCTGGGGGTCTGGGCCAAGAGGAAGATGGAAGCCGGGGAGAGGCTGGGCCCCTGCGTGGTGGTGCCCCGGGCGGCGGCAAAGGAGACAGACTTCGGATGGGAGCAAATACTGACGGACGTGGAAGTGTCGCCCCAGGAAGGCTGCATCACAAAGCAGATCTCCGAAGACCTGGGCAGTGAGAAGTTCTGCGTGGATGCAAATCAGGCGGGGGCTGGCAGCTGGCTCAAGTACATCCGTGTGGCGTGCTCCTGCGATGACCAGAACCTCACCATGTGTCAGATCAGTGAGCAGATTTACTATAAAGTCATTAAGGACATTGAGCCAGGTGAGGAGCTGCTGGTGCACGTGAAGGAAGGCGTCTACCCCCTGGGCACAGTGCCGCCCGGCCTGGACGAGGAGCCCACGTTCCGCTGTGACGAGTGTGACGAACTCTTCCAGTCCAAGCTGGACCTGCGGCGCCATAAGAAGTACACGTGTGGCTCAGTGGGGGCTGCGCTCTACGAGGGCCTGGCTGAGGAGCTCAAGCCCGAGGGCCTTGGCGGTGGCAGCGGCCAAGCCCACGAGTGCAAGGACTGCGAGCGGATGTTCCCCAACAAGTACAGCCTGGAGCAGCACATGGTCATCCACACGGAGGAGCGCGAGTACAAATGCGACCAGTGTCCCAAGGCCTTCAACTGGAAGTCCAACCTCATCCGCCACCAGATGTCCCACGACAGCGGCAAACGCTTCGAATGTGAAAACTGCGTGAAGGTGTTCACGGACCCCAGCAACCTTCAGCGGCACATCCGCTCGCAGCACGTGGGCGCTCGGGCCCACGCCTGCCCCGACTGCGGGAAGACCTTCGCCACGTCCTCCGGCCTCAAGCAGCACAAGCATATCCACAGCACGGTGAAGCCTTTCATATGTGAGGTCTGCCACAAGTCCTACACGCAGTTCTCCAACCTGTGCCGGCACAAGCGGATGCACGCCGACTGCCGCACGCAGATCAAGTGCAAGGACTGTGGCCAGATGTTCAGCACTACCTCCTCCCTCAACAAGCACCGGCGCTTCTGCGAGGGCAAGAACCATTACACGCCGGGCGGCATCTTTGCCCCGGGCCTGCCCTTGACCCCCAGCCCCATGATGGACAAGGCAAAACCCTCCCCCAGCCTCAATCACGCCAGCCTGGGCTTCAACGAGTACTTTCCCTCCAGGCCGCACCCGGGGAGCCTGCCCTTCTCCACGGCGCCTCCCACGTTCCCCGCACTCACCCCCGGCTTCCCGGGCATCTTCCCTCCATCCTTGTACCCCCGGCCGCCTCTGCTACCTCCCACATCGCTGCTCAAGAGCCCCCTGAACCACACCCAGGACGCCAAGCTCCCCAGTCCCCTGGGGAACCCAGCCCTGCCCCTGGTCTCCGCCGTCAGCAACAGCAGCCAGGGCACGACGGCAGCTGCGGGGCCCGAGGAGAAGTTCGAGAGCCGCCTGGAGGACTCCTGTGTGGAGAAGCTGAAGACCAGGAGCAGCGACATGTCGGACGGCAGTGACTTTGAGGACGTCAACACCACCACGGGGACCGACCTGGACACGACCACGGGGACGGGCTCGGACCTGGACAGCGACGTGGACAGCGACCCTGACAAGGACAAGGGCAAGGGCAAGTCCGCCGAGGGCCAGCCCAAGTTTGGGGGCGGCTTGGCGCCCCCGGGGGCCCCGAACAGCGTGGCCGAGGTGCCTGTCTTCTATTCCCAGCACTCATTCTTCCCGCCACCCGACGAGCAGCTGCTGACTGCAACGGGCGCCGCCGGGGACTCCATCAAGGCCATCGCATCCATTGCCGAGAAGTACTTTGGCCCCGGCTTCATGGGGATGCAGGAGAAGAAGCTGGGCTCGCTCCCCTACCACTCGGCGTTCCCCTTCCAGTTCCTGCCCAACTTCCCCCACTCCCTTTACCCCTTCACGGACCGAGCCCTCGCCCACAACTTGCTGGTCAAGGCCGAGCCAAAGTCACCCCGGGACGCCCTCAAGGTGGGCGGCCCCAGTGCCGAGTGCCCCTTTGATCTCACCACCAAGCCCAAAGACGTGAAGCCCATCCTGCCCATGCCCAAGGGCCCCTCGGCCCCCGCATCCGGCGAGGAGCAGCCGCTGGACCTGAGCATCGGCAGCCGGGCCCGTGCCAGCCAAAACGGCGGCGGGCGGGAGCCCCGCAAGAACCACGTCTATGGGGAACGCAAGCTGGGCGCCGGCGAGGGGCTGCCCCAGGTGTGCCCGGCGCGGATGCCCCAGCAGCCCCCGCTCCACTACGCCAAGCCCTCGCCCTTCTTCATGGACCCCATCTACAGCAGGGTAGAAAAGCGGAAGGTCACAGACCCCGTGGGAGCCCTGAAGGAGAAGTACCTGCGGCCGTCCCCGCTGCTCTTCCACCCCCAGATGTCAGCCATAGAGACCATGACAGAGAAGCTGGAGAGCTTTGCAGCCATGAAGGCGGACTCGGGCAGCTCCCTGCAGCCCCTCCCCCACCACCCCTTCAACTTCCGGTCCCCACCCCCAACGCTCTCCGACCCCATCCTCAGGAAGGGCAAGGAGCGATACACGTGCAGGTACTGTGGGAAGATCTTCCCCAGATCAGCCAATCTCACCAGACACCTGAGGACGCACACTGGGGAGCAGCCGTACAGGTGTAAGTACTGCGACCGCTCCTTCAGCATCTCTTCGAACCTCCAGCGGCACGTCCGGAACATCCACAACAAGGAGAAGCCTTTCAAGTGCCACCTGTGCAACCGCTGCTTCGGGCAGCAGACCAACCTGGACCGGCACCTCAAGAAGCACGAGCACGAGAACGCACCAGTGAGCCAGCACCCCGGGGTCCTCACGAACCACCTGGGGACCAGCGCGTCCTCTCCCACCTCAGAGTCGGACAACCACGCACTTTTAGACGAGAAAGAAGACTCTTATTTCTCGGAAATCAGAAACTTTATTGCCAATAGTGAGATGAACCAAGCATCAACGCGAACAGAGAAACGGGCGGACATGCAGATCGTGGACGGCAGTGCCCAGTGTCCAGGCCTAGCCAGTGAGAAGCAGGAGGACGTGGAGGAGGAGGACGACGATGACCTGGAGGAGGACGATGAGGACAGCCTGGCCGGGAAGTCGCAGGATGACACCGTGTCCCCCGCACCCGAGCCCCAGGCCGCCTACGAGGATGAGGAGGATGAGGAGCCAGCCGCCTCCCTGGCCGTGGGCTTTGACCACACCCGAAGGCATATGCAATGATGCTGTCCCTTTCCGAAGACACTCCTCTCCACACCCCCTCCCAGGGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCTCCCCACCCACCATGGTTCATTCCGACTTTTCCAATGGAAACTCAGATCCCAAAAGTCCCTAAAGCAGTCGTAGAGTCTCACCATCTCCAAGGATTGGTCTTGAGAACACTGTTCAGTGACGGCCATGCAGGTGGCCGTCCAAAGACAGCCAACGGAGCTGCCTCGCAGAATCAGCCAGTGGGCAGGTGGACGCTCTGCTGAGACAGAAGCTGGTGGCCACTGCCGGGTGCCCGCGTGGGGTCGCGGAAGGGAATGGATAGACTGGTGTGCTCAAAAGAGAGAGATCACTCAAATGATTTTTATAATGAAATGACAAGAATAACCCTTTTGGTAACCGTATTGACTGCAGAGTCTATTTAAGCATGTGGTTTTAAAAATAGACAGTATTTTTTAAAAATCAAAAAATGACTTGCAAAT +>ENST00000607632 +AATGCTGGGGAGATGAAGATAGTGTGTGGCTGCTTCTGGACTCAAGGAGGAGGAGAGAGATTCCGCGAGCCGACACCATGCGATCCAAGGCGAGGGCGAGGAAGCTAGCCAAAAGTGACGGTGACGTTGTAAATAATATGTATGAGCCCAACCGGGACCTGCTGGCCAGCCACAGCGCGGAGGACGAGGCCGAGGACAGTGCCATGTCGCCCATCCCCGTGGGGCCACCGTCCCCCTTCCCCACCAGCGAGGACTTCACCCCCAAGGAGGGCTCGCCGTACGAGGCCCCTGTCTACATTCCTGAAGACATTCCGATCCCAGCAGACTTCGAGCTCCGAGAGTCCTCCATCCCAGGGGCTGGCCTGGGGGTCTGGGCCAAGAGGAAGATGGAAGCCGGGGAGAGGCTGGGCCCCTGCGTGGTGGTGCCCCGGGCGGCGGCAAAGGAGACAGACTTCGGATGGGAGGTGAGCGATCGCGCCTGAGTATGATTGATCACGGCCATTTATCTTGTGTTCAATCTATTTATAAAGCCGGGCTGAGCAGCCACTGCCCGAGGCGGGAGGCGCGGCCAGAGAGAGCGT +>ENST00000378391 +GAAGATAGTGTGTGGCTGCTTCTGGACTCAAGGAGGAGGAGAGAGATTCCGCGAGCCGACACCATGCGATCCAAGGCGAGGGCGAGGAAGCTAGCCAAAAGTGACGGTGACGTTGTAAATAATATGTATGAGCCCAACCGGGACCTGCTGGCCAGCCACAGCGCGGAGGACGAGGCCGAGGACAGTGCCATGTCGCCCATCCCCGTGGGGCCACCGTCCCCCTTCCCCACCAGCGAGGACTTCACCCCCAAGGAGGGCTCGCCGTACGAGGCCCCTGTCTACATTCCTGAAGACATTCCGATCCCAGCAGACTTCGAGCTCCGAGAGTCCTCCATCCCAGGGGCTGGCCTGGGGGTCTGGGCCAAGAGGAAGATGGAAGCCGGGGAGAGGCTGGGCCCCTGCGTGGTGGTGCCCCGGGCGGCGGCAAAGGAGACAGACTTCGGATGGGAGCAAATACTGACGGACGTGGAAGTGTCGCCCCAGGAAGGCTGCATCACAAAGATCTCCGAAGACCTGGGCAGTGAGAAGTTCTGCGTGGATGCAAATCAGGCGGGGGCTGGCAGCTGGCTCAAGTACATCCGTGTGGCGTGCTCCTGCGATGACCAGAACCTCACCATGTGTCAGATCAGTGAGCAGATTTACTATAAAGTCATTAAGGACATTGAGCCAGGTGAGGAGCTGCTGGTGCACGTGAAGGAAGGCGTCTACCCCCTGGGCACAGTGCCGCCCGGCCTGGACGAGGAGCCCACGTTCCGCTGTGACGAGTGTGACGAACTCTTCCAGTCCAAGCTGGACCTGCGGCGCCATAAGAAGTACACGTGTGGCTCAGTGGGGGCTGCGCTCTACGAGGGCCTGGCTGAGGAGCTCAAGCCCGAGGGCCTTGGCGGTGGCAGCGGCCAAGCCCACGAGTGCAAGGACTGCGAGCGGATGTTCCCCAACAAGTACAGCCTGGAGCAGCACATGGTCATCCACACGGAGGAGCGCGAGTACAAATGCGACCAGTGTCCCAAGGCCTTCAACTGGAAGTCCAACCTCATCCGCCACCAGATGTCCCACGACAGCGGCAAACGCTTCGAATGTGAAAACTGCGTGAAGGTGTTCACGGACCCCAGCAACCTTCAGCGGCACATCCGCTCGCAGCACGTGGGCGCTCGGGCCCACGCCTGCCCCGACTGCGGGAAGACCTTCGCCACGTCCTCCGGCCTCAAGCAGCACAAGCATATCCACAGCACGGTGAAGCCTTTCATATGTGAGGTCTGCCACAAGTCCTACACGCAGTTCTCCAACCTGTGCCGGCACAAGCGGATGCACGCCGACTGCCGCACGCAGATCAAGTGCAAGGACTGTGGCCAGATGTTCAGCACTACCTCCTCCCTCAACAAGCACCGGCGCTTCTGCGAGGGCAAGAACCATTACACGCCGGGCGGCATCTTTGCCCCGGGCCTGCCCTTGACCCCCAGCCCCATGATGGACAAGGCAAAACCCTCCCCCAGCCTCAATCACGCCAGCCTGGGCTTCAACGAGTACTTTCCCTCCAGGCCGCACCCGGGGAGCCTGCCCTTCTCCACGGCGCCTCCCACGTTCCCCGCACTCACCCCCGGCTTCCCGGGCATCTTCCCTCCATCCTTGTACCCCCGGCCGCCTCTGCTACCTCCCACATCGCTGCTCAAGAGCCCCCTGAACCACACCCAGGACGCCAAGCTCCCCAGTCCCCTGGGGAACCCAGCCCTGCCCCTGGTCTCCGCCGTCAGCAACAGCAGCCAGGGCACGACGGCAGCTGCGGGGCCCGAGGAGAAGTTCGAGAGCCGCCTGGAGGACTCCTGTGTGGAGAAGCTGAAGACCAGGAGCAGCGACATGTCGGACGGCAGTGACTTTGAGGACGTCAACACCACCACGGGGACCGACCTGGACACGACCACGGGGACGGGCTCGGACCTGGACAGCGACGTGGACAGCGACCCTGACAAGGACAAGGGCAAGGGCAAGTCCGCCGAGGGCCAGCCCAAGTTTGGGGGCGGCTTGGCGCCCCCGGGGGCCCCGAACAGCGTGGCCGAGGTGCCTGTCTTCTATTCCCAGCACTCATTCTTCCCGCCACCCGACGAGCAGCTGCTGACTGCAACGGGCGCCGCCGGGGACTCCATCAAGGCCATCGCATCCATTGCCGAGAAGTACTTTGGCCCCGGCTTCATGGGGATGCAGGAGAAGAAGCTGGGCTCGCTCCCCTACCACTCGGCGTTCCCCTTCCAGTTCCTGCCCAACTTCCCCCACTCCCTTTACCCCTTCACGGACCGAGCCCTCGCCCACAACTTGCTGGTCAAGGCCGAGCCAAAGTCACCCCGGGACGCCCTCAAGGTGGGCGGCCCCAGTGCCGAGTGCCCCTTTGATCTCACCACCAAGCCCAAAGACGTGAAGCCCATCCTGCCCATGCCCAAGGGCCCCTCGGCCCCCGCATCCGGCGAGGAGCAGCCGCTGGACCTGAGCATCGGCAGCCGGGCCCGTGCCAGCCAAAACGGCGGCGGGCGGGAGCCCCGCAAGAACCACGTCTATGGGGAACGCAAGCTGGGCGCCGGCGAGGGGCTGCCCCAGGTGTGCCCGGCGCGGATGCCCCAGCAGCCCCCGCTCCACTACGCCAAGCCCTCGCCCTTCTTCATGGACCCCATCTACAGCAGGGTAGAAAAGCGGAAGGTCACAGACCCCGTGGGAGCCCTGAAGGAGAAGTACCTGCGGCCGTCCCCGCTGCTCTTCCACCCCCAGATGTCAGCCATAGAGACCATGACAGAGAAGCTGGAGAGCTTTGCAGCCATGAAGGCGGACTCGGGCAGCTCCCTGCAGCCCCTCCCCCACCACCCCTTCAACTTCCGGTCCCCACCCCCAACGCTCTCCGACCCCATCCTCAGGAAGGGCAAGGAGCGATACACGTGCAGGTACTGTGGGAAGATCTTCCCCAGATCAGCCAATCTCACCAGACACCTGAGGACGCACACTGGGGAGCAGCCGTACAGGTGTAAGTACTGCGACCGCTCCTTCAGCATCTCTTCGAACCTCCAGCGGCACGTCCGGAACATCCACAACAAGGAGAAGCCTTTCAAGTGCCACCTGTGCAACCGCTGCTTCGGGCAGCAGACCAACCTGGACCGGCACCTCAAGAAGCACGAGCACGAGAACGCACCAGTGAGCCAGCACCCCGGGGTCCTCACGAACCACCTGGGGACCAGCGCGTCCTCTCCCACCTCAGAGTCGGACAACCACGCACTTTTAGACGAGAAAGAAGACTCTTATTTCTCGGAAATCAGAAACTTTATTGCCAATAGTGAGATGAACCAAGCATCAACGCGAACAGAGAAACGGGCGGACATGCAGATCGTGGACGGCAGTGCCCAGTGTCCAGGCCTAGCCAGTGAGAAGCAGGAGGACGTGGAGGAGGAGGACGACGATGACCTGGAGGAGGACGATGAGGACAGCCTGGCCGGGAAGTCGCAGGATGACACCGTGTCCCCCGCACCCGAGCCCCAGGCCGCCTACGAGGATGAGGAGGATGAGGAGCCAGCCGCCTCCCTGGCCGTGGGCTTTGACCACACCCGAAGGTGTGCTGAGGACCACGAAGGCGGTCTGTTAGCTTTGGAGCCGATGCCGACTTTTGGGAAGGGGCTGGACCTCCGCAGAGCAGCTGAGGAAGCATTTGAAGTTAAAGATGTGCTTAATTCCACCTTAGATTCTGAGGCTTTAAAACATACACTGTGCAGGCAGGCTAAGAACCAGGGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCTCCCCACCCACCATGGTTCATTCCGACTTTTCCAATGGAAACTCAGATCCCAAAAGTCCCTAAAGCAGTCGTAGAGTCTCACCATCTCCAAGGATTGGTCTTGAGAACACTGTTCAGTGACGGCCATGCAGGTGGCCGTCCAAAGACAGCCAACGGAGCTGCCTCGCAGAATCAGCCAGTGGGCAGGTGGACGCTCTGCTGAGACAGAAGCTGGTGGCCACTGCCGGGTGCCCGCGTGGGGTCGCGGAAGGGAATGGATAGACTGGTGTGCTCAAAAGAGAGAGATCACTCAAATGATTTTTATAATGAAATGACAAGAATAACCCTTTTGGTAACCGTATTGACTGCAGAGTCTATTTAAGCATGTGGTTTTAAAAATAGACAGTATTTTTTAAAAATCAAAAAATGACTTGCAAATTGTTTTTTAAAAGTAATTTTGCATTGCTTTGAAATTTGAGCTCATTTGCAAACCCGAGTCTGCCTGGGAACCCGCACTGTGCCTGGGTGTATTCTTTATACTGTAGATAATGGAGAAATTTTCTATCTCTGTCCCTATTTGTATAAGCCAAGGTGATGCTGGGTGCCCCGAGGCAGAACAAGAGGCGCGGGGCCACACCCGTGAACCATGCAGACGGCCGAAGAAGTCTTAGGCAGGGCGCCCTGGGCTGCAGGCCTGCCCGAGGCTGGGATGGGAAGTGTGCCTGCCCTCGTGTGACATGGAATTGGTGTCAGGACCGCCACGTGGCCTTCAGAGGAATCCACAGGTCCCCACCCAAGATCCCTCAATTATATGGGGAAGTCGAGGGCCTGTGGCTTGGATCCGCCATGCAGAGATGTGGCCGGGCACCCATCTTCCTTCCCTCCTCTGTCCCTGCCTCGGCCACCCCACGCGGGAACCCAGCGCCGTCCTCTGAAGGCAGGGCCTTGGCCACGTCCTGGGTCTCCCACCTCCCACCTGACCCCAGCGGCTCCGGTGTCCTCCACGTGGCTGCCCTGGGGAGCAATCCCAGCGGATCGCTCCGGGCCACCAAGCCGCACCTGTGCCTGAGACTCCGGATGGACGACACAGTCGTCACGTCGCTCTTCCTGCGGGTTCTTGGCGAGACACAGCTTGAGAACAGAAGGGCGTCGGGGGAACCTGCCGCAAGGAGCAGAGACAGCACAGCCCCCCGGGCCCAGCCGCCTCCCTCTCTTGGGACGCAACTTCTTCCCCACTCGGATGGGCTTTAAATTATTCCCATAGGGGCCAATTTCAAATAATAATTTTTTTCCCTGATGGAATTTACCTTAATCTGTATATAACTTGTAATTTTTTCTAATTCATTTCTTTTCTTATTTTATTTCCTCCTTAACAGTATTTTTGGCATTAGACATTCTTATTGTGAAGAAATAATGTTAATATAAGTATCTGGTGAAGGACCAAAACCGTGTGATAAGGTTGTGTGTCGTGTGGGAGTGGGGCGATTTTTTATGTGCCAAATACCCCCGTCCCCCCCA +>ENST00000514189 +GCTGCTTCTGGACTCAAGGAGGAGGAGAGAGATTCCGCGAGCCGACACCATGCGATCCAAGGCGAGGGCGAGGAAGCTAGCCAAAAGTGACGGTGACGTTGTAAATAATATGTATGAGCCCAACCGGGACCTGCTGGCCAGCCACAGCGCGGAGGACGAGGCCGAGGACAGTGCCATGTCGCCCATCCCCGTGGGGCCACCGTCCCCCTTCCCCACCAGCGAGGACTTCACCCCCAAGGAGGGCTCGCCGTACGAGGCCCCTGTCTACATTCCTGAAGACATTCCGATCCCAGCAGACTTCGAGCTCCGAGAGTCCTCCATCCCAGGGGCTGGCCTGGGGGTCTGGGCCAAGAGGAAGATGGAAGCCGGGGAGAGGCTGGGCCCCTGCGTGGTGGTGCCCCGGGCGGCGGCAAAGGAGACAGACTTCGGATGGGAGCAAATACTGACGGACGTGGAAGTGTCGCCCCAGGAAGGCTGCATCACAAAGCAGATCTCCGAAGACCTGGGCAGTGAGAAGTTCTGCGTGGATGCAAATCAGGCGGGGGCTGGCAGCTGGCTCAAGTACATCCGTGTGGCGTGCTCCTGCGATGACCAGAACCTCACCATGTGTCAGATCAGTGAGCAGATTTACTATAAAGTCATTAAGGACATTGAGCCAGGTGAGGAGCTGCTGGTGCACGTGAAGGAAGGCGTCTACCCCCTGGGCACAGTGCCGCCCGGCCTGGACGAGGAGCCCACGTTCCGCTGTGACGAGTGTGACGAACTCTTCCAGTCCAAGCTGGACCTGCGGCGCCATAAGAAGTACACGTGTGGCTCAGTGGGGGCTGCGCTCTACGAGGGCCTGGCTGAGGAGCTCAAGCCCGAGGGCCTTGGCGGTGGCAGCGGCCAAGCCCACGAGTGCAAGGACTGCGAGCGGATGTTCCCCAACAAGTACAGCCTGGAGCAGCACATGGTCATCCACACGGAGGAGCGCGAGTACAAATGCGACCAGTGTCCCAAGGCCTTCAACTGGAAGTCCAACCTCATCCGCCACCAGATGTCCCACGACAGCGGCAAACGCTTCGAATGTGAAAACTGCGTGAAGGTGTTCACGGACCCCAGCAACCTTCAGCGGCACATCCGCTCGCAGCACGTGGGCGCTCGGGCCCACGCCTGCCCCGACTGCGGGAAGACCTTCGCCACGTCCTCCGGCCTCAAGCAGCACAAGCATATCCACAGCACGGTGAAGCCTTTCATATGTGAGGTCTGCCACAAGTCCTACACGCAGTTCTCCAACCTGTGCCGGCACAAGCGGATGCACGCCGACTGCCGCACGCAGATCAAGTGCAAGGACTGTGGCCAGATGTTCAGCACTACCTCCTCCCTCAACAAGCACCGGCGCTTCTGCGAGGGCAAGAACCATTACACGCCGGGCGGCATCTTTGCCCCGGGCCTGCCCTTGACCCCCAGCCCCATGATGGACAAGGCAAAACCCTCCCCCAGCCTCAATCACGCCAGCCTGGGCTTCAACGAGTACTTTCCCTCCAGGCCGCACCCGGGGAGCCTGCCCTTCTCCACGGCGCCTCCCACGTTCCCCGCACTCACCCCCGGCTTCCCGGGCATCTTCCCTCCATCCTTGTACCCCCGGCCGCCTCTGCTACCTCCCACATCGCTGCTCAAGAGCCCCCTGAACCACACCCAGGACGCCAAGCTCCCCAGTCCCCTGGGGAACCCAGCCCTGCCCCTGGTCTCCGCCGTCAGCAACAGCAGCCAGGGCACGACGGCAGCTGCGGGGCCCGAGGAGAAGTTCGAGAGCCGCCTGGAGGACTCCTGTGTGGAGAAGCTGAAGACCAGGAGCAGCGACATGTCGGACGGCAGTGACTTTGAGGACGTCAACACCACCACGGGGACCGACCTGGACACGACCACGGGGACGGGCTCGGACCTGGACAGCGACGTGGACAGCGACCCTGACAAGGACAAGGGCAAGGGCAAGTCCGCCGAGGGCCAGCCCAAGTTTGGGGGCGGCTTGGCGCCCCCGGGGGCCCCGAACAGCGTGGCCGAGGTGCCTGTCTTCTATTCCCAGCACTCATTCTTCCCGCCACCCGACGAGCAGCTGCTGACTGCAACGGGCGCCGCCGGGGACTCCATCAAGGCCATCGCATCCATTGCCGAGAAGTACTTTGGCCCCGGCTTCATGGGGATGCAGGAGAAGAAGCTGGGCTCGCTCCCCTACCACTCGGCGTTCCCCTTCCAGTTCCTGCCCAACTTCCCCCACTCCCTTTACCCCTTCACGGACCGAGCCCTCGCCCACAACTTGCTGGTCAAGGCCGAGCCAAAGTCACCCCGGGACGCCCTCAAGGTGGGCGGCCCCAGTGCCGAGTGCCCCTTTGATCTCACCACCAAGCCCAAAGACGTGAAGCCCATCCTGCCCATGCCCAAGGGCCCCTCGGCCCCCGCATCCGGCGAGGAGCAGCCGCTGGACCTGAGCATCGGCAGCCGGGCCCGTGCCAGCCAAAACGGCGGCGGGCGGGAGCCCCGCAAGAACCACGTCTATGGGGAACGCAAGCTGGGCGCCGGCGAGGGGCTGCCCCAGGTGTGCCCGGCGCGGATGCCCCAGCAGCCCCCGCTCCACTACGCCAAGCCCTCGCCCTTCTTCATGGACCCCATCTACAGGGTAGAAAAGCGGAAGGTCACAGACCCCGTGGGAGCCCTGAAGGAGAAGTACCTGCGGCCGTCCCCGCTGCTCTTCCACCCCCAGATGTCAGCCATAGAGACCATGACAGAGAAGCTGGAGAGCTTTGCAGCCATGAAGGCGGACTCGGGCAGCTCCCTGCAGCCCCTCCCCCACCACCCCTTCAACTTCCGGTCCCCACCCCCAACGCTCTCCGACCCCATCCTCAGGAAGGGCAAGGAGCGATACACGTGCAGGTACTGTGGGAAGATCTTCCCCAGATCAGCCAATCTCACCAGACACCTGAGGACGCACACTGGGGAGCAGCCGTACAGGTGTAAGTACTGCGACCGCTCCTTCAGCATCTCTTCGAACCTCCAGCGGCACGTCCGGAACATCCACAACAAGGAGAAGCCTTTCAAGTGCCACCTGTGCAACCGCTGCTTCGGGCAGCAGACCAACCTGGACCGGCACCTCAAGAAGCACGAGCACGAGAACGCACCAGTGAGCCAGCACCCCGGGGTCCTCACGAACCACCTGGGGACCAGCGCGTCCTCTCCCACCTCAGAGTCGGACAACCACGCACTTTTAGACGAGAAAGAAGACTCTTATTTCTCGGAAATCAGAAACTTTATTGCCAATAGTGAGATGAACCAAGCATCAACGCGAACAGAGAAACGGGCGGACATGCAGATCGTGGACGGCAGTGCCCAGTGTCCAGGCCTAGCCAGTGAGAAGCAGGAGGACGTGGAGGAGGAGGACGACGATGACCTGGAGGAGGACGATGAGGACAGCCTGGCCGGGAAGTCGCAGGATGACACCGTGTCCCCCGCACCCGAGCCCCAGGCCGCCTACGAGGATGAGGAGGATGAGGAGCCAGCCGCCTCCCTGGCCGTGGGCTTTGACCACACCCGAAGGCATATGCAATGATGCTGTCCCTTTCCGAAGACACTCCTCTCCACACCCCCTCCCAGGGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCTCCCCACCCACCATGGTTCATTCCGACTTTTCCAATGGAAACTCAGATCCCAAAAGTCCCTAAAGCAGTCGTAGAGTCTCACCATCTCCAAGGATTGGTCTTGAGAACACTGTTCAGTGACGGCCATGCAGGTGGCCGTCCAAAGACAGCCAACGGAGCTGCCTCGCAGAATCAGCCAGTGGGCAGGTGGACGCTCTGCTGAGACAGAAGCTGGTGGCCACTGCCGGGTGCCCGCGTGGGGTCGCGGAAGGGAATGGATAGACTGGTGTGCTCAAAAGAGAGAGATCACTCAAATGATTTTTATAATGAAATGACAAGAATAACCCTTTTGGTAACCGTATTGACTGCAGAGTCTATTTAAGCATGTGGTTTTAAAAATAGACAGTATTTTTTAAAAATCAAAAAATGACTTGCAAAT +>ENST00000270722 +GCTGCTTCTGGACTCAAGGAGGAGGAGAGAGATTCCGCGAGCCGACACCATGCGATCCAAGGCGAGGGCGAGGAAGCTAGCCAAAAGTGACGGTGACGTTGTAAATAATATGTATGAGCCCAACCGGGACCTGCTGGCCAGCCACAGCGCGGAGGACGAGGCCGAGGACAGTGCCATGTCGCCCATCCCCGTGGGGCCACCGTCCCCCTTCCCCACCAGCGAGGACTTCACCCCCAAGGAGGGCTCGCCGTACGAGGCCCCTGTCTACATTCCTGAAGACATTCCGATCCCAGCAGACTTCGAGCTCCGAGAGTCCTCCATCCCAGGGGCTGGCCTGGGGGTCTGGGCCAAGAGGAAGATGGAAGCCGGGGAGAGGCTGGGCCCCTGCGTGGTGGTGCCCCGGGCGGCGGCAAAGGAGACAGACTTCGGATGGGAGCAAATACTGACGGACGTGGAAGTGTCGCCCCAGGAAGGCTGCATCACAAAGATCTCCGAAGACCTGGGCAGTGAGAAGTTCTGCGTGGATGCAAATCAGGCGGGGGCTGGCAGCTGGCTCAAGTACATCCGTGTGGCGTGCTCCTGCGATGACCAGAACCTCACCATGTGTCAGATCAGTGAGCAGATTTACTATAAAGTCATTAAGGACATTGAGCCAGGTGAGGAGCTGCTGGTGCACGTGAAGGAAGGCGTCTACCCCCTGGGCACAGTGCCGCCCGGCCTGGACGAGGAGCCCACGTTCCGCTGTGACGAGTGTGACGAACTCTTCCAGTCCAAGCTGGACCTGCGGCGCCATAAGAAGTACACGTGTGGCTCAGTGGGGGCTGCGCTCTACGAGGGCCTGGCTGAGGAGCTCAAGCCCGAGGGCCTTGGCGGTGGCAGCGGCCAAGCCCACGAGTGCAAGGACTGCGAGCGGATGTTCCCCAACAAGTACAGCCTGGAGCAGCACATGGTCATCCACACGGAGGAGCGCGAGTACAAATGCGACCAGTGTCCCAAGGCCTTCAACTGGAAGTCCAACCTCATCCGCCACCAGATGTCCCACGACAGCGGCAAACGCTTCGAATGTGAAAACTGCGTGAAGGTGTTCACGGACCCCAGCAACCTTCAGCGGCACATCCGCTCGCAGCACGTGGGCGCTCGGGCCCACGCCTGCCCCGACTGCGGGAAGACCTTCGCCACGTCCTCCGGCCTCAAGCAGCACAAGCATATCCACAGCACGGTGAAGCCTTTCATATGTGAGGTCTGCCACAAGTCCTACACGCAGTTCTCCAACCTGTGCCGGCACAAGCGGATGCACGCCGACTGCCGCACGCAGATCAAGTGCAAGGACTGTGGCCAGATGTTCAGCACTACCTCCTCCCTCAACAAGCACCGGCGCTTCTGCGAGGGCAAGAACCATTACACGCCGGGCGGCATCTTTGCCCCGGGCCTGCCCTTGACCCCCAGCCCCATGATGGACAAGGCAAAACCCTCCCCCAGCCTCAATCACGCCAGCCTGGGCTTCAACGAGTACTTTCCCTCCAGGCCGCACCCGGGGAGCCTGCCCTTCTCCACGGCGCCTCCCACGTTCCCCGCACTCACCCCCGGCTTCCCGGGCATCTTCCCTCCATCCTTGTACCCCCGGCCGCCTCTGCTACCTCCCACATCGCTGCTCAAGAGCCCCCTGAACCACACCCAGGACGCCAAGCTCCCCAGTCCCCTGGGGAACCCAGCCCTGCCCCTGGTCTCCGCCGTCAGCAACAGCAGCCAGGGCACGACGGCAGCTGCGGGGCCCGAGGAGAAGTTCGAGAGCCGCCTGGAGGACTCCTGTGTGGAGAAGCTGAAGACCAGGAGCAGCGACATGTCGGACGGCAGTGACTTTGAGGACGTCAACACCACCACGGGGACCGACCTGGACACGACCACGGGGACGGGCTCGGACCTGGACAGCGACGTGGACAGCGACCCTGACAAGGACAAGGGCAAGGGCAAGTCCGCCGAGGGCCAGCCCAAGTTTGGGGGCGGCTTGGCGCCCCCGGGGGCCCCGAACAGCGTGGCCGAGGTGCCTGTCTTCTATTCCCAGCACTCATTCTTCCCGCCACCCGACGAGCAGCTGCTGACTGCAACGGGCGCCGCCGGGGACTCCATCAAGGCCATCGCATCCATTGCCGAGAAGTACTTTGGCCCCGGCTTCATGGGGATGCAGGAGAAGAAGCTGGGCTCGCTCCCCTACCACTCGGCGTTCCCCTTCCAGTTCCTGCCCAACTTCCCCCACTCCCTTTACCCCTTCACGGACCGAGCCCTCGCCCACAACTTGCTGGTCAAGGCCGAGCCAAAGTCACCCCGGGACGCCCTCAAGGTGGGCGGCCCCAGTGCCGAGTGCCCCTTTGATCTCACCACCAAGCCCAAAGACGTGAAGCCCATCCTGCCCATGCCCAAGGGCCCCTCGGCCCCCGCATCCGGCGAGGAGCAGCCGCTGGACCTGAGCATCGGCAGCCGGGCCCGTGCCAGCCAAAACGGCGGCGGGCGGGAGCCCCGCAAGAACCACGTCTATGGGGAACGCAAGCTGGGCGCCGGCGAGGGGCTGCCCCAGGTGTGCCCGGCGCGGATGCCCCAGCAGCCCCCGCTCCACTACGCCAAGCCCTCGCCCTTCTTCATGGACCCCATCTACAGCAGGGTAGAAAAGCGGAAGGTCACAGACCCCGTGGGAGCCCTGAAGGAGAAGTACCTGCGGCCGTCCCCGCTGCTCTTCCACCCCCAGATGTCAGCCATAGAGACCATGACAGAGAAGCTGGAGAGCTTTGCAGCCATGAAGGCGGACTCGGGCAGCTCCCTGCAGCCCCTCCCCCACCACCCCTTCAACTTCCGGTCCCCACCCCCAACGCTCTCCGACCCCATCCTCAGGAAGGGCAAGGAGCGATACACGTGCAGGTACTGTGGGAAGATCTTCCCCAGATCAGCCAATCTCACCAGACACCTGAGGACGCACACTGGGGAGCAGCCGTACAGGTGTAAGTACTGCGACCGCTCCTTCAGCATCTCTTCGAACCTCCAGCGGCACGTCCGGAACATCCACAACAAGGAGAAGCCTTTCAAGTGCCACCTGTGCAACCGCTGCTTCGGGCAGCAGACCAACCTGGACCGGCACCTCAAGAAGCACGAGCACGAGAACGCACCAGTGAGCCAGCACCCCGGGGTCCTCACGAACCACCTGGGGACCAGCGCGTCCTCTCCCACCTCAGAGTCGGACAACCACGCACTTTTAGACGAGAAAGAAGACTCTTATTTCTCGGAAATCAGAAACTTTATTGCCAATAGTGAGATGAACCAAGCATCAACGCGAACAGAGAAACGGGCGGACATGCAGATCGTGGACGGCAGTGCCCAGTGTCCAGGCCTAGCCAGTGAGAAGCAGGAGGACGTGGAGGAGGAGGACGACGATGACCTGGAGGAGGACGATGAGGACAGCCTGGCCGGGAAGTCGCAGGATGACACCGTGTCCCCCGCACCCGAGCCCCAGGCCGCCTACGAGGATGAGGAGGATGAGGAGCCAGCCGCCTCCCTGGCCGTGGGCTTTGACCACACCCGAAGGTGTGCTGAGGACCACGAAGGCGGTCTGTTAGCTTTGGAGCCGATGCCGACTTTTGGGAAGGGGCTGGACCTCCGCAGAGCAGCTGAGGAAGCATTTGAAGTTAAAGATGTGCTTAATTCCACCTTAGATTCTGAGGCTTTAAAACATACACTGTGCAGGCAGGCTAAGAACCAGGCATATGCAATGATGCTGTCCCTTTCCGAAGACACTCCTCTCCACACCCCCTCCCAGGGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCTCCCCACCCACCATGGTTCATTCCGACTTTTCCAATGGAAACTCAGATCCCAAAAGTCCCTAAAGCAGTCGTAGAGTCTCACCATCTCCAAGGATTGGTCTTGAGAACACTGTTCAGTGACGGCCATGCAGGTGGCCGTCCAAAGACAGCCAACGGAGCTGCCTCGCAGAATCAGCCAGTGGGCAGGTGGACGCTCTGCTGAGACAGAAGCTGGTGGCCACTGCCGGGTGCCCGCGTGGGGTCGCGGAAGGGAATGGATAGACTGGTGTGCTCAAAAGAGAGAGATCACTCAAATGATTTTTATAATGAAATGACAAGAATAACCCTTTTGGTAACCGTATTGACTGCAGAGTCTATTTAAGCATGTGGTTTTAAAAATAGACAGTATTTTTTAAAAATCAAAAAATGACTTGCAAATTGTTTTTTAAAAGTAATTTTGCATTGCTTTGAAATTTGAGCTCATTTGCAAACCCGAGTCTGCCTGGGAACCCGCACTGTGCCTGGGTGTATTCTTTATACTGTAGATAATGGAGAAATTTTCTATCTCTGTCCCTATTTGTATAAGCCAAGGTGATGCTGGGTGCCCCGAGGCAGAACAAGAGGCGCGGGGCCACACCCGTGAACCATGCAGACGGCCGAAGAAGTCTTAGGCAGGGCGCCCTGGGCTGCAGGCCTGCCCGAGGCTGGGATGGGAAGTGTGCCTGCCCTCGTGTGACATGGAATTGGTGTCAGGACCGCCACGTGGCCTTCAGAGGAATCCACAGGTCCCCACCCAAGATCCCTCAATTATATGGGGAAGTCGAGGGCCTGTGGCTTGGATCCGCCATGCAGAGATGTGGCCGGGCACCCATCTTCCTTCCCTCCTCTGTCCCTGCCTCGGCCACCCCACGCGGGAACCCAGCGCCGTCCTCTGAAGGCAGGGCCTTGGCCACGTCCTGGGTCTCCCACCTCCCACCTGACCCCAGCGGCTCCGGTGTCCTCCACGTGGCTGCCCTGGGGAGCAATCCCAGCGGATCGCTCCGGGCCACCAAGCCGCACCTGTGCCTGAGACTCCGGATGGACGACACAGTCGTCACGTCGCTCTTCCTGCGGGTTCTTGGCGAGACACAGCTTGAGAACAGAAGGGCGTCGGGGGAACCTGCCGCAAGGAGCAGAGACAGCACAGCCCCCCGGGCCCAGCCGCCTCCCTCTCTTGGGACGCAACTTCTTCCCCACTCGGATGGGCTTTAAATTATTCCCATAGGGGCCAATTTCAAATAATAATTTTTTTCCCTGATGGAATTTACCTTAATCTGTATATAACTTGTAATTTTTTCTAATTCATTTCTTTTCTTATTTTATTTCCTCCTTAACAGTATTTTTGGCATTAGACATTCTTATTGTGAAGAAATAATGTTAATATAAGTATCTGGTGAAGGACCAAAACCGTGTGATAAGGTTGTGTGTCGTGTGGGAGTGGGGCGATTTTTTATGTGCCAAATACCCCCGTCCCCCCCATGAATCCTGCTGTCCCTGCTGCCGTTTACCAGACAATCATATGTTTTTGTTAAATTTGCGTTTCAGTTACATTTGCATTTAAGACAAGTGTTCTATTTATTTCTTGTATTGTTTGGAAGAAAAAATGATGATAGAGTCCCAAAAAGAAGAGAAAAAAAATGCCCAAGTTGCCCTTTAAAAAAAAAGAGCGTAAATACAAACAGGAGTGGTGCAAGCCGCCTTGGTGTGGGTTTGTGTCACGTGTGGACATCTCCTCAGGCTTTGTGTCACGCGTGGACATCTCCTCAGGCTGTCCCCAGCGGTGACGGGAGGTGTCCTGGCTGCTCCAGGACAAAAGACAATCGTCTCTGTGGGTGCCGGGTGGTCCAGGCTTGCACTGAAGACGTGCCACGGGGAGGCTCCTGCAGGAGGCTCAACCCGACGGATCACAGTGAAAGGGATTCCTCCCACGCCAGATCTGCACAACGAGGCAAGACAGGACCCACCTGTGCGTGCGCTGGGGCCATGGGGTGGCCCCGCCGGGGCAGCGGGGGAGCTGCCTGCAGAAGAGCCAGCTGGCGTGTCGGGAAGGATCCAGGATCTGCAAACACAACTGCTCAGGCCTTCTCACGCGTTTCCACAACATCCCCTGGGTCAGACCCACCAGGTACCCCGTAGGAATTTCCAGTTTCCCTTGATCTAGATGGGATTCTTATAAAAATTCAACCTCAGACATAAACACCCCATTTCTGTAAACCCAAATTATATGGTTTCTTCTGCGAAAGAGTAAGGTGTGTGCTTTTTTTTTTTTGCAATATGACCCCGTCTCTCTGAAGTGGGACATTCGGACGGATGGAGCCCTCAGCGTGTCTTTTCAGCAGGAGCAGAACCGATGAGAGCCGCCCTTACCGTTGGTCTCCGGATCCCCCAGTCCCATCCCGCCGTTTTCGGCTGTCTTCCTAACCGTCCTGTCTTCTCTTGGCGCTCTTTCCTTCCACCTTTCCCAAGAGTCCTGGTTGCACGTTTTAAGTCATATATTTTCGTCCCCCTGAAAATGATGGCAAGCCCAGTTTCTCCTGAGCATTCAGACCCCCAGGCCCCAGCACTTGGCGTTTTCAGGAGGCCCTGTTCTTAGAGCCCCTGACAAAGGCAGCACTTATTTCCTGGGCTGGTGCGCCCCAAAACACGGCCCCGACACTTAGTGTGGCCCCAGGCCCCAGCGAGCCTCGCCCTCCCAGTTTTGCTCTGCCCAGCAGTGTTGGTGCCCAGAGATGACAAGGGCCAGGGAGCCTGGCCCGGGTGTGAGAATTCAGAGATTCTGGCCTCCAGCTGTCACCACACCGTAACGGGGCCATGTAACTGTGCAGCATGGACAGGGATGCGACGGGGCAGCTGGCTGTGTCCATGGCCAGGTGGCCAGGGTCAGGGCTGCAAGCCAGGGGTCCAGGGCCCTTCCGTTCAGCCCAAATGCTGCCCCAATGCTAACTCCTTGGATTGTCAACCCCCATCCCCCAAATGGAAATTCCGAAGGAGGCCTCCTCGCACCTGCCCTCCGCTGCTCCTCAGACCCCAGCCCCCAGCGAGCCGACGTCCCCACCCGTTCCTGCTCTCATCCCCAGGTTGGGCACGTGGGGTTCCTCCTCTGTGGGCCTGGCAGACCCTTCATGAGTGGGACCCAAGATATCACTGACTTCAACCCAGAGGATCGAGCCCCTGCACCCTGCCTGGGGCCCTGGGGTGTGGAGCAGTGGCTGGGGTGGGCGTGGTGTGGCCTGAGAGACTGCCCAGCTGGAGAGGCCTTCCTTTACAAGGCCACGCGTGCAGCTGTCCCATCCAGACCCCGACTGGCCAAGACCTCCACGTCCCCAGAGTCCAGCCCTGGAAATTCCAAGGGCCCTGGCGTCCTCTGCCTTCCCCGCTTCCCCATGAGCGTCTGCAAAACACTTGCCTGAATACATATCACGTATTTTAGACTCGAAGCCTCAAAGCACTGGATTGTGGTCCCCTGCCCCCTCTGTCCCGTCCCCCTGCCCAAGTGACTGAAACCTACTGAGCTATATTCACTGTGCTGTCCTAGGGGGAGGGAGAGCAGAGCTCGCCCCTGCACTGCAGCCTTGTGGGGGAGGGCAAGGCTCTCCTCCCAGCCAGGGACGCCAGGACATAGCTGCTCCTGGTCAGTGGAGGTCAGCCGGGTATCAAAAGCCATGAAACTGTGTCTCTGTAGCAATGAGTGATACTGTGACAAAACCATCCTTGCATTCTTCCTAGAAGAGTTCCTCTGCTCCTTCCATTCCATTTTTGTGTTTGTTTTGTTCTTTTCTGTCACTGATCCGTATTACCACTTTTGGAAAAAAATAAATAAATAAATAAATAAAAGGCAGCTTGAGTTTCCAAACGTGTGATTCACTTGTGAACAAAAGTCATTCTAACAATTGCCTTCAGCGTCACGTGCATTGCCACTGCGCTTTCGGCACGAGGGATGCTGAGCCCTGGTGTCAGAGTCGTAATTTAAAGCGTGTGTGTATATGGACTTTGTCCCTTAAGGTCGATATAAAGAATCCTCGCAGAATCACAGACCTGTGCCGCCCGCCACCTTCTGCCATTGTTACATTACAGATTTGGTTTAGTTTTGTTTTGTTTTGTTTTTTCTTTTAGAACTGTATAGTATTGAAAAAGAAATCAAATGTAAATGTCTGGTTTTCATATAATGTTTAAAAAGACCATTGAGAAGGAGGCTGGCGCTCGCCCCATGTCCCCCTTGATTGTAAATTGCTTCTGTTCTGTTTATAAGTAAACTGTGCATGACTCCTGCTTAGCGGTCATTATCGTGTCTGTTGGTGAAATTTTTATTAAAAGGAAAATTCTGTAGATGCACTTATTGAATATGTGATTAGGATCTACGTCTGAGACTAGGAGTCCTGAACTGCTGACGCGAAAGAGGCGCAGTTCCCAATTAATACGGAAATCGCTGTGGGAGAAGAATGAAATAAGACGTGAAGTGTAGGAAATCATGAAAAGAACAATTTTGCAAATTGCATTCTGATGCTTGTGATGAACACAAATGTACTTGTGTAGAGACATTTCCTTAAGAGAAAGCCTAGGAGAAGCCGATTTGGAGGTTAATGCTGTAGAATAGGACTGTATACCAAATGTAATCTTTCCAATGCTCCAATGAATTTATACATGAGATTGATATGCAATAAATCTGTGTGCTTTTCTAA +>ENST00000512462 +AAGCACAAGGCCCCATCTCACCAGGTCAGCGGAGATGCTGCCTGCCTGGAGCTCGGGTCCCATGGGGTTGGGGGCGAAGATGCTGCATCCCAGTGCTGTTCCCTGCTCGGGGCCCTGGAAGCAGAGCGGCCTGGCTTCTCTCATTGGCCAAAGAGGGTTTGGAAGCAAATACTGACGGACGTGGAAGTGTCGCCCCAGGAAGGCTGCATCACAAAGATCTCCGAAGACCTGGGCAGTGAGAAGTTCTGCGTGGATGCAAATCAGGCGGGGGCTGGCAGCTGGCTCAAGTACATCCGTGTGGCGTGCTCCTGCGATGACCAGAACCTCACCATGTGTCAGATCAGTGAGCAGATTTACTATAAAGTCATTAAGGACATTGAGCCAGGTGAGGAGCTGCTGGTGCACGTGAAGGAAGGCGTCTACCCCCTGGGCACAGTGCCGCCCGGCCTGGACGAGGAGCCCACGTTCCGCTGTGACGAGTGTGACGAACTCTTCCAGTCCAAGCTGGACCTGCGGCGCCATAAGAAGTACACGTGTGGCTCAGTGGGGGCTGCGCTCTACGAGGGCCTGGCTGAGGAGCTCAAGCCCGAGGGCCTTGGCGGTGGCAGCGGCCAAGCCCACGAGTGCAAGGACTGCGAGCGGATGTTCCCCAACAAGTACAGCCTGGAGCAGCACATGGTCATCCACACGGAGGAGCGCGAGTACAAATGCGACCAGTGTCCCAAGGCCTTCAACTGGAAGTCCAACCTCATCCGCCACCAGATGTCCCACGACAGCGGCAAACGCTTCGAATGTGAAAACTGCGTGAAGGTGTTCACGGACCCCAGCAACCTTCAGCGGCACATCCGCTCGCAGCACGTGGGCGCTCGGGCCCACGCCTGCCCCGACTGCGGGAAGACCTTCGCCACGTCCTCCGGCCTCAAGCAGCACAAGCATATCCACAGCACGGTGAAGCCTTTCATATGTGAGGTCTGCCACAAGTCCTACACGCAGTTCTCCAACCTGTGCCGGCACAAGCGGATGCACGCCGACTGCCGCACGCAGATCAAGTGCAAGGACTGTGGCCAGATGTTCAGCACTACCTCCTCCCTCAACAAGCACCGGCGCTTCTGCGAGGGCAAGAACCATTACACGCCGGGCGGCATCTTTGCCCCGGGCCTGCCCTTGACCCCCAGCCCCATGATGGACAAGGCAAAACCCTCCCCCAGCCTCAATCACGCCAGCCTGGGCTTCAACGAGTACTTTCCCTCCAGGCCGCACCCGGGGAGCCTGCCCTTCTCCACGGCGCCTCCCACGTTCCCCGCACTCACCCCCGGCTTCCCGGGCATCTTCCCTCCATCCTTGTACCCCCGGCCGCCTCTGCTACCTCCCACATCGCTGCTCAAGAGCCCCCTGAACCACACCCAGGACGCCAAGCTCCCCAGTCCCCTGGGGAACCCAGCCCTGCCCCTGGTCTCCGCCGTCAGCAACAGCAGCCAGGGCACGACGGCAGCTGCGGGGCCCGAGGAGAAGTTCGAGAGCCGCCTGGAGGACTCCTGTGTGGAGAAGCTGAAGACCAGGAGCAGCGACATGTCGGACGGCAGTGACTTTGAGGACGTCAACACCACCACGGGGACCGACCTGGACACGACCACGGGGACGGGCTCGGACCTGGACAGCGACGTGGACAGCGACCCTGACAAGGACAAGGGCAAGGGCAAGTCCGCCGAGGGCCAGCCCAAGTTTGGGGGCGGCTTGGCGCCCCCGGGGGCCCCGAACAGCGTGGCCGAGGTGCCTGTCTTCTATTCCCAGCACTCATTCTTCCCGCCACCCGACGAGCAGCTGCTGACTGCAACGGGCGCCGCCGGGGACTCCATCAAGGCCATCGCATCCATTGCCGAGAAGTACTTTGGCCCCGGCTTCATGGGGATGCAGGAGAAGAAGCTGGGCTCGCTCCCCTACCACTCGGCGTTCCCCTTCCAGTTCCTGCCCAACTTCCCCCACTCCCTTTACCCCTTCACGGACCGAGCCCTCGCCCACAACTTGCTGGTCAAGGCCGAGCCAAAGTCACCCCGGGACGCCCTCAAGGTGGGCGGCCCCAGTGCCGAGTGCCCCTTTGATCTCACCACCAAGCCCAAAGACGTGAAGCCCATCCTGCCCATGCCCAAGGGCCCCTCGGCCCCCGCATCCGGCGAGGAGCAGCCGCTGGACCTGAGCATCGGCAGCCGGGCCCGTGCCAGCCAAAACGGCGGCGGGCGGGAGCCCCGCAAGAACCACGTCTATGGGGAACGCAAGCTGGGCGCCGGCGAGGGGCTGCCCCAGGTGTGCCCGGCGCGGATGCCCCAGCAGCCCCCGCTCCACTACGCCAAGCCCTCGCCCTTCTTCATGGACCCCATCTACAGCAGGGTAGAAAAGCGGAAGGTCACAGACCCCGTGGGAGCCCTGAAGGAGAAGTACCTGCGGCCGTCCCCGCTGCTCTTCCACCCCCAGATGTCAGCCATAGAGACCATGACAGAGAAGCTGGAGAGCTTTGCAGCCATGAAGGCGGACTCGGGCAGCTCCCTGCAGCCCCTCCCCCACCACCCCTTCAACTTCCGGTCCCCACCCCCAACGCTCTCCGACCCCATCCTCAGGAAGGGCAAGGAGCGATACACGTGCAGGTACTGTGGGAAGATCTTCCCCAGATCAGCCAATCTCACCAGACACCTGAGGACGCACACTGGGGAGCAGCCGTACAGGTGTAAGTACTGCGACCGCTCCTTCAGCATCTCTTCGAACCTCCAGCGGCACGTCCGGAACATCCACAACAAGGAGAAGCCTTTCAAGTGCCACCTGTGCAACCGCTGCTTCGGGCAGCAGACCAACCTGGACCGGCACCTCAAGAAGCACGAGCACGAGAACGCACCAGTGAGCCAGCACCCCGGGGTCCTCACGAACCACCTGGGGACCAGCGCGTCCTCTCCCACCTCAGAGTCGGACAACCACGCACTTTTAGACGAGAAAGAAGACTCTTATTTCTCGGAAATCAGAAACTTTATTGCCAATAGTGAGATGAACCAAGCATCAACGCGAACAGAGAAACGGGCGGACATGCAGATCGTGGACGGCAGTGCCCAGTGTCCAGGCCTAGCCAGTGAGAAGCAGGAGGACGTGGAGGAGGAGGACGACGATGACCTGGAGGAGGACGATGAGGACAGCCTGGCCGGGAAGTCGCAGGATGACACCGTGTCCCCCGCACCCGAGCCCCAGGCCGCCTACGAGGATGAGGAGGATGAGGAGCCAGCCGCCTCCCTGGCCGTGGGCTTTGACCACACCCGAAGGTGTGCTGAGGACCACGAAGGCGGTCTGTTAGCTTTGGAGCCGATGCCGACTTTTGGGAAGGGGCTGGACCTCCGCAGAGCAGCTGAGGAAGCATTTGAAGTTAAAGATGTGCTTAATTCCACCTTAGATTCTGAGGCTTTAAAACATACACTGTGCAGGCAGGCTAAGAACCAGGCATATGCAATGATGCTGTCCCTTTCCGAAGACACTCCTCTCCACACCCCCTCCCAGGGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCT +>ENST00000463591 +ACAAAGATCTCCGAAGACCTGGGCAGTGAGAAGTTCTGCGTGGATGCAAATCAGGCGGGGGCTGGCAGCTGGCTCAAGTACATCCGTGTGGCGTGCTCCTGCGATGACCAGAACCTCACCATGTGTCAGATCAGTGAGCAGATGAAAGTGAAATTGGAGTGAAGGAAAATTGGGCTTGAGGCGCATAGAAGGACGGTCTTTCCGTCCCCTTCTGGGGCTCAGATTTGCAGAGTGTGTCCTTAGTCGTCCGTTGGGAAGCTGACGGGCAGGGGCACCGCGGGGCTGGGCCAGGGCTGTGCTTTTGTGAGATGCAAACTATAGTAATGAAGGGCCCAGATTTTTTTTATTTAAGAAATAAATGTTTATTAGAACTTTTGAACTAAA +>ENST00000509860 +ATTTACTATAAAGTCATTAAGGACATTGAGCCAGGTGAGGAGCTGCTGGTGCACGTGAAGGAAGGCGTCTACCCCCTGGGCACAGTGCCGCCCGGCCTGGACGAGGAGCCCACGTTCCGCTGTGACGAGTGTGACGAACTCTTCCAGTCCAAGCTGGACCTGCGGCGCCATAAGAAGTACACGTGTGGCTCAGTGGGGGCTGCGCTCTACGAGGGCCTGGCTGAGGAGCTCAAGCCCGAGGGCCTTGGCGGTGGCAGCGGCCAAGCCCACGAGTGCAAGGACTGCGAGCGGATGTTCCCCAACAAGTACAGCCTGGAGCAGCACATGGTCATCCACACGGAGGAGCGCGAGTACAAATGCGACCAGTGTCCCAAGGCCTTCAACTGGAAGTCCAACCTCATCCGCCACCAGATGTCCCACGACAGCGGCAAACGCTTCGAATGTGAAAACTGCGTGAAGGTGTTCACGGACCCCAGCAACCTTCAGCGGCACATCCGCTCGCAGCACGTGGGCGCTCGGGCCCACGCCTGCCCCGACTGCGGGAAGACCTTCGCCACGTCCTCCGGCCTCAAGCAGCACAAGCATATCCACAGCACGGTGAAGCCTTTCATATGTGAGGTCTGCCACAAGTCCTACACGCAGTTCTCCAACCTGTGCCGGCACAAGCGGATGCACGCCGACTGCCGCACGCAGATCAAGTGCAAGGACTGTGGCCAGATGTTCAGCACTACCTCCTCCCTCAACAAGCACCGGCGCTTCTGCGAGGGCAAGAACCATTACACGCCGGGCGGCATCTTTGCCCCGGGCCTGCCCTTGACCCCCAGCCCCATGATGGACAAGGCAAAACCCTCCCCCAGCCTCAATCACGCCAGCCTGGGCTTCAACGAGTACTTTCCCTCCAGGCCGCACCCGGGGAGCCTGCCCTTCTCCACGGCGCCTCCCACGTTCCCCGCACTCACCCCCGGCTTCCCGGGCATCTTCCCTCCATCCTTGTACCCCCGGCCGCCTCTGCTACCTCCCACATCGCTGCTCAAGAGCCCCCTGAACCACACCCAGGACGCCAAGCTCCCCAGTCCCCTGGGGAACCCAGCCCTGCCCCTGGTCTCCGCCGTCAGCAACAGCAGCCAGGGCACGACGGCAGCTGCGGGGCCCGAGGAGAAGTTCGAGAGCCGCCTGGAGGACTCCTGTGTGGAGAAGCTGAAGACCAGGAGCAGCGACATGTCGGACGGCAGTGACTTTGAGGACGTCAACACCACCACGGGGACCGACCTGGACACGACCACGGGGACGGGCTCGGACCTGGACAGCGACGTGGACAGCGACCCTGACAAGGACAAGGGCAAGGGCAAGTCCGCCGAGGGCCAGCCCAAGTTTGGGGGCGGCTTGGCGCCCCCGGGGGCCCCGAACAGCGTGGCCGAGGTGCCTGTCTTCTATTCCCAGCACTCATTCTTCCCGCCACCCGACGAGCAGCTGCTGACTGCAACGGGCGCCGCCGGGGACTCCATCAAGGCCATCGCATCCATTGCCGAGAAGTACTTTGGCCCCGGCTTCATGGGGATGCAGGAGAAGAAGCTGGGCTCGCTCCCCTACCACTCGGCGTTCCCCTTCCAGTTCCTGCCCAACTTCCCCCACTCCCTTTACCCCTTCACGGACCGAGCCCTCGCCCACAACTTGCTGGTCAAGGCCGAGCCAAAGTCACCCCGGGACGCCCTCAAGGTGGGCGGCCCCAGTGCCGAGTGCCCCTTTGATCTCACCACCAAGCCCAAAGACGTGAAGCCCATCCTGCCCATGCCCAAGGGCCCCTCGGCCCCCGCATCCGGCGAGGAGCAGCCGCTGGACCTGAGCATCGGCAGCCGGGCCCGTGCCAGCCAAAACGGCGGCGGGCGGGAGCCCCGCAAGAACCACGTCTATGGGGAACGCAAGCTGGGCGCCGGCGAGGGGCTGCCCCAGGTGTGCCCGGCGCGGATGCCCCAGCAGCCCCCGCTCCACTACGCCAAGCCCTCGCCCTTCTTCATGGACCCCATCTACAGGGTAGAAAAGCGGAAGGTCACAGACCCCGTGGGAGCCCTGAAGGAGAAGTACCTGCGGCCGTCCCCGCTGCTCTTCCACCCCCAGATGTCAGCCATAGAGACCATGACAGAGAAGCTGGAGAGCTTTGCAGCCATGAAGGCGGACTCGGGCAGCTCCCTGCAGCCCCTCCCCCACCACCCCTTCAACTTCCGGTCCCCACCCCCAACGCTCTCCGACCCCATCCTCAGGAAGGGCAAGGAGCGATACACGTGCAGGTACTGTGGGAAGATCTTCCCCAGATCAGCCAATCTCACCAGACACCTGAGGACGCACACTGGGGAGCAGCCGTACAGGTGTAAGTACTGCGACCGCTCCTTCAGCATCTCTTCGAACCTCCAGCGGCACGTCCGGAACATCCACAACAAGGAGAAGCCTTTCAAGTGCCACCTGTGCAACCGCTGCTTCGGGCAGCAGACCAACCTGGACCGGCACCTCAAGAAGCACGAGCACGAGAACGCACCAGTGAGCCAGCACCCCGGGGTCCTCACGAACCACCTGGGGACCAGCGCGTCCTCTCCCACCTCAGAGTCGGACAACCACGCACTTTTAGACGAGAAAGAAGACTCTTATTTCTCGGAAATCAGAAACTTTATTGCCAATAGTGAGATGAACCAAGCATCAACGCGAACAGAGAAACGGGCGGACATGCAGATCGTGGACGGCAGTGCCCAGTGTCCAGGCCTAGCCAGTGAGAAGCAGGAGGACGTGGAGGAGGAGGACGACGATGACCTGGAGGAGGACGATGAGGACAGCCTGGCCGGGAAGTCGCAGGATGACACCGTGTCCCCCGCACCCGAGCCCCAGGCCGCCTACGAGGATGAGGAGGATGAGGAGCCAGCCGCCTCCCTGGCCGTGGGCTTTGACCACACCCGAAGGTGTGCTGAGGACCACGAAGGCGGTCTGTTAGCTTTGGAGCCGATGCCGACTTTTGGGAAGGGGCTGGACCTCCGCAGAGCAGCTGAGGAAGCATTTGAAGTTAAAGATGTGCTTAATTCCACCTTAGATTCTGAGGCTTTAAAACATACACTGTGCAGGCAGGCTAAGAACCAGGCATATGCAATGATGCTGTCCCTTTCCGAAGACACTCCTCTCCACACCCCCTCCCAGGGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCTCCCCACCCACCATGGTTCATTCCGACTTTTCCAATGGAAACTCAGATCCCAAAAGTCCCTAAAGCAGTCGTAGAGTCTCACCATCTCCAAGGATTGGTCTTGAGAACACTGTTCAGTGACGGCCATGCAGGTGGCCGTCCAAAGACAGCCAACGGAGCTGCCTCGCAGAATCAGCCAGTGGGCAGGTGGACGCTCTGCTGAGACAGAAGCTGGTGGCCACTGCCGGGTGCCCGCGTGGGGTCGCGGAAGGGAATGGATAGACTGGTGTGCTCAAAAGAGAGAGATCACTCAAATGATTTTTATAATGAAATGACAAGAATAACCCTTTTGGTAACCGTATTGACTGCAGAGTCTATTTAAGCATGTGG +>ENST00000378389 +TGCCGGCCCCGCGGCCTGGGGGCCAGGGAGACCCAGACAACAGAGGGCAGGAGACGCCGGAGGGTCGGGCGCACCGCCTGCCCAGGGGACACGGGGCACACTCCAGGGGGATCCACCAGCCAGCCACAGAACAGTAGGAGGGTGTAAGTACTGCGACCGCTCCTTCAGCATCTCTTCGAACCTCCAGCGGCACGTCCGGAACATCCACAACAAGGAGAAGCCTTTCAAGTGCCACCTGTGCAACCGCTGCTTCGGGCAGCAGACCAACCTGGACCGGCACCTCAAGAAGCACGAGCACGAGAACGCACCAGTGAGCCAGCACCCCGGGGTCCTCACGAACCACCTGGGGACCAGCGCGTCCTCTCCCACCTCAGAGTCGGACAACCACGCACTTTTAGACGAGAAAGAAGACTCTTATTTCTCGGAAATCAGAAACTTTATTGCCAATAGTGAGATGAACCAAGCATCAACGCGAACAGAGAAACGGGCGGACATGCAGATCGTGGACGGCAGTGCCCAGTGTCCAGGCCTAGCCAGTGAGAAGCAGGAGGACGTGGAGGAGGAGGACGACGATGACCTGGAGGAGGACGATGAGGACAGCCTGGCCGGGAAGTCGCAGGATGACACCGTGTCCCCCGCACCCGAGCCCCAGGCCGCCTACGAGGATGAGGAGGATGAGGAGCCAGCCGCCTCCCTGGCCGTGGGCTTTGACCACACCCGAAGGCATATGCAATGATGCTGTCCCTTTCCGAAGACACTCCTCTCCACACCCCCTCCCAGGGTTCTCTGGACGCTTGGTTGAAGGTCACTGGAGCCACGTCGGAGTCTGGAGCATTTCACCCCATCAACCACCTCTGACGGGCTGGGCAGCCGGGGGCCGGTGGCCAGAGCGAGGGCACCAGCCACGAAGGACGGAGGCGGGCGGGGCCCCGGAGAACCCTGTCCCTGCGTGTGGCCACTCCTCAGCATCCTCCCCACCCACCATGGTTCATTCCGACTTTTCCAATGGAAACTCAGATCCCAAAAGTCCCTAAAGCAGTCGTAGAGTCTCACCATCTCCAAGGATTGGTCTTGAGAACACTGTTCAGTGACGGCCATGCAGGTGGCCGTCCAAAGACAGCCAACGGAGCTGCCTCGCAGAA +>ENST00000606170 +TACAGGCGCCCACCACCACGACTGGCTGATTTTTTTGTATTTTTAGTAGAGACGGGGTTTCACCATGTCAGCCAGGATGGTCTCGATCTCCTGACCTCGTGATCCACCCGCCTTGGCCTCCCAAAGTGCTGTGATTATAGGCGTGAACCCCTGCTTCTTGAAGCCGGGGCTGTTTCTAGGGACAGCTTCCCCAGGATGCCTTTGGCTCTGCAGCTGGGAGATCCAGCAACCTCCGGGACACGGCGGGGCAAAGCTGTGCACGGGGCACGGGGCAGGGGCGCGGGCTCCCTTCCCCCCACCCTCTGTGGCCCGGCCTGCCATGCAGAGCCGGGGCCTGCACTGAGGAGCGCGTGTGCCCCTTCCAGGTGTAAGTACTGCGACCGCTCCTTCAGCATCTCTTCGAACCTCCAGCGGCACGTCCGGAACATCCACAACAAGGAGAAGCCTTTCAAGTGCCACCTGTGCAACCGCTGCTTCGGGCAGCAGACCAACCTGGACCGGCACCTCAAGAAGCACGAGCACGAGAACGCACCAGTGAGCCAGCACCCCGGGGTCCT +>ENST00000378322 +GCGCCCAGGGGTCCCGCGGGTTTTCGGGCGCAGGGTGGCGCCCGCGGCAGGCGGCGGCCATGAACTTCTCCGAGGTATTCAAGCTCTCCAGCTTACTCTGCAAGTTCTCCCCGGACGGCAAGTACCTGGCTTCCTGTGTCCAGTACCGGTTAGTGGTCCGGGATGTGAACACCCTTCAGATCCTTCAGCTGTACACGTGCCTAGACCAGATCCAGCACATCGAGTGGTCGGCAGACTCGCTCTTCATCCTGTGCGCCATGTACAAGCGAGGGCTGGTGCAGGTCTGGTCTTTAGAGCAGCCCGAATGGCACTGCAAAATAGACGAGGGCTCAGCCGGGCTGGTGGCCTCGTGCTGGAGCCCGGACGGGCGCCACATTCTCAACACCACGGAATTCCATCTGCGGATAACCGTCTGGTCCTTGTGCACAAAATCCGTGTCTTACATCAAATACCCGAAAGCTTGTCTGCAGGGAATCACCTTCACCAGGGACGGCCGCTACATGGCGCTGGCAGAACGGCGCGACTGCAAAGATTACGTGAGCATCTTCGTCTGCAGTGATTGGCAGCTCCTGCGGCATTTTGATACGGACACCCAGGATCTCACAGGGATTGAGTGGGCCCCAAACGGCTGTGTGCTGGCAGTGTGGGACACCTGCTTGGAGTACAAGATTCTGCTGTACTCATTGGATGGCCGGTTGTTGTCCACGTACAGCGCTTACGAGTGGTCCCTGGGCATCAAGTCTGTGGCCTGGAGCCCCAGCAGTCAGTTCCTGGCAGTTGGGAGCTATGATGGAAAGGTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCATTAATGATCCCAAGATAGTGGTGTATAAGGAGGCCGAGAAGAGCCCACAGCTGGGACTGGGCTGCCTCTCCTTCCCGCCGCCCCGGGCCGGGGCCGGCCCTCTCCCGAGCTCAGAGAGTAAATATGAGATCGCCTCTGTCCCAGTCTCCTTACAGACACTGAAACCTGTTACCGACAGAGCAAACCCGAAAATCGGCATAGGAATGCTGGCATTTAGTCCTGACAGCTACTTCCTGGCGACAAGGAACGACAACATTCCCAATGCCGTCTGGGTCTGGGACATTCAGAAGCTGAGGCTGTTCGCGGTGCTCGAGCAGCTGTCCCCAGTGCGCGCATTTCAGTGGGACCCGCAGCAGCCGCGGCTGGCCATCTGCACGGGAGGCAGCAGGCTCTACCTGTGGTCCCCAGCGGGCTGCATGTCGGTGCAGGTGCCTGGGGAAGGTAAGCACATCCCCGAGGCCACGGACGTGGCAGCCTTGCTGTGTGCAGTCTGGCATCACACGGGCTGAACTGTTGAAGCCCAGCTGCTGTCTCCGGCAGCACTCCAGGGAAACTGCCCTCAGAGTCTTTGCGTAAACCTCAAGACGGACACACAGGGGACCCGCTGCCCTCAGCTTTATGGGCTAGAAGCAGCCTCTCCCTGACTTGAGGCAGCTCTGGGGCTCCACCCTGGCTCTGCCTATGTGGGTCACTCCAGGCACTGTGCTGGCCTGCAGGACAAGGGGGTGCCCATCCCCCAGAATCTGGGCCTCCCCTGCTGTAATCCTCTGGCCACCTGTCTCTCTCTAGGCGACTTTGCAGTGCTCTCTCTGTGCTGGCATTTAAGCGGAGACTCGATGGCCCTCCTCAGCAAGGATCACTTCTGCCTCTGCTTCCTGGAGACAGAGGCAGTGGTCGGCACAGCCTGCAGACAGCTGGGCGGCCACACGTAGCAGCGGTGCACTAACGTGTGCAGAAACAGGGCTACTCTGTGTTTCCAGTGTGGGAAAAAACACAGCTTCACCAGGAGGTTCTCCACTGTGGTGGTCTGGATTCAGTGATTGATTCTATTTTTCTATAGCAAAGCATTTTTGTAAATATGTATGGTATAAAACTGTAGTTTTATTATTTAAAATAAATACTTGCTGATTTATACAACTA +>ENST00000270708 +GTTGCAGCCTGCTGCGCGCCCAGGGGTCCCGCGGGTTTTCGGGCGCAGGGTGGCGCCCGCGGCAGGCGGCGGCCATGAACTTCTCCGAGGTATTCAAGCTCTCCAGCTTACTCTGCAAGTTCTCCCCGGACGGCAAGTACCTGGCTTCCTGTGTCCAGTACCGGTTAGTGGTCCGGGATGTGAACACCCTTCAGATCCTTCAGCTGTACACGTGCCTAGACCAGATCCAGCACATCGAGTGGTCGGCAGACTCGCTCTTCATCCTGTGCGCCATGTACAAGCGAGGGCTGGTGCAGGTCTGGTCTTTAGAGCAGCCCGAATGGCACTGCAAAATAGACGAGGGCTCAGCCGGGCTGGTGGCCTCGTGCTGGAGCCCGGACGGGCGCCACATTCTCAACACCACGGAATTCCATCTGCGGATAACCGTCTGGTCCTTGTGCACAAAATCCGTGTCTTACATCAAATACCCGAAAGCTTGTCTGCAGGGAATCACCTTCACCAGGGACGGCCGCTACATGGCGCTGGCAGAACGGCGCGACTGCAAAGATTACGTGAGCATCTTCGTCTGCAGTGATTGGCAGCTCCTGCGGCATTTTGATACGGACACCCAGGATCTCACAGGGATTGAGTGGGCCCCAAACGGCTGTGTGCTGGCAGTGTGGGACACCTGCTTGGAGTACAAGATTCTGCTGTACTCATTGGATGGCCGGTTGTTGTCCACGTACAGCGCTTACGAGTGGTCCCTGGGCATCAAGTCTGTGGCCTGGAGCCCCAGCAGTCAGTTCCTGGCAGTTGGGAGCTATGATGGAAAGGTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCATTAATGATCCCAAGATAGTGGTGTATAAGGAGGCCGAGAAGAGCCCACAGCTGGGACTGGGCTGCCTCTCCTTCCCGCCGCCCCGGGCCGGGGCCGGCCCTCTCCCGAGCTCAGAGAGTAAATATGAGATCGCCTCTGTCCCAGTCTCCTTACAGACACTGAAACCTGTTACCGACAGAGCAAACCCGAAAATCGGCATAGGAATGCTGGCATTTAGTCCTGACAGCTACTTCCTGGCGACAAGGAACGACAACATTCCCAATGCCGTCTGGGTCTGGGACATTCAGAAGCTGAGGCTGTTCGCGGTGCTCGAGCAGCTGTCCCCAGTGCGCGCATTTCAGTGGGACCCGCAGCAGCCGCGGCTGGCCATCTGCACGGGAGGCAGCAGGCTCTACCTGTGGTCCCCAGCGGGCTGCATGTCGGTGCAGGTGCCTGGGGAAGGCGACTTTGCAGTGCTCTCTCTGTGCTGGCATTTAAGCGGAGACTCGATGGCCCTCCTCAGCAAGGATCACTTCTGCCTCTGCTTCCTGGAGACAGAGGCAGTGGTCGGCACAGCCTGCAGACAGCTGGGCGGCCACACGTAGCAGCGGTGCACTAACGTGTGCAGAAACAGGGCTACTCTGTGTTTCCAGTGTGGGAAAAAACACAGCTTCACCAGGAGGTTCTCCACTGTGGTGGTCTGGATTCAGTGATTGATTCTATTTTTCTATAGCAAAGCATTTTTGTAAATATGTATGGTATAAAACTGTAGTTTTATTATTTAAAATAAATACTTGCTGATTTATACAACTA +>ENST00000471223 +GTGGGAAGCAAGATGATTCCCTGGTAGGCTCCACGGGGTCTCAGTGGGAAATGCAGGTGGAGGGACACAGCAGCCCTGGAAGTCCCGCGGCGCTGCCACGGGGAGGGCTGGACCACCCACTGCGGTGCCTCTCCCTCAGCAGGCACGCCCTCGTCGGCCTGGTTAGAAAATCATCTTTTGGCCTCACTGTGCCAGCCTAGTCAGCTCTCAGCTCCCTGAGTCAGGGAAAGGGGTGGAAAAGTGGACAGTCCAGCAGCGCATGTTCTAGAACCCTCTGCAGATGCAGCCAGGCCAGCGAGCACACGCAGGAGGCAGACGGACACCTTCTTGGGTGTTGAGTGGCTGCTCCTGCCTCAGGGCTGCAGATGCAGGCTCACAGCCCCCTGGTGAGTCCCGGAGTGGCTGCATCCAATCTCCAGATCCTCTGTCTTCCCATAAAGGAGACTGAACCCGTGGTGGTTTCTAGATCAAGATTTTTCTCTGAGTAACTCAGGGTTATTATAACATGCAACCTATGGTCACTTTGAAAAAGCTAATGAAAAAGCACTTGGATTTAACTTTGTGTCACTCAATTTTGGTATAAAACAACAACAACAGAAAACCAAGAACACCAAATTTACCGTAACCACAGTAAAATACGCATTTGAATATTCCGGTAGGAGGGCAGGCATCCCCCAGGTCCTGATAGATCCACTCCAGCAGTCAGGCCTGTGCTTGGGGACGCGTGGGCGGGTTGAGGATTGAGACGGTCTCTGATGATGCTAAAGAAGTGTTTCCTTTCTCTTTCCCCTTTCCCCCAACAGCTGCGGATAACCGTCTGGTCCTTGTGCACAAAATCCGTGTCTTACATCAAATACCCGAAAGCTTGTCTGCAGGGAATCACCTTCACCAGGGACGGCCGCTACATGGCGCTGGCAGAACGGCGCGACTGCAAAGATTACGTGAGCATCTTCGTCTGCAGTGATTGGCAGCTCCTGCGGGTAAGGCGTCCCCCAGACTGGAATAAAGTTGTCCTGCTGACTGTGGAGGGATCGAGTGAAGTAGATCCTTCCAGATTCCAGGGGATCTTTGGTAGGATATGGAGCAAGGTGATGTTGTATTAACAAAGGGCAGGTGCGCTGCGAATCACTTCCAGTGGCACCCGGTTGTGTGTTCAGGAGACTTGGTGAAAAGGACGCGTGCCCAGGTGTTTTAAAAGTGAATATGCTGTCACATTTGAGCCCTTTTCCTTGTCCTGTGTGATGGTGTTTGCGCATGTGTGTGCCACGTCGGGAGTTGGGGGGACGTGGAAGTTCACCTTGACTGAGGGCCTGCATTAGGCAGGGCGCTCTGCCAGGTGCCCAGGCACAGAGGGCACTGCCCCCACAGCAGACATATGAACACGATTCCAGCACAATCCATCATTAAGGTAGAGCAACCTCTGGAATGCTGTCAGAGTGCAGAACCCGGGATCCAGGCAGTGCTCTGGAAGGGACTTGTCTGAGCTGGGTCTAAAGGAGTGAGCCTGGCCAGGCAAGGAAAGGTGAGGGGGAGAGTGTGCACATGAGTGCAGGTGCGGGGAGACCAAGCCACCTTCGGGGGCTGGCCAGGCAAGGAAAGGTGAGGGGGAGAGTGTGCACACGAGTGCAGGCGCGGGGAGACCAAGCCGCCCTCGGGGGCTGGCCAGGCAAGGAAAGGTGAGGGGGAGAGTGTGCACACGAGTGCAGGCGCGGGGAGACCAAGCCGCCCTTGGGGGCTGGCCAGGCACTGACGCTGGCATCTGTGGCGGTGCAGCCCCAGCAGCAGCTCTACAGGGATTTCATGCATTTCCAGGATAGAGCTGTTGAGATTTTGTCAATTTCTATATAAGGAAATTAAGTGCGTTAAGAACATCAGTCATAAATGCAATTATTTATTTACGAAAATATTTTCCAAATTTAATGTTTCCCCCCCTTCCTTTGGAAGCATTTTGATACGGACACCCAGGATCTCACAGGGATTGAGTGGGCCCCAAACGGCTGTGTGCTGGCAGTGTGGGACACCTGCTTGGAGGTATGAAGATGACCAGGTGACATGTTTGCTTTCGAGAGCTTTTCCCGGAATTTCATGCTTTCTGAATGCTGCAATATAGTTTGCTTTATCTTATTTCAGATAACAAGTTGAGCTTTGTTTTAAAAGACAGGGTCTTGCTCTGTCACCCAGGCTGGAGTGCAGTGGTGTGATCACGGCCCACTGCAGCCTCGACCTCCTGGACTCAAGTGATCCTCCTACCTCAGCCTCCCAAGTAGCTGGGACCACAAGCATGCACCACCACGCCCGGCTAATTTTTGTATTCTTTGTAGAGATGGGGTTTCACCGTGTTGCCCAGACTGCTCTTGAACTTCTGTGTTCAAGTGATCTGCCAGCTTCGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACAGTGCCCGGCCGAGTTGAACTTTTATCAGCGAGCCATTAGGTTGACCTCCCAATTTCCCCTTTTTCCTCATGCTCTCACTGCCTCTCCGTGACTATCTCAGTACTAGCTGGCAGTTCCAGCTTTTCCACGGCCACGCGGACAGTCCTGCCAGCTTTGTGCTATCTGCACCAATGTCACTCTGCAGCACCCGCGTCTGTGGTGTGTTCCTGGCGACGGGGGTGTATTCATTATTAACTGAAATGTCTCATCTGCAGTACAAGATTCTGCTGTACTCATTGGATGGCCGGTTGTTGTCCACGTACAGCGCTTACGAGTGGTCCCTGGGCATCAAGTCTGTGGCCTGGAGCCCCAGCAGTCAGTTCCTGGCAGTTGGGAGCTATGATGGAAAGGTGGGAACCAGTGCAGGGCACTCAGGAAGTCCGACCGCCCAGCGGGCCGGGCCCTGCCTCACCTGTGCATGGTTTCCTTCCTCAGGTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCATTAATGATCCCAAGATAGTAAGTCTGGAACACGTGTTTCTGCCTGAGCAGGCTGTTGGGGAGGGCGGTGGGAAACTGCTCCTTCACTTTGCTTTCTTGATTGTGGTTTATTATTTAACCGGGCACTTCCATCACCGTAAACTTGCTACTGTGACATTTCACGCGTCTGGCCCTGCCCTGGCCTTTGTTCTTCCTCCTCCACGCTGCCCAAAGGGTCTGAAGTGGGCCTTGCCCTGGCCTGTCCTCTGCCGCTGCCACCCCAGTCCAGTTTTCTCCTTTGTGGTCTGTCTGGATGCAGATCCCTGTGCTGTACAGAGTGGCCAGGGTCTCCTGCCCCCAAACACTGGGCATCTGCTGTCGTGCCAGGCACTGTGCTCTGGGCCGCAGCCAGAGAAGAAGAGACAGACCCCTGCACTTGCAGAGTGCGGCTGGAGAGACAGGGAAGGGGCTGGAGAGCTGGGTGTCTCCACGGGGTGGCAGGGAGTGGCCACCAGCGAGGGATCGCAGGCACAGATGCTGCACCAGTGATCAGGGACTCGGGGAGGGAGCGTTCCAGGCCAAGGGAACAGGAAATGCAAAGGCCCCGAGGAGTGGGCCACGCATCCATGTGTGCAGCGGGCACTGCGCTGGGAGCCAGAGACAAATGCTGCCCTCCTGGTGTTGACCTGTAACCGACAGAGCTGAGTGAAAGGCGGCTTGGATTCGATGAAGAGGCCAGTGAGTGGCTGGGGCTGCGCATGCCAGATCAGCCACTGCCGGGGATGCATCCTGGAGGGGTGTTTAAGTGAAGACCAGGAGGAGGAGCTGCGCGGTGTCTGGGCAGAAAGGGTGTTTCAGGCAGAGGGGCCTCCTGACGTGGCCAGTGGCTTGTGTGGCTGGAGGCCAGGGTGTCTGGACAGGTGAGCCCGAGCAGGGCTGGCCACACAGGTCCTGAAGGTTTGCCTGTGATTCCTGCATTCTCCAAATCCCTTCGCCACACAGCAGCAGAGCATGCTTTAAAGGCATGAACCAGGCCAGGTGACTCCCTTACCTGGGGCTCTTCAGGGGCGTAGGGGCTGCCCGCCTTCCACTGAGCCTGGGCCGCTGTCCTTTGCTTGCCAGGCTCTCGGGCACAGATGCCCCCACCTCGGGTCTGTGTCTGCTGCTCCCGGGGCCTCTGCTGTGTTGGTGCAAGTGTTCTCTGTATCCTCTTATCACGGAGGGAAGGCTGAGCCCACTCCCTTGCTGGATGATGGTGGCTGCAGTGGTCTCCCGTCTGTAATCACAGGGCACACATTTGCTGCCTGTGTCTCAAAGGGTGGGCTCCTCAGCAGGACACGAGAGAGGGTGGCTGGGTGATCTCAGCTCTCGGGACTGCGGGGTTCGTGCTTCCGTCTCTCCCGGTGGCAGCAGGACCAGCTGTCATGGCAGGCACACCTGTTGACCATGCGCTGTCATGGGCATTTGCCACGTCCATCCTTGGCTTCCGGGTCCCTGTCCTGAGCCGGGCGTGGCCACCTTGTGTCTTTCAGGTGGTGTATAAGGAGGCCGAGAAGAGCCCACAGCTGGGACTGGGCTGCCTCTCCTTCCCGCCGCCCCGGGCCGGGGCCGGCCCTCTCCCGAGCTCAGAGAGTAAATGTAAGTAGCACATGTGATGTCATTTGTTTTCCTTTTTTAATGCAAGATTCCTCGTTGTCCAGATAAACTTCGGATGTTCCTTATGTTTAAAAAAAAAAACTTTTTTTCCCTTCCATGCTTCCAGCCAGTGTGCCCCTCAGCCTGTTGGCTGGAGGTTGACTAGGGTCTGAATTGCGCAGTGGGCCGTGAAGGTGCGGCTTCTGTTACTGAATATGAGCCCTGGAGACCCGGATCTGACAGCGGGAGCTCCGAGGGGATGTTTTTCCGGAGCTCCGAGAATGATGTTTTTCAAAGAAACACTTTTCCGTGGGTGGCGCTCAGAGTGGGTCTGGAACCCGGCGGTGCTCCCGAGCGCTGTCTCCGGCTTGAGGCCCGGTTCTGATGCAGCCTCTTGACTCTGGGCATTTCCTATGTGTCTGTTTCCTCATCGCTGAAATGGGCATAGTAAAAGCACCCATCCCACAGGGGCATGAGGGCATCTGAAGGTTGCAGGTAGAGGAAGCGGTGCCCCAAGTGCCGACGGGCCCACCCCGGGGCTCGGTGTGTGCTCAGGATGGGGGTCAGGACAGGTGCAGCCTGGCACACAGGAGGCGCTCCCCAGGAGCCCAGGGGCGTCCTTGTTCCACAGCCCCTGCTTCTGCTGTGATGATGGTTCTTCCACAGCCGGAAAGTCTAAGGGTACTGACGCTGAGGTGGAAGGGATTGTGAACTCAGATGCTGGTAGTCGACAGAAAAGTGCTGAGGAGTTGGAGCTGCTGAGATTGCAGCTAGGACCTGTCCATGTCCCTCTCCAGTCAGCCCCTGGCACGTGGGGTCCACCCCCCACCTAGTCGGGCCTGGCAGGTGATGGTGCCACTCTCATCCGGGGCACTTGCGGGCAGGCCCCTCGCTGCGGCTGCCAGGCTTTGCTTAGCTCTTCCTGCCCTTGGGCCGCACTTTCCTCCCCTTTGAACAGAGGAGCTGGGTTCGCGATGCCCGATGCAGGCACAGCAGCCTCTCAGCCGCGTGCGTACTTCCCGAAAGGGTGACAATGGCGTGTTCTTCCTGTTGGTGTTCTAGATGAGATCGCCTCTGTCCCAGTCTCCTTACAGACACTGAAACCTGTTACCGACAGAGCAAACCCGAAAATCGGCATAGGAATGCTGGCATTTAGTCCTGACAGCTACTTCCTGGCGACAAGGAACGGTCAGTTGTGCTGACGCAGGTGCTGTCTCACCCTTTACTGTGTCCTGTGGCCCCAGGTGTAGAAGCGACTGGAAAAGAAAATGAAGTTGGGGGTTTCCGACACGTCACCTCCTTTCACGTTTCTGCAGTAGCCGAGGTGCTCACAGAAGCTCCTTGGAGGCGCTGGGCCTTTGTCCTGCAGCAGCCGCAGGTCCGCGCATGAGTCAGGAGGCCTCCACCCTGCTCACTTGCTCCACTCTGCTGAGTAGAAAGCAGGGCTGGGCACACTGCAGCCCGCCTTTTGTTAAGGGTTTCTCCATTTGTAAAGGGCTAAAAAAAAAAAAAAAA +>ENST00000424367 +GGGTGGCGCCCGCGGCAGGCGGCGGCCATGAACTTCTCCGAGGTATTCAAGCTCTCCAGCTTACTCTGCAAGTTCTCCCCGGACGGCAAGTACCTGGCTTCCTGTGTCCAGTACCGGTTAGTGGTCCGGGATGTGAACACCCTTCAGATCCTTCAGCTGTACACGTGCCTAGACCAGATCCAGCACATCGAGTGGTCGGCAGACTCGCTCTTCATCCTGTGCGCCATGTACAAGCGAGGGCTGGTGCAGGTCTGGTCTTTAGAGCAGCCCGAATGGCACTGCAAAATAGACGAGGGCTCAGCCGGGCTGGTGGCCTCGTGCTGGAGCCCGGACGGGCGCCACATTCTCAACACCACGGAATTCCATCTGCGGATAACCGTCTGGTCCTTGTGCACAAAATCCGTGTCTTACATCAAATACCCGAAAGCTTGTCTGCAGGGAATCACCTTCACCAGGGACGGCCGCTACATGGCGCTGGCAGAACGGCGCGACTGCAAAGATTACGTGAGCATCTTCGTCTGCAGTGATTGGCAGCTCCTGCGGCATTTTGATACGGACACCCAGGATCTCACAGGGATTGAGTGGGCCCCAAACGGCTGTGTGCTGGCAGTGTGGGACACCTGCTTGGAGGTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCATTAATGATCCCAAGATAGTGGTGTATAAGGAGGCCGAGAAGAGCCCACAGCTGGGACTGGGCTGCCTCTCCTTCCCGCCGCCCCGGGCCGGGGCCGGCCCTCTCCCGAGCTCAGAGAGTAAATATGAGATCGCCTCTGTCCCAGTCTCCTTACAGACACTGAAACCTGTTACCGACAGAGCAAACCCGAAAATCGGCATAGGAATGCTGGCATTTAGTCCTGACAGCTACTTCCTGGCGACAAGGAACG +>ENST00000497940 +GAACGGCGCGACTGCAAAGATTACGTGAGCATCTTCGTCTGCAGTGATTGGCAGCTCCTGCGGCATTTTGATACGGACACCCAGGATCTCACAGGGATTGAGTGGGCCCCAAACGGCTGTGTGCTGGCAGTGTGGGACACCTGCTTGGAGTACAAGATTCTGCTGTACTCATTGGATGGCCGGTTGTTGTCCACGTACAGCGCTTACGAGTGGTCCCTGGGCATCAAGTCTGTGGCCTGGAGCCCCAGCAGTCAGTTCCTGGCAGTTGGGAGCTATGATGGAAAGGTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCATTAATGATCCCAAGATAGTGGTGTATAAGGAGGCCGAGAAGAGCCCACAGCTGGGACTGGGCTGCCTCTCCTTCCCGCCGCCCCGGGCCGGGGCCGGCCCTCTCCCGAGCTCAGAGAGTAAATGTAAGTAGCACATGTGATGTCATTTGTTTTCCTTTTTTAATGCAAGATTCCTCGTTGTCCAGATAAACTTCGGATGTTCCTTATGTTTAAAAAAAAAAACTTTTTTTCCCTTCCATGCTTCCAGCCAGTGTGCCCCTCAGCCTGTTGGCTGGAGGTTGACTAGGGTCTGAATTGCGCAGTGGGCCGTGAAGGTGCGGCTTCTGTTACTGAATATGAGCCCTGGAGACCCGGATCTGACAGCGGGAGCTCCGAGGGGATGTTTTTCCGGAGCTCCGAGAATGATGTTTTTCAAAGAAACACTTTTCCGTGGGTGGCGCTCAGAGTGGGTCTGGAACCCGGCGGTGCTCCCGAGCGCTGTCTCCGGCTTGAGGCCCGGTTCTGATGCAGCCTCTTGACTCTGGGCATTTCCTATGTGTCTGTTTCCTCATCGCTGAAATGGGCATAGTAAAAGCACCCATCCCACAGGGGCATGAGGGCATCTGAAGGTTGCAGGTAGAGGAAGCGGTGCCCCAAGTGCCGACGGGCCCACCCCGGGGCTCGGTGTGTGCTCAGGATGGGGGTCAGGACAGGTGCAGCCTGGCACACAGGAGGCGCTCCCCAGGAGCCCAGGGGCGTCCTTGTTCCACAGCCCC +>ENST00000469643 +AGTACTAGCTGGCAGTTCCAGCTTTTCCACGGCCACGCGGACAGTCCTGCCAGCTTTGTGCTATCTGCACCAATGTCACTCTGCAGCACCCGCGTCTGTGGTGTGTTCCTGGCGACGGGGGTGTATTCATTATTAACTGAAATGTCTCATCTGCAGTACAAGATTCTGCTGTACTCATTGGATGGCCGGTTGTTGTCCACGTACAGCGCTTACGAGTGGTCCCTGGGCATCAAGTCTGTGGCCTGGAGCCCCAGCAGTCAGTTCCTGGCAGTTGGGAGCTATGATGGAAAGGTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCATTAATGATCCCAAGATAGTGGTGTATAAGGAGGCCGAGAAGAGCCCACAGCTGGGACTGGGCTGCCTCTCCTTCCCGCCGCCCCGGGCCGGGGCCGGCCCTCTCCCGAGCTCAGAGAGTAAATGTAAGTAGCACATGTGATGTCATTTGTTTTCCTTTTTTAATGCAAGATTCCTCGTTGTCCAGATAAACTTCGGATGTTCCTTATGTTT +>ENST00000494884 +CCAGCTTTTCCACGGCCACGCGGACAGTCCTGCCAGCTTTGTGCTATCTGCACCAATGTCACTCTGCAGCACCCGCGTCTGTGGTGTGTTCCTGGCGACGGGGGTGTATTCATTATTAACTGAAATGTCTCATCTGCAGTACAAGATTCTGCTGTACTCATTGGATGGCCGGTTGTTGTCCACGTACAGCGCTTACGAGTGGTCCCTGGGCATCAAGTCTGTGGCCTGGAGCCCCAGCAGTCAGTTCCTGGCAGTTGGGAGCTATGATGGAAAGGTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCATTAATGATCCCAAGATAGTAAGTCTGGAACACGTGTTTCTGCCTGAGCAGGCTGTTGGGGAGGGCGGTGGGAAACTGCTCCTTCACTTTGCTTTCTTG +>ENST00000465916 +TCCCCGATCGCTCTCCCCTCACCTCCCAGCTTCGGAGCTGCGAGCCCAGGCTTCCTGTGTCCAGTACCGGTTAGTGGTCCGGGATGTGAACACCCTTCAGATCCTTCAGCTGTACACGTGCCTAGACCAGATCCAGCACATCGAGTGGTCGGCAGACTCGCTCTTCATCCTGTGCGCCATGTACAAGCGAGGGCTGGTGCAGGTCTGGTCTTTAGAGCAGCCCGAATGGCACTGCAAAATAGACGAGGGCTCAGCCGGGCTGGTGGCCTCGTGCTGGAGCCCGGACGGGCGCCACATTCTCAACACCACGGAATTCCATCTGCGGATAACCGTCTGGTCCTTGTGCACAAAATCCGTGTCTTACATCAAATACCCGAAAGCTTGTCTGCAGGGAATCACCTTCACCAGGGACGGCCGCTACATGGCGCTGGCAGAACGGCGCGACTGCAAAGATTACGTGAGCATCTTCGTCTGCAGTGATTGGCAGCTCCTGCGGCATTTTGATACGGACACCCAGGATCTCACAGGGATTGAGTGGGCCCCAAACGGCTGTGTGCTGGCAGTGTGGGACACCTGCTTGGAGTACAAGATTCTGCTGTACTCATTGGATGGCCGGTTGTTGTCCACGTACAGCGCTTACGAGTGGTCCCTGGGCATCAAGTCTGTGGCCTGGAGCCCCAGCAGTCAGTTCCTGGCAGTTGGGAGCTATGATGGAAAGGTGCGCATCCTTAATCACGTGACTTGGAAAATGATCACGGAGTTTGGGCATCCTGCAGCCA +>ENST00000419924 +GCTGCGCGCCCAGGGGTCCCGCGGGTTTTCGGGCGCAGGGTGGCGCCCGCGGCAGGCGGCGGCCATGAACTTCTCCGAGGTATTCAAGCTCTCCAGCTTACTCTGCAAGTTCTCCCCGGACGGCAAGTACCTGGCTTCCTGTGTCCAGTACCGGTTAGTGGTCCGGGATGTGAACACCCTTCAGATCCTTCAGCTGTACACGTGCCTAGACCAGATCCAGCACATCGAGTGGTCGGCAGACTCGCTCTTCATCCTGTGCGCCATGTACAAGCGAGGGCTGGTGCAGGTCTGGTCTTTAGAGCAGCCCGAATGGCACTGCAAAATAGACGAGGGCTCAGCCGGGCTGGTGGCCTCGTGCTGGAGCCCGGACGGGCGCCACATTCTCAACACCACGGAATTCCATCTGCGGATAACCGTCTGGTCCTTGTGCACAAAATCCGTGTCTTACATCAAATACCCGAAAGCTTGTCTGCAGGGAATCACCTTCACCAGGGACGGCCGCTACATGGCGCTGGCAGAACGGCGCGACTGCAAAGATTACGTGAGCATCTTCGTCTGCAGTGATTGGCAGCTCCTGCGGTACAAGATTCTGCTGTACTCATT +>ENST00000479331 +TGCGCGCCCAGGGGTCCCGCGGGTTTTCGGGCGCAGGGTGGCGCCCGCGGCAGGCGGCGGCCATGAACTTCTCCGAGGTATTCAAGCTCTCCAGCTTACTCTGCAAGTTCTCCCCGGACGGCAAGTACCTGGCTTCCTGTGTCCAGTACCGGTTAGTGGTCCGGGATGTGAACACCCTTCAGATCCTTCAGCTGTACACGTGCCTAGACCAGATCCAGCACATCGAGTGGTCGGCAGACTCGCTCTTCATCCTGTGCGCCATGTACAAGCGAGGGCTGGTGCAGGTGTGTGCTGCCGTGTCGCTTAGAATCTGGACACCTTCTGAGGGCCCCTGGGAAGGAGGGGTTTTGTTCTGTGCCTTTCTAGTTTGAAAAAAAAGTCCGTGCAGCTCAAAGCCAGTTTTCTTTTGAAATTATAACGTTCTCTAAAGTTTAAGAACATTTAAA +>ENST00000377837 +CGCGGGGACACTCGTGCGACTGGGGCAAGGTGCCCAGGGGCTTCTCTCCTAATTTGCCTCACGTAACAGTTGAGACCCCAGAGGGCAGCAAAACTGGGTTCGAATTGGAGAGCCGTCCAGGCACAGACAAATTCATTCATCTGCCCAGTGCCCGCTAACTGCGGTTCCAGGCGCCGGCGACGCAATTCCAGAGCTGCCACCGCTTCCCCGCGGAGCATGGGGCTGCCTCGCCGGGCAGGGGACGCGGCGGAGCTGCGCAAGAGCCTGAAGCCGCTGCTGGAGAAGCGCCGGCGCGCGCGCATCAACCAGAGCCTGAGCCAGCTTAAGGGGCTCATCCTGCCGCTGCTGGGCCGGGAGGATGCTTCTGGCTGGCACACCTGGCTTCCCCTCCATGCTCAGAACTGCTTCCTACTCTACATCCAGGCTCCTGAGCAGCCCCCAGCTTAAGCTTCAGCAGCTCCAGGGTAAATCCATCTCCGCCCAGAGCTGACTCCGGATCTGCCCCAGTGACAATAACAAGATAAATGCCTTCCATTCTCTTCGTACTTACAGGATGTAATCCACATATTTACACAGTGTTTCATTTGCGGTAATGTTTGTTTTGTTTCTTGTTCCTTCGTACCTATCTGGGAAGCCTGTGCAATTCAGATGTCCAGGCCCACTTCCAGAAGTTCTCATTCCCTGTGCTTGAGTCAATGGCCGCAGACCATACACCTGAGAGCAAGTTAATCTGCTCTAACAAAGATATCACATCTAAGAATGGTGGTTGGCAGGGGCTGGGGGGTGGGAAGAATGGGGAGTTGGTGCTTCATGGGTACAGAGATTCAGTTTTGCAAGAGGAAAAGAGCTCTGGAGATGGATGCTGCTGATGGCTACACCGCAATGTGAATGTGCATGATGCTTAAATATGGTTAAGATGGGCCGGGCGCGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCCGAGGCGGGCAGATCACGAGGTCAGGAGATCGAGACCATCTTGGCTAACACGGTGAAACCCCATCTCTACTATAAATACAAAAAATTAGCCGGGCGTGGGGGCGGGCACCTGTGGTCCCAGCTACTCGGGAGGCTGAGGCAGGAGAATGGCATGAACCTGGGAGGTGGAGCTTGCAGTGAGCCGAGATCACGCCACTGCACTCCAGGCTGGGCGACAGAGCGAGACTCCGTCTCAAAAAAAAAAAAAAAAAAAAAA +>ENST00000377836 +CCCGGGCCGCGCCCGGGACCTCATTTCGGACCTCGGTTTCCCTTTGCGTGGGGCTCGCAGCTGCCACCGCTTCCCCGCGGAGCATGGGGCTGCCTCGCCGGGCAGGGGACGCGGCGGAGCTGCGCAAGAGCCTGAAGCCGCTGCTGGAGAAGCGCCGGCGCGCGCGCATCAACCAGAGCCTGAGCCAGCTTAAGGGGCTCATCCTGCCGCTGCTGGGCCGGGAGGATGCTTCTGGCTGGCACACCTGGCTTCCCCTCCATGCTCAGAACTGCTTCCTACTCTACATCCAGGCTCCTGAGCAGCCCCCAGCTTAAGCTTCAGCAGCTCCAGGGTAAATCCATCTCCGCCCAGAGCTGACTCCGGATCTGCCCCAGTGACAATAACAAGATAAATGCCTTCCATTCTCTTCGTACTTACAGGATGTAATCCACATATTTACACAGTGTTTCATTTGCGGTAATGTTTGTTTTGTTTCTTGTTCCTTCGTACCTATCTGGGAAGCCTGTG +>ENST00000471190 +TGACTTGCATTGACCTGGCTCCAATCAAGCTACAACTCAAGCAGTCACGGGGAGAAGGATTGTAGATGGGCCAGTGACTCACAGGGTCAGGCACTCGGGGGAGCCTGAGTCAGGAGGATGCTTCTGGCTGGCACACCTGGCTTCCCCTCCATGCTCAGAACTGCTTCCTACTCTACATCCAGGCTCCTGAGCAGCCCCCAGCTTAAGCTTCAGCAGCTCCAGGGTAAATCCATCTCCGCCCAGAGCTGACTCCGGATCTGCCCCAGTGACAATAACAAGATAAATGCCTTCCATTCTCTTCGTACTTACAGGATGTAATCCACATATTTACACAGTGTTTCATTTGCGG +>ENST00000377834 +ACTCGTCTGGCACCAGCCCGGGCCGCGCCCGGGACCTCATTTCGGACCTCGGTTTCCCTTTGCGTGGGGCTCGCAGCTGCCACCGCTTCCCCGCGGAGCATGGGGCTGCCTCGCCGGGCAGGGGACGCGGCGGAGCTGCGCAAGAGCCTGAAGCCGCTGCTGGAGAAGCGCCGGCGCGCGCGCATCAACCAGAGCCTGAGCCAGCTTAAGGGGCTCATCCTGCCGCTGCTGGGCCGGGAGAACTCCAACTGCTCGAAGCTAGAGAAGGCAGACGTCCTGGAAATGACCGTGCGCTTCCTGCAGGAGCTGCCTGCGTCCTCATGGCCCACGGCAGCGCCCCTGCCTTGCGACAGCTACCGCGAGGGCTACAGCGCCTGTGTGGCGCGCCTGGCCCGCGTGCTGCCCGCCTGCCGTGTCCTGGAGCCCGCCGTGAGCGCGCGCCTGCTGGAGCACCTGTGGCGGAGAGCGGCCAGCGCCACCCTGGACGGCGGGCGCGCTGGGGATTCCAGTGGCCCGTCTGCCCCCGCCCCAGCGCCCGCGTCTGCCCCAGAGCCCGCATCCGCTCCGGTGCCCTCGCCGCCCTCGCCTCCCTGCGGCCCTGGCCTCTGGCGGCCGTGGTAGCCCCTCGGCCGATCCACAGACCCTGCCGACTGCTTGGGACCTTGGGGCACTGGACAGGTTGAAGCTCTTGGTGGCGGCTGCTGTTCCCATCATTAGGGGCCAGCCCAGTACCCACACCCAGGCCGGAAGCCGGCTGTTTGTGACTGGCGTGGCAGACTGAAAGCCCTGGGGCTGGGGCTCGGCTCAGGGAATAAAAGGAGCGTCCCTGCTTCACCCCCAACTTGGCTGGAGAAGAAAGGACAAGAGGCAGCAGGGTGAAGAAGAAGCCCCCCATCCCAGCTGGTGGAGATAGTTCTGGAACTGGACCCCGCAGCTGCGTGGGCAGCCGACACACCCACCCCAGCACTGGCACCAGACCAGAGCCAGAGCCAGGACCTGGGCAAAGTGCAGCCGTGCACCCTGCCTGGTCACTGCTCTCCCAGCCCTGCCTGGGCCTACCTCCTGCCCAGCTCTGCTTGGGACCCTCTGGGCATGCAGCAGCAGTAGCCTAAGGGCTCTGGTCACTTCCAGGGCTCTACAGGGCAGCAGAGCAGAGCAAAAGGGTGCATATGCTGGGAGCTGTCACCTCCACTCCTAGGCTTTTCTGCCTAGAGCAGAATTATAGGGGCAGTATACATCCAGGGGTCTGTGCGGTGGGGCTGGGGGATTCCTTAAGTGACTTTGGGAAGGATTTGTTTTCCCGAGCATCAATTTCACACCTGGGCATTGCACCCCAGGCTATGCAGTCTTTCAGTGTGAGGAAGGGGCAGAACAAGAATGAGGCGGCCCCGTGGCCTCAAGGAAGCTTGTGGCTTTGGAGGATCTGACTCCAGCAGAGTCTGTGCCAATGTGGGGTGAGCAGGGCCCCTGCCATGGAGCAGCAGGAATTTGAGGGATGGAGCAGGTTAAAGAATGGGAAACATCTTCACTTGTTTTTTTTTCTTGCAAACTACTCCCTGCTACTCATTGAGACTGGTTACTGGAAGCAACTTGTTAAGATTTTTCTTTCTGGGCGGGCGCGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCCAAGGCGGGTGGATCACCTGAGGTCAGGAGTTCGAGACCAGCTTAGCCAATATGGTGAAACCCCGTCTCTACTAAAAATACAAAAATTAGCCGGGTGTGGTGGCATGTGCCAGCTACTCGGGAGGCTGAGGCAAGAGAATCACTTGAACCTCGGAGGCTGAAGTTGCAGTGAGCCAAGATTGAGCCATTGCTCTCCAGCCTGGGTGACACAGCAAGACTCTGTCTCAAAAAAAATTTTTTATTTCTTTCTTTTCCATGGAGGCCTAGAGTCCCTGTGAAGGCTAGGAAGGGGCTGCTGATCCCAGGAGTGCCCACGAGGAGTGGGGGGCACTGTTGGCCCATAATCAGGCAAACACCCATCATTTCATGGGGGATTCATGAAATCATAGTCAGGCAAACACCCGTCATTTCATGGCTAAGCATTTGCAGAAGGTGGAGGATTCTCCCCCGAGTCCCCAAATCAGCAGCCTGTGCTAGGGACCAGAGCACCGGGGGCAAGAAGACAGAACCAATGTGGGAGTGGGGATGGTCACTAAATCTGACTGTGCCACACAAGCCCATGATGACCTTGGCACTGGTTTGGGTGGCAGGATATGAAGGAAGCTGTAGGCATTATTGAAAAAATCATTGTTCAGCCAACAGGGTGAGGCTCCCAGCAAGGCCGTGCCATCTTCCCACCTCCCTGTGCCCAGAGGGTTAGACTGTAAGCTCCCGGAGGGCGAGGCTGGGGCTGAGCGTGCCTCCACGTCCCCAAGGCACAGGGTGCACAGTGGGTGCTCACTGAATATAGTGGACTAGTGAGCAGAGGATGAGAGGACTACCCTGTAATGAGCCTTGGACAGTCTGGCATTTGCCTTAACTCCCACTCCCATGCCCTGGGATCACTGTTGGATATTTACTCCATGAGGACAAATACTGGGGAGGTGTGGAGAGGAGGGAGGGCAGGTTCCTCTTACTTTCACCCATTGCTGAGAATGAGCGCCTGTTGGCACTGCCTTTGTGAGCCTCCGGGAGCAGGTAACCTGCGGCCCAAGCCCGCCTAGGACTCCACATCAGGCAGGCACAGGACTGGCCCCTTGTCCTCATAAAAACTCTCAGTACAGCTTAAACTCTGTAAGATCTAACCAGCCAGGAGGACCCTCGCTTCCTCTCCGCCATGCTTGCCACCTCTTGCTTCTGAGAGTCCATCTCAGTTCGCAGTTCTGTGACTTGCATTGACCTGGCTCCAATCAAGCTACAACTCAAGCAGTCACGGGGAGAAGGATTGTAGATGGGCCAGTGACTCACAGGGTCAGGCACTCGGGGGAGCCTGAGTCAGGAGGTCAGTGGGCCCTGGAAGGGAGGGGGCAAGCCTGGGTGGGTAAGGTTCTGGGCCCCAGGCAAGAAGGCAGAGTTTCTCCGCAGGGGTGTGTGCAAGAGCTAGCTGCGCAGAAGGTCTCCGCTGGCTCTCCAAGCCGGGCTTGTGAAATAGGAACGCCAACATCCTCCTCCACAGGCAGTGGCAGGCACCTCCTCCTCAGGTGCCCCCCAAGCCCTATCTGATGGGCAAAGGTGAACGCAGGGCGGTGGGCTTTTCCTGTGCAGAGGGAGACTGATTCAAAGGGTCATTTATGACCTTTCACAAGTCCCACATCCTGCCCAATGGCCAGGTCTTGGGATGCTGTTGCAAGATGGTTCTGTGACTCCATGTGACTGTCTGATGATTGCCCCAGCTGGGGAAAAGGCTCCCATGTCTCTTTCTCATAAAACCAGTGGGCAAGGCCGGGCGCAGTGGCTCACGTCTGTAATGCCAGCACTTCGGGAGACCAAGGTGGGCGGATCACCTGAGGTCAGGAGTTCAAGACCAGCCTGACCAACATGGTGAAACCCCGTCTCTACAAAAATATGGAAATTAGCTGGGCATGACGGCGGGTGCCTGTAACCCCAGCTACTTGGGAGGCTGAGGAGGGATAATCAGTTGAACCCAGGAGGTGGAGGTTGCAGTGAGCCGAGATCGCGCCACTGCACTCCAGCCTGGGTGACAGAGCAAGACTCCATCTCAAAAACAAACAAACAAAAAACTAGCGGGTGAAATGATTCAGTGACCTAAGGACAGCCAGAGCACTAAGCTGCTGGGAACCCATCTGTGCTGAAATGTAGATTTCCCAGGAAACTCAGGCTTGGGACAGGCGCCTACCTGCTCCTCGGGCACCAGGTGATTAGGAGAGGTCGAATCTCATTTCCACGTGAGTGAGGATAAAGACTGGGCTGCCAAGGAGGACTCCTCATAAACATTGACAAATTGCTCTGCCCCGCCTGTGATCCCAGACGACTCCTGCAGTCTGGGATCCTGAGTGTCCTGTGGGTTCATCTCGGATGGGCGCTGCATAAACAGCCTGCAGGGAACGTCTGGGAGAACCAGCTTCACAACAGATATAATAAGGAAGAAGTTTGAAATATTGCAAGAATTGCGAAAGTGTGACACACAGATACAAAGTGGGCACATGCTCGTGGGAAAATGTTGCCAATAGACTTGCTTGACTCTGGAGTTACCCCGAACCTTCAATTTGTTTAAAAAAAAAAAAAGGCAATATCTTGACGTGCAATAAAGTGAACTGCAATAAAA +>ENST00000487437 +CCAGCCCGGGCCGCGCCCGGGACCTCATTTCGGACCTCGGTTTCCCTTTGCGTGGGGCTCGCAGCTGCCACCGCTTCCCCGCGGAGCATGGGGCTGCCTCGCCGGGCAGGGGACGCGGCGGAGCTGCGCAAGAGCCTGAAGCCGCTGCTGGAGAAGCGCCGGCGCGCGCGCATCAACCAGAGCCTGAGCCAGCTTAAGGGGCTCATCCTGCCGCTGCTGGGCCGGGAGTGCCTTGCGACAGCTACCGCGAGGGCTACAGCGCCTGTGTGGCGCGCCTGGCCCGCGTGCTGCCCGCCTGCCGTGTCCTGGAGCCCGCCGTGAGCGCGCGCCTGCTGGAGCACCTGTGGCGGAGAGCGGCCAGCGCCACCCTGGACGGCGGGCGCGCTGGGGATTCCAGTGGCCCGTCTGCCCCCGCCCCAGCGCCCGCGTCTGCCCCAGAGCCCGCATCCGCTCCGGTGCCCTCGCCGCCCTCGCCTCCCTGCGGCCCTGGCCTCTGGCGGCCGTGGTAGCCCCTCGGCCGATCCACAGACCCTGCCGACTGCTTGGGACCTTGGGGCACTGGACAGGTTGAAGCTCTTGGTGGCGGCTGCTGTTCCCATCATTAGGGGCCAGCCCAGTACCCACACCCAGGCCGGAAGCCGGCTGTTTGTGACTGGCGTGGCAGACTGAAAGCCCTGGGGCTGGGGCTCGGCTCAGGGAATAAAAGGAGCGTCCCTGCTTCACCCCCAACTTGGCTGGAGAAGAAAGGACAAGAGGCAGCAGGGTGAAGAAGAAGCCCCCCATCCCAGCTGGTGGAGATAGTTCTGGAACTGGACCCCGCAGCTGCGTGGGCAGCCGACACACCCACCCCAGCACTGGCACCAGACCAGAGCCAGAGCCAGGACCTGGGCAAAGTGCAGCCGTGCACCCTGCCTGGTCACTGCTCTCCCAGCCCTGCCTGGGCCTACCTCCTGCCCAGCTCTGCTTGG +>ENST00000489730 +TCGTCTGGCACCAGCCCGGGCCGCGCCCGGGACCTCATTTCGGACCTCGGTTTCCCTTTGCGTGGGGCTCGCAGCTGCCACCGCTTCCCCGCGGAGCATGGGGCTGCCTCGCCGGGCAGGGGACGCGGCGGAGCTGCGCAAGAGCCTGAAGCCGCTGCTGGAGAAGCGCCGGCGCGCGCGCATCAACCAGAGCCTGAGCCAGCTTAAGGGGCTCATCCTGCCGCTGCTGGGCCGGGAGAACTCCAACTGCTCGAAGCTAGAGAAGGCAGACGTCCTGGAAATGACCGTGCGCTTCCTGCAGGAGCTGCCTGCGTCCTCATGGCCCACGGCAGCGCCCCGTGAGTGAGCCCTCCCTGCCCTGCCGCGCGCTCTGCACCCCGCACCCGGCACCCTACCCCGCGCCTCACGCGGCTCTCCGCCCGCAGTGCCTTGCGACAGCTACCGCGAGGGCTACAGCGCCTGTGTGGCGCGCCTGGCCCGCGTGCTGCCCGCCTGCCGTGTCCTGGAGCCCGCCGTGAGCGCGCGCCTGCTGGAGCACCTGTGGCGGAGAGCGGCCAGCGCCACCCTGGACGGCGGGCGCGCTGGGGATTCCAGTGGCCCGTCTGCCCCCGCCCCAGCGCCCGCGTCTGCCCCAGAGCCCGCATCCGCTCCGGTGCCCTCGCCGCCCTCGCCTCCCTGCGGCCCTGGCCTCTGGCGGCCGTGGTAGCCCCTCGGCCGATCCACAGACCCT +>ENST00000635687 +GACCCCTCCCCCGCACCGACGTGATTCGGATCGCGCGGTGCTGGCGCCGCCTTCATGCGCCCTGCCTGGCCCCCACCTGGTCCTCTTTCCTTTTCAGGTGGAGGAGATGCCGCTGTCCCGTCGGTCTGGGGACAGCCCAGCTCCCCGGATCCCGGGCTGGAGAGACGCGTCGCGGCCCCGGGGCCTGGTGGCACGAGCAGGAAGGAGGACCCGGCGGCGGGCTCTGCCTGGGCTTGCCTGGGCTTGTTCCGAGCCGGGCTGCTTCTCGGTGACCACGCAGATCGGGGGCATTTGGAGATTTTGCGGGAGTCCTGCAGCCAAGCTCCGGGGCAGGAGAGGCCTGGAAGCCTGCACTACCTGCTCGCCCCGTCCCAGCATGCACCCAGGTGCTGGGGAGAGGCAGGACAGGCCTGTCCCCCGAGTCCCCTCCGGATGCCGTGGACCGGCCAGCTGTGAGTGTTTCTTTGGCAGTGTCTTAGCTGGTTGTTGTGAGCAATAGTAAGGAAGCAATCAGCAAGTATACTGCCCTAGAAGTGCTGCACGTTGTGGGGCCCAAGAGGGAAGATGAAGCGAGAGATGCCCAGACCAGTGGGAGACGCCAGGACTTCGGAAGCTCTTCTGCGCCACGGTGGGTGGTGAGGGCGGCTGGGAAAGTGAGCTCCAGGGCCCCAGGAGCAGCCTGCTCGTGGGTGCGGAAGGAAAAAGGCACAGGGGCTTGGTGTGGGCGGCTTTTGGCTGGGAGAAGTTTGCACGTAGGGAGAATAGTAGCCAGTGTTTGCAGAGCACTTACTATGCAGGAAGGCCTGTCCTAAGTATTGTAAGTGTATTACATCATGTACAAGTGTCTGTGATTAACCCCGTCTTGCAGAGAAGGAAACAAAAGTACAAACAGAAAATGTAACTAAGCATGCAATTAATAAAAAGGGACCAGGTTTTGAACGCGAGCAATCTGGCTCAAGAATCTGCGCCCAACCACCGGCTCCTGTTCTTAGAGATGAACGTGGAGTCCTGGAGACTGCTCAACATTGTGACTTGACTGTGAGCGTACGCGCTCCCTGTCCCCAGGAGACAGATTTCCAGTGCAATCATAGAAAGTGCCTGTGTGGGCTTCGGGAGATGTGTCTGCCTTGGGGAGAATTTTCCTTTTCAGCTAGAGCCAGGCCCAGGATGTTGACGTCAGTGAGACGCTGGTGACGTTCTCTGCTCCAGTGGCTGATGAGAAAAGTTCCTCCAAGCCAGCTCAGTTGAGAAGAATTAAGTTCTCTGGGTCCCACTGGCTTCACCTACAGATGCCAACTTTGAGGCCAGTGAACTGTGAGGCCAGCTGGGCTGATTGCCATGGCAACAGGAATTGGACCAAAGTCACCGGAGGATGGAGAGGGAAGACACAGTGGTGGCTTCCCCAGGTCTTGGACCACAAGGCACAGCCGTGGCCTCCAGGAACCCTGAGATAACCCGTTAGTGGGTCCTGCACTCCAACAGAGCTCATGCAATCAGCCTCTGGTCCTCACCCTCCTCCCATTGGTGTCGTTGTGCTCTCTAACATTGACATTGAGCAGTGAGTGCTCCAGATCTTGTTCCACTGATTTTTTCCACTGTTCTCCAGTCTAGCACTTTCTGAAATTCATCCAAGCCTAAGAGGTGACGCCAAACGTAAGTGTCTTACACCTCGGACCCCATGGACTAAGACAAGCCTCTGGGGTCCATGTGGCACCAAGGATGGGGCCTTCTAGTACCTTTCACACAGGCCAGGGACAGCACCTGCTGCGACCCCCACCCCCAGCCTCTGCTGCTTCTCCCGTTGCCCTTCCAGCCACTGCCCTGGGCACCTCCCCTGCTCCCGCCTCCCTGCCTGGGCCCATCTTTCTTTGCACCTCACCAATTGCGGGGCTTCCTAGTGCTGGAGGGGAAGGGAGCCTGCTTCCATTCTCACCACTCTGAAAGAAGACCCTGCAGAGAGGTTTTCTGGAATTTGGAGCCTAACCTTGGCCTTGACACAGTCCAGATGAGAAGGCCGTCCCCCAGTTAAGCCAGCCCTCCCTCCCTCTCAATGCTGGAGAGGAAACCAGGCAGCTGGTTGCTTCAGCAAACCCCCTCCCTATGGGAATTGTCCTTTTCTTCCTCAAATAGACTGGAGTGCAGAGGACTTGCTTCAGAGAGAGCCCCTTTGTAACGCACATTGCACGGGCCGTGCCCCATGCCCACTCTGCCACAAACTCCCCTCAGCTGCCCAGCCCCGTGGAGCCAGGCGTGGGCTGAAGTGGGGCCAATGAAATGCCTGGAATGCCAGCCGCAGTGACAGGCCAGCACTCAGATGCCTCTCGGGAGTTCTGACCGAAGCAGCACTGAGGACTGCTTCAGAGCAGAAGTCTACGCCATTTTCCCCAGTTCTAGGCAGAAGTAAAGAATGTCTCTACCTTCTCCCAACCAGCAATTGATTCAGAGTCCTGAGCTTTTAAATTAAAGGGACCCCTCTGTTGCTTTATGCAGTAGCCAGCTTATTCATTTGAGTTCAGGTGAAATCATTTTCAAGTAACCTCTTCCTATCCAGCTTTACTTTTAGTTATGCTGACATAAAAACAATAAAAATTGTCCTCCTCAGAGTTCACCTGTAAAAGTTCCTGGATAATTAGTAAGGAAACAGAAAGAGCAGATAGTTGTTGCTTCAGATAAAAGTGATGTCTGGGTTGGGCACGGTGGCGCATGCCTGTAATCCCAGCACTTGGGGAGGCCCAGGTGGATGGATCCCTTGAGCTCAGGAGTTTCAGACCAGCCTGGGCAACATCTCTACAAAAAATACAAAAATTAGCCAGGCATAGTGGCAGGACTGTAGTCCCAGCTACTCAGGAGGCTGAGGTCAGGGGATGGCTTGAGCCCAGGAGGCACAGATTGAAGTGAGCTGAGATTGCGCCACTGTATTCCAGCCTAGGTGACAGAGCCAGACCCTGTCTCAAATTAAAAAAAACTCTTTGTGGTCATTTAATTTACTTCTGCATTCTTTTTTTTTTTTTTTTGAAATGGGCAGTGGTACCATCTCAGCTCACTGCAACCTCTGCCTTGGGGGTTCAAGTGATTCTCCTGCCTCAGCCTCCCGAGTAGCTGGGATTACAGGCACCCGCCACCACGCCCAGCTAATTTTTGTATTTTTAGTAGAGACGGGGCTTTGCCATGTTGACCAGGCTGGACTCAAACTCCTGACCTCAGGTGATCCGCCCACCTCGGCCTCCCAAAGCACTGGGATTACAGGAATGAGCCACTGCACTCGGCCTACTTCTGCATTCCTTAGAGTACATCCTAGCTAGGATATATTCACTTGTCTTTAGAGCTAACAGCAGAAGAAAGGTACCTAGATGCTTATCTAGCTCTTTATCTTTCTAGAAATTCTAGAAGATGAGAGGGGCAGTGGTGGCTCCAAGGGAGTGATTTTAGGATGGACTGGGACAGAGAGGGGCTGCTTACACATACTCACACAGAGGCCATTAATTTAGGGAGTTCAAGGTCCAGGAGGTTGACGGCATCTAGGCCTGTGGCAGAGTGCACTCCTGCTTTGGGGAATGTATGGGCAGCTTCTTGCCTGTAGTTGGAGGGTTAGAGAGAGGGATCAATAATTTCATGGTTGGACTTGAGTTTGGAGCGAGTGGAGTTAGATACAAATTCTATGTTTTTGGAGAAAGTATTTGATCTTCTTGGCTGTGAGGCAAAGCGAGGTTTAAAAATATTTTTCACTTAAAAATATATATATATGCATGTATATTTAATACTGTCTATGGATTGTGCCAATATCTATTTCATGGTTTTGATATTGTGTAGTTATACAAGGAGTTACCACTGAACGAAACTGGGGGAAGGGTACACAGAATCTCTGTACTTTTTTTGTTGTTGTTGCAATTTCCTGTAAATCTATGATTATTTTAAAATAAAAAAGTTAAAGCATACGTATTTACATTTGATTAAATGCAGTGTGATATCCTGGGTTGGATTTTGGAACAAAACAAGGCATGAGTGAAAAAACTGGTAAAATCCAAAAAAGCCTTTAGTTAAAAGTAATACCAGTGTTAATTTCTTAGTTTTGACAAATGTGCCATGGCTGTGTAAGATGCAAATGTTAGAGGAAACTGGGCGAAGAATTTGAGGGAACTCTCTGTACTATTCTTTGCAGCTTTTCTGTAAATCTACAATTATTCCAAAATAAAAGTCTATTAAAAATGTAA +>ENST00000385130 +GGCCAGCTGTGAGTGTTTCTTTGGCAGTGTCTTAGCTGGTTGTTGTGAGCAATAGTAAGGAAGCAATCAGCAAGTATACTGCCCTAGAAGTGCTGCACGTTGTGGGGCCC +>ENST00000635405 +TTCATTGGAGTTGAGGGCTCGGAGCAGCAGGCAGCCTTCCCCGTGGGAAGGATGACAAATGGGGAGTGCTGCTTCTAGGTGCTCGTACCAACTGGCTTCGTGCGTCCTGGGATGGGCGGTGTTCACAGGCGCTTCGGGGCTGAGCGCCCACCAAGTGTGGCGCGCGCTTTTGGGAAACTCCGTGGAAGACCAGGACGGACCCCTGGAGGGTTAGGAAGACTTTGAGACCAGCCAGGGGAAGCCGTGTCCCGGGCCCTGACTGTGGATCTCCTACTCTGAACCACGGACTCCAGTTTGGAAGGCCAGGCTGCCTTTCGGATTGGGGGGTAAGGAAGGGATCCCCAGCTCAGGCAGCCTTTTGGGCTAGGGCAAGGGGACCTCTGGAACCACATTTTTGAATGCTCCCACCCATGATTTCTGGGACAGCTACTGGAGACAAATAGAGGCTCGAAGGTGTCGGGAGAAAGGCTGTGTTCCTGATGTCATGTAGTTGAACTTGGATGTGGAGGAAGTCCAGCTTCCCCTGCAGAGTAAAACCAAGCCAGCGAATGTGGGTGGGGGCCAGCAGCTGCCGACCCTCCTGGGTGATGTGATGGGCTTAGGTGGTAGGAGCCAGGGGCCTGGGGCCAGAGAGGGCAGCCCTAAGGGGGTCTAGACAGCACCTTCTGCCCAGAATGGCAGCCTTTGGTACAAGTCTTTATTTATGCCAGTGGCATGAAAATGTCGCCCGATGAATCCCCAGGGGCCCGTTCTTGGCAAAAGCCCTGTCTCCCAGCAAGATGGGAAGTGATGTCACATTGCACTCTCCAGCCCGCTCTTCTGGGGTTGTTCGAGTTGTGAGATGGTTCGGTGACTGATGCCTCTCATTGTCCCAGACCTTGTGCTTCCCCTGGGAGACCCTCCACCCTGGTGGTTGCTTTTTCCTGTCCCCATGCTTTAGCTTGAGCATCTCCACCGTGGAGGCTGCCCTTGGAGGCTGCACTGTGCTGGGAGGAGAGGGAGACTGGAGAGGGAGAGGAGGAGGAGATGGCAGGGGCAGTGGGGCCCTCAGAGCTGGTGCAGTACTGTGCTGATGTCATCACTTTTGGGGGCCTGCTGAGGCCTGTGGCTGCTCCAGAATCGACACCAGGAGCCTCTTGCTCAGCCTGGGACAGGCACAGCATTGCGGCTGCCAGTCTCCCTGACAAGGACAAGACCTGCACCTTCCAGGCAGAGCCAACTGGCCAGCTGAGGTCCTGCGACTCCTGCAGGGATGAAGGTATAAGGAAAAGGTGAGGGCCACGAGAACCGGCAATGGGACGCTGGCGGGGCTCACCTGGCAAATTGGCAGCACCAGACTCCGGAAGAGAGGGAGCAGAAGGGAGGCAGGCCGGGGACTGCAGAGAAAGGCGCCAAGGCACTGGCAAGATCCTAGCGCCTCAGATCCTGACCGTGGCACCTCCCCACCGACCATTTTCACTTTTCACCCAATGCAGTCGGTAGTTTGCTCTGCGCTTCTCATTCTCAGCAGTTCTGATTAAAGATCAGATCCCATTTTCCTTTTATGCCTTTAAACTTTAAGCCTGGCCACCCAAGACAAATGCTCTATTCAAAGCTGGAAGATACTTAGAAATCATCTGTTACAAGTCCCCAAGCTCAGCGATGAGGACAGTGAGGCCCAGAGATTAACCGACTTTCCCAAGGACACAGGAAGCTCAGGGCAGACCTGGGATTCCCTGGGACATGTGGGACACGGATGAGATCATCAGCGCTCAACCCATCAGGCATCCTGACTCAGATGCAGTAGGACAAGGTGGAGGAGATGCCGCTGTCCCGTCGGTCTGGGGACAGCCCAGCTCCCCGGATCCCGGGCTGGAGAGACGCGTCGCGGCCCCGGGGCCTGGTGGCACGAGCAGGAAGGAGGACCCGGCGGCGGGCTCTGCCTGGGCTTGCCTGGGCTTGTTCCGAGCCGGGCTGCTTCTCGGTGACCACGCAGATCGGGGGCATTTGGAGATTTTGCGGGAGTCCTGCAGCCAAGCTCCGGGGCAGGAGAGGCCTGGAAGCCTGCACTACCTGCTCGCCCCGTCCCAGCATGCACCCAGGTAAACGCTTGTGTTTCTCAGTCCGTGCGAAAGTTTGCAAAGAAGGAGGCGGGAACTAGACCAACAACTTTAATAATCATAGTCATAATAATGAAAACCCTGTTCAATTGTGTAGCCTCCGTAAGGGGAAGAATTTCCAAGAAGCAACAAAATGTTCTTTGATTTCATAATCTCTGGGGAGAAAGGATTCCTTTTTTGGGGTTTTGCTCGGCTAGTTCTTTCTTCCCTCCTCTATCTCCAGCGTGGGGCGAGGAAGGCCGACTGGTTCATGGGTGGCAAATGGGGACCCTGGCTCTCTTGCGCTGCTGGCCACGGTGATATTGCAGCAAATGCTCAACCTCCCCAGTTCCTCTCCTCACCTTGAAAGTGGAGGCATTGATACTAGCCACCCATGGTTGCAAAAAACTCGCATGAAAGGGAAAGGAAAAGTGCTTCGGTCACTAAAGTAGCGTTGTCTAAGAGGTCAAGGCTTTGGAAGACTTTTGCTCTAGAAGAGGGGAACGGGAGAGGGGCTTTCAGCCAACCTGGCCCCGAGGTGAACGCGCGCGCCCCCTGCTGGCTGGAGCCCTGTCCAGCCTGTGAGCCGCCAGTGGGGAAGGAGACTGAGGGGAGGTGGTCCCTGGAGTTCCTTGCTCCTGGCCTGGAGCAGCAGGTGCCAGTGCTCCTGAGGCCCCCTCTCTCAGGTTACGTGGATGGGGCCTGTAGCACAGACAGGGCACATGCTTCAGCACCTCCCTGTTTCTGCGTCAGGTGGGGGACATGAGCTAGGCTCTGCAGAAGGTTCCAGAGCCTGGGCCTTCCTGTTGCATCCACACTAGGCTCCTGGAGCCCAGAGGTGGCTGGGATCTCTGCATACATGCATGTGAAACTCTAGCAGATACCAAGTCATGTTAAGGGGGCTAAACGGCCCACTGCAGTTATGTTAGCCAGTTCTGCCTCTGCCCAGTTCTGAGATATCTTTGGGACAAATGGCCACTCCTCTGAGCCCCTGTGTCTTCCTGCATGAGCCACAAATGCTGTGTAGTCATGGCTGAGGAAGAGGGAAGGTACCTGTGCTTGCAAACATTCCTCTTGAAGGACTATCCAGGAGCAGAGGGAGCAGCTGGGGGCAGCATCAGTTGGTACCTGAGCCCATTGGCACCTACTGCCACATGGGGTAGTGGCCTGTCTCCTGAGCTTCCCCAAGCTGGCCAAAACTGGCCAGGACTGCCCTGCTCTCCCCTCCCAATCCAGCTTTCTCTTGGGCCTCCAGGATCCCTTGGCTAGCTGGTGTGGTGGCCATGAGGACTGCACTTTTGCACCCCACCCCTGCCCTTGGCACACATCGCAAATCAATAATGCTAAACCTAGACAGGCCCCCAGGTCTTTCTGATCATAGCATCCATGCAGTGCTTCCCATTGATTGTGTCACCTAATTGCCAACCCAGCCCTACACCTGCCCTTGTAACTGGTCCCTGGGCCGGGGGGTGTAGGAGGATGCAAGGATGAACAAGATGCTGCCCTTGGTTATAGGATACACTACCTCCAGCTAGAGGTTATCAGATCTGTGCATAAGAAAATAACTAGGCGGGACTCATTCATTCATGCGACAAATATTTACAGAGTCCTTGCTATACGCAATGAGTCATTGAGGAGAAACCTACAGAAGGATGAGGGGGACGGCTTTTCAGGCAGAAGGGTTAGTAAGTGCAAAGGCCCTGTGTTTGGTGCATTGGAGAAATTGCAAGAAAGCGGGTGAGACTGAAGATCAACTCGTGATACTTGGTAATGAATATCACATGAAAACAAGGAAGTTTTCTTGTCTAGCTCTGAAATTTGCCTTGGTTGGCAGATCCTTCCTTCCCAGAGAGCACACATCAGTACTGCAGCTACAGCTGTCTGTCTGACATACTTGTAAGAACGAACTGTTTAGTGCAGGCTCTGGGAGGCAGTGCCATGCGGGTCACTGACATACATGGTGCCAATCATTTTTCTCCATTCGTAAGGCACCTCAGGACCCCACTGGGGCCCCAGTGTTCCAGTAAGGATACGGGTTTTGAGTTAAGGACCCGCCTTCCAGCTCCGTCTCTGTCACTAGCTGTGCTAATTTGGAAATAGGACTTCCTTTCCTGGCTTTGGTTCCTCATCTATAAAAATTGCCCTTATGTTAGGACCTACTTGGTAGACGCATGAGATAAAATAATTCGAGAATGTGCATAAACCAGGGAGCAGGGTGCTGTGGCAACTATTAGGTAGCATCAGTGATAAAGCACTTTGCTTTCATGGATATTTTATGTGTTCACTAAATCAGAACTTTCCTCTATGCTGATGTAGTCTAGTGAGGTCTGGGGAGTTTCTTGTTTGATTTTGCATTGCAAATATTCCTCTCTTCCCCTC +>ENST00000437157 +GAGGAATGAGTCCCCCGTTCTCACCCCGGGGAGCGGTTGCCTCGTGAGTCCAAGGAGAATCCGCCCTTTCGTTTTGCGCAGGTGGAGATCTCGCGGGCCCAGTTCGGAGTCCTGCAAACTGTGGAGGAGATGCCGCTGTCCCGTCGGTCTGGGGACAGCCCAGCTCCCCGGATCCCGGGCTGGAGAGACGCGTCGCGGCCCCGGGGCCTGGTGGCACGAGCAGGAAGGAGGACCCGGCGGCGGGCTCTGCCTGGGCTTGCCTGGGCTTGTTCCGAGCCGGGCTGCTTCTCGGTGACCACGCAGATCGGGGGCATTTGGAGATTTTGCGGGAGTCCTGCAGCCAAGCTCCGGGGCAGGAGAGGCCTGGAAGCCTGCACTACCTGCTCGCCCCGTCCCAGCATGCACCCAG diff --git a/pygtftk/data/mini_real_10M/expected_size.txt b/pygtftk/data/mini_real_10M/expected_size.txt new file mode 100644 index 00000000..3cf94617 --- /dev/null +++ b/pygtftk/data/mini_real_10M/expected_size.txt @@ -0,0 +1,68 @@ +ENST00000624697 788 +ENST00000624652 657 +ENST00000379389 711 +ENST00000338370 1072 +ENST00000338338 1047 +ENST00000321751 798 +ENST00000378853 875 +ENST00000489799 695 +ENST00000496905 608 +ENST00000378602 1118 +ENST00000310991 929 +ENST00000378598 483 +ENST00000470931 690 +ENST00000602604 878 +ENST00000416272 313 +ENST00000400919 1413 +ENST00000469733 2280 +ENST00000414253 2216 +ENST00000428120 2313 +ENST00000400918 811 +ENST00000497675 4478 +ENST00000378546 729 +ENST00000378543 569 +ENST00000401813 2543 +ENST00000487186 3576 +ENST00000476803 701 +ENST00000440825 855 +ENST00000420515 1544 +ENST00000514625 703 +ENST00000420964 314 +ENST00000609981 568 +ENST00000449969 5450 +ENST00000419816 4837 +ENST00000378486 4837 +ENST00000343889 6453 +ENST00000278878 3781 +ENST00000473964 6986 +ENST00000462379 2341 +ENST00000511072 4282 +ENST00000607632 581 +ENST00000378391 5447 +ENST00000514189 4236 +ENST00000270722 8690 +ENST00000512462 3723 +ENST00000463591 384 +ENST00000509860 3737 +ENST00000378389 1142 +ENST00000606170 557 +ENST00000378322 1998 +ENST00000270708 1665 +ENST00000471223 6089 +ENST00000424367 940 +ENST00000497940 1101 +ENST00000469643 563 +ENST00000494884 433 +ENST00000465916 779 +ENST00000419924 603 +ENST00000479331 446 +ENST00000377837 1222 +ENST00000377836 507 +ENST00000471190 349 +ENST00000377834 4262 +ENST00000487437 968 +ENST00000489730 730 +ENST00000635687 4211 +ENST00000385130 110 +ENST00000635405 529 +ENST00000437157 409 diff --git a/pygtftk/data/mini_real_10M/ids.txt b/pygtftk/data/mini_real_10M/ids.txt new file mode 100644 index 00000000..f78703ae --- /dev/null +++ b/pygtftk/data/mini_real_10M/ids.txt @@ -0,0 +1,68 @@ +ENST00000624697 +ENST00000624652 +ENST00000379389 +ENST00000338370 +ENST00000338338 +ENST00000321751 +ENST00000378853 +ENST00000489799 +ENST00000496905 +ENST00000378602 +ENST00000310991 +ENST00000378598 +ENST00000470931 +ENST00000602604 +ENST00000416272 +ENST00000400919 +ENST00000469733 +ENST00000414253 +ENST00000428120 +ENST00000400918 +ENST00000497675 +ENST00000378546 +ENST00000378543 +ENST00000401813 +ENST00000487186 +ENST00000476803 +ENST00000440825 +ENST00000420515 +ENST00000514625 +ENST00000420964 +ENST00000609981 +ENST00000449969 +ENST00000419816 +ENST00000378486 +ENST00000343889 +ENST00000278878 +ENST00000473964 +ENST00000462379 +ENST00000511072 +ENST00000607632 +ENST00000378391 +ENST00000514189 +ENST00000270722 +ENST00000512462 +ENST00000463591 +ENST00000509860 +ENST00000378389 +ENST00000606170 +ENST00000378322 +ENST00000270708 +ENST00000471223 +ENST00000424367 +ENST00000497940 +ENST00000469643 +ENST00000494884 +ENST00000465916 +ENST00000419924 +ENST00000479331 +ENST00000377837 +ENST00000377836 +ENST00000471190 +ENST00000377834 +ENST00000487437 +ENST00000489730 +ENST00000635687 +ENST00000385130 +ENST00000635405 +ENST00000437157 diff --git a/pygtftk/data/mini_real_10M/ids_exon_minus.txt b/pygtftk/data/mini_real_10M/ids_exon_minus.txt new file mode 100644 index 00000000..6fdda33e --- /dev/null +++ b/pygtftk/data/mini_real_10M/ids_exon_minus.txt @@ -0,0 +1,135 @@ +ENSE00001611509 +ENSE00001790281 +ENSE00001842703 +ENSE00001629775 +ENSE00001922199 +ENSE00001821535 +ENSE00001789693 +ENSE00001896016 +ENSE00001223521 +ENSE00001921648 +ENSE00001479025 +ENSE00001479027 +ENSE00001697866 +ENSE00001478064 +ENSE00001754010 +ENSE00001478051 +ENSE00001810932 +ENSE00003350147 +ENSE00003428438 +ENSE00003652520 +ENSE00003675447 +ENSE00001858191 +ENSE00001682091 +ENSE00003599669 +ENSE00003634508 +ENSE00001937932 +ENSE00001767147 +ENSE00001736550 +ENSE00003473336 +ENSE00003561172 +ENSE00003343061 +ENSE00003293243 +ENSE00001239803 +ENSE00003475992 +ENSE00001817609 +ENSE00003589214 +ENSE00001635485 +ENSE00003459358 +ENSE00003626371 +ENSE00003526713 +ENSE00001862783 +ENSE00003569320 +ENSE00003681657 +ENSE00003483048 +ENSE00001951400 +ENSE00002033745 +ENSE00003636009 +ENSE00003529933 +ENSE00001602311 +ENSE00001720216 +ENSE00003630334 +ENSE00003481862 +ENSE00003510741 +ENSE00003548540 +ENSE00003634783 +ENSE00003467961 +ENSE00001841545 +ENSE00001816369 +ENSE00003618179 +ENSE00001545345 +ENSE00001822711 +ENSE00002226200 +ENSE00001477870 +ENSE00001816144 +ENSE00001720995 +ENSE00002040955 +ENSE00003615416 +ENSE00002044438 +ENSE00001853635 +ENSE00001859055 +ENSE00002034769 +ENSE00001916683 +ENSE00001937728 +ENSE00001845014 +ENSE00001908868 +ENSE00001934415 +ENSE00001714381 +ENSE00001821386 +ENSE00001724829 +ENSE00001927358 +ENSE00001755234 +ENSE00001697450 +ENSE00001797222 +ENSE00001862304 +ENSE00003789737 +ENSE00001852362 +ENSE00001924010 +ENSE00001659258 +ENSE00001813324 +ENSE00003685083 +ENSE00003653006 +ENSE00001866903 +ENSE00003492457 +ENSE00001896684 +ENSE00003669982 +ENSE00001839399 +ENSE00003387437 +ENSE00003480267 +ENSE00003485438 +ENSE00001857368 +ENSE00000734306 +ENSE00000734303 +ENSE00001854631 +ENSE00000734299 +ENSE00001931622 +ENSE00003566716 +ENSE00003677298 +ENSE00001870155 +ENSE00001477063 +ENSE00001680820 +ENSE00001748742 +ENSE00001836154 +ENSE00001858739 +ENSE00001475277 +ENSE00001475269 +ENSE00001890428 +ENSE00001475263 +ENSE00001948071 +ENSE00001854189 +ENSE00001914446 +ENSE00000734533 +ENSE00002817476 +ENSE00001916716 +ENSE00001475267 +ENSE00001475271 +ENSE00001835288 +ENSE00001475281 +ENSE00001150483 +ENSE00003790229 +ENSE00001500136 +ENSE00003791526 +ENSE00003787977 +ENSE00001658885 +ENSE00001670416 +ENSE00003784444 diff --git a/pygtftk/data/mini_real_10M/ids_exon_plus.txt b/pygtftk/data/mini_real_10M/ids_exon_plus.txt new file mode 100644 index 00000000..1599db3b --- /dev/null +++ b/pygtftk/data/mini_real_10M/ids_exon_plus.txt @@ -0,0 +1,112 @@ +ENSE00003759395 +ENSE00003755319 +ENSE00003755395 +ENSE00001480807 +ENSE00001480799 +ENSE00003756535 +ENSE00003760003 +ENSE00001648978 +ENSE00001621165 +ENSE00001780479 +ENSE00003473982 +ENSE00003499259 +ENSE00001477669 +ENSE00001477672 +ENSE00001400676 +ENSE00001477687 +ENSE00001376863 +ENSE00001477685 +ENSE00003553212 +ENSE00003470263 +ENSE00003472793 +ENSE00003647310 +ENSE00003465003 +ENSE00003649862 +ENSE00003688902 +ENSE00003533538 +ENSE00003546186 +ENSE00003552203 +ENSE00003472855 +ENSE00003605114 +ENSE00003517403 +ENSE00003655153 +ENSE00003582994 +ENSE00003543912 +ENSE00003684947 +ENSE00003557083 +ENSE00003535221 +ENSE00003534549 +ENSE00003559057 +ENSE00003650873 +ENSE00003516954 +ENSE00003534507 +ENSE00003616922 +ENSE00003591218 +ENSE00001940753 +ENSE00003653363 +ENSE00003541907 +ENSE00001923708 +ENSE00003492751 +ENSE00003466854 +ENSE00003571083 +ENSE00003685158 +ENSE00003658295 +ENSE00001826643 +ENSE00003609797 +ENSE00003596489 +ENSE00001432737 +ENSE00001697293 +ENSE00003540997 +ENSE00001701479 +ENSE00001834994 +ENSE00001887073 +ENSE00001783927 +ENSE00001420069 +ENSE00002048533 +ENSE00003700259 +ENSE00001222906 +ENSE00001598723 +ENSE00003695128 +ENSE00001754112 +ENSE00002087812 +ENSE00003480863 +ENSE00003516886 +ENSE00001882136 +ENSE00002034212 +ENSE00003695725 +ENSE00003662380 +ENSE00001846205 +ENSE00003697266 +ENSE00003700221 +ENSE00003696962 +ENSE00003701239 +ENSE00003700688 +ENSE00003700436 +ENSE00003700645 +ENSE00003695760 +ENSE00003695658 +ENSE00003699089 +ENSE00003702178 +ENSE00003701451 +ENSE00001582537 +ENSE00003699052 +ENSE00003701293 +ENSE00003697785 +ENSE00003698430 +ENSE00001905893 +ENSE00003697875 +ENSE00003699796 +ENSE00003701636 +ENSE00003701891 +ENSE00003696062 +ENSE00003700534 +ENSE00003698226 +ENSE00003697832 +ENSE00003700833 +ENSE00003698886 +ENSE00002081080 +ENSE00002068021 +ENSE00001759023 +ENSE00001875784 +ENSE00001477317 +ENSE00001477303 diff --git a/pygtftk/data/mini_real_10M/ids_minus.gtf b/pygtftk/data/mini_real_10M/ids_minus.gtf new file mode 100644 index 00000000..c8de7cb0 --- /dev/null +++ b/pygtftk/data/mini_real_10M/ids_minus.gtf @@ -0,0 +1,461 @@ +chr1 havana transcript 1373730 1375157 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000338370"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 ensembl_havana three_prime_utr 1373730 1373800 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000338338"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 ensembl_havana transcript 1373730 1375495 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000338338"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 ensembl_havana exon 1373730 1373902 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000338338"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; exon_id "ENSE00001611509"; gene_name "AURKAIP1"; +chr1 havana three_prime_utr 1373730 1373800 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000338370"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 havana exon 1373730 1373902 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000338370"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; exon_id "ENSE00001611509"; gene_name "AURKAIP1"; +chr1 havana transcript 1373732 1375169 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000321751"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 havana exon 1373732 1373902 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000321751"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; exon_id "ENSE00001790281"; gene_name "AURKAIP1"; +chr1 havana three_prime_utr 1373732 1373800 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000321751"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 havana three_prime_utr 1373737 1373800 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000378853"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 havana exon 1373737 1373902 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000378853"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; exon_id "ENSE00001842703"; gene_name "AURKAIP1"; +chr1 havana transcript 1373737 1375173 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000378853"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 havana stop_codon 1373801 1373803 0 - 0 gene_id "ENSG00000175756"; transcript_id "ENST00000321751"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 ensembl_havana stop_codon 1373801 1373803 0 - 0 gene_id "ENSG00000175756"; transcript_id "ENST00000338338"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 havana stop_codon 1373801 1373803 0 - 0 gene_id "ENSG00000175756"; transcript_id "ENST00000338370"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 havana stop_codon 1373801 1373803 0 - 0 gene_id "ENSG00000175756"; transcript_id "ENST00000378853"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 havana CDS 1373804 1373902 0 - 0 gene_id "ENSG00000175756"; transcript_id "ENST00000321751"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; protein_id "ENSP00000319778"; gene_name "AURKAIP1"; +chr1 havana CDS 1373804 1373902 0 - 0 gene_id "ENSG00000175756"; transcript_id "ENST00000338370"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; protein_id "ENSP00000342676"; gene_name "AURKAIP1"; +chr1 havana CDS 1373804 1373902 0 - 0 gene_id "ENSG00000175756"; transcript_id "ENST00000378853"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; protein_id "ENSP00000368130"; gene_name "AURKAIP1"; +chr1 ensembl_havana CDS 1373804 1373902 0 - 0 gene_id "ENSG00000175756"; transcript_id "ENST00000338338"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; protein_id "ENSP00000340656"; gene_name "AURKAIP1"; +chr1 ensembl_havana CDS 1374000 1374445 0 - 2 gene_id "ENSG00000175756"; transcript_id "ENST00000338338"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; protein_id "ENSP00000340656"; gene_name "AURKAIP1"; +chr1 havana CDS 1374000 1374445 0 - 2 gene_id "ENSG00000175756"; transcript_id "ENST00000338370"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; protein_id "ENSP00000342676"; gene_name "AURKAIP1"; +chr1 havana exon 1374000 1374445 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000321751"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; exon_id "ENSE00001629775"; gene_name "AURKAIP1"; +chr1 ensembl_havana exon 1374000 1374445 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000338338"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; exon_id "ENSE00001629775"; gene_name "AURKAIP1"; +chr1 havana CDS 1374000 1374445 0 - 2 gene_id "ENSG00000175756"; transcript_id "ENST00000321751"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; protein_id "ENSP00000319778"; gene_name "AURKAIP1"; +chr1 havana exon 1374000 1374445 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000338370"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; exon_id "ENSE00001629775"; gene_name "AURKAIP1"; +chr1 havana CDS 1374000 1374445 0 - 2 gene_id "ENSG00000175756"; transcript_id "ENST00000378853"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; protein_id "ENSP00000368130"; gene_name "AURKAIP1"; +chr1 havana exon 1374000 1374445 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000378853"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; exon_id "ENSE00001629775"; gene_name "AURKAIP1"; +chr1 havana transcript 1374244 1375144 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000489799"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; gene_name "AURKAIP1"; +chr1 havana exon 1374244 1374790 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000489799"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001922199"; gene_name "AURKAIP1"; +chr1 havana exon 1374438 1374590 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000496905"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001821535"; gene_name "AURKAIP1"; +chr1 havana transcript 1374438 1375159 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000496905"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; gene_name "AURKAIP1"; +chr1 ensembl_havana exon 1374705 1374790 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000338338"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; exon_id "ENSE00001789693"; gene_name "AURKAIP1"; +chr1 havana exon 1374705 1375159 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000496905"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001896016"; gene_name "AURKAIP1"; +chr1 havana CDS 1374705 1374756 0 - 0 gene_id "ENSG00000175756"; transcript_id "ENST00000321751"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; protein_id "ENSP00000319778"; gene_name "AURKAIP1"; +chr1 havana exon 1374705 1375157 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000338370"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; exon_id "ENSE00001223521"; gene_name "AURKAIP1"; +chr1 havana CDS 1374705 1374756 0 - 0 gene_id "ENSG00000175756"; transcript_id "ENST00000338370"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; protein_id "ENSP00000342676"; gene_name "AURKAIP1"; +chr1 havana exon 1374705 1374790 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000321751"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; exon_id "ENSE00001789693"; gene_name "AURKAIP1"; +chr1 ensembl_havana CDS 1374705 1374756 0 - 0 gene_id "ENSG00000175756"; transcript_id "ENST00000338338"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; protein_id "ENSP00000340656"; gene_name "AURKAIP1"; +chr1 havana exon 1374705 1374790 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000378853"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; exon_id "ENSE00001789693"; gene_name "AURKAIP1"; +chr1 havana CDS 1374705 1374756 0 - 0 gene_id "ENSG00000175756"; transcript_id "ENST00000378853"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; protein_id "ENSP00000368130"; gene_name "AURKAIP1"; +chr1 havana start_codon 1374754 1374756 0 - 0 gene_id "ENSG00000175756"; transcript_id "ENST00000378853"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 havana start_codon 1374754 1374756 0 - 0 gene_id "ENSG00000175756"; transcript_id "ENST00000338370"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 havana start_codon 1374754 1374756 0 - 0 gene_id "ENSG00000175756"; transcript_id "ENST00000321751"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 ensembl_havana start_codon 1374754 1374756 0 - 0 gene_id "ENSG00000175756"; transcript_id "ENST00000338338"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 ensembl_havana five_prime_utr 1374757 1374790 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000338338"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 havana five_prime_utr 1374757 1375157 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000338370"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 havana five_prime_utr 1374757 1374790 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000321751"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 havana five_prime_utr 1374757 1374790 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000378853"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 havana five_prime_utr 1374997 1375173 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000378853"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 havana exon 1374997 1375144 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000489799"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001921648"; gene_name "AURKAIP1"; +chr1 havana exon 1374997 1375173 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000378853"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; exon_id "ENSE00001479025"; gene_name "AURKAIP1"; +chr1 havana exon 1375075 1375169 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000321751"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; exon_id "ENSE00001479027"; gene_name "AURKAIP1"; +chr1 havana five_prime_utr 1375075 1375169 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000321751"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 ensembl_havana exon 1375154 1375495 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000338338"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; exon_id "ENSE00001697866"; gene_name "AURKAIP1"; +chr1 ensembl_havana five_prime_utr 1375154 1375495 0 - -1 gene_id "ENSG00000175756"; transcript_id "ENST00000338338"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS25"; gene_name "AURKAIP1"; +chr1 ensembl_havana transcript 1917590 1918797 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000378602"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "TMEM52"; +chr1 ensembl_havana exon 1917590 1918162 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000378602"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001478064"; gene_name "TMEM52"; +chr1 ensembl_havana three_prime_utr 1917590 1917881 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000378602"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "TMEM52"; +chr1 ensembl_havana three_prime_utr 1917591 1917881 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000310991"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS35"; gene_name "TMEM52"; +chr1 ensembl_havana transcript 1917591 1919273 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000310991"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS35"; gene_name "TMEM52"; +chr1 ensembl_havana exon 1917591 1918162 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000310991"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS35"; exon_id "ENSE00001754010"; gene_name "TMEM52"; +chr1 havana three_prime_utr 1917845 1917952 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000378598"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "TMEM52"; +chr1 havana exon 1917845 1918071 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000378598"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001478051"; gene_name "TMEM52"; +chr1 havana transcript 1917845 1919258 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000378598"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "TMEM52"; +chr1 ensembl_havana stop_codon 1917882 1917884 0 - 0 gene_id "ENSG00000178821"; transcript_id "ENST00000310991"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS35"; gene_name "TMEM52"; +chr1 ensembl_havana stop_codon 1917882 1917884 0 - 0 gene_id "ENSG00000178821"; transcript_id "ENST00000378602"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "TMEM52"; +chr1 ensembl_havana CDS 1917885 1918162 0 - 2 gene_id "ENSG00000178821"; transcript_id "ENST00000310991"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS35"; protein_id "ENSP00000311122"; gene_name "TMEM52"; +chr1 ensembl_havana CDS 1917885 1918162 0 - 2 gene_id "ENSG00000178821"; transcript_id "ENST00000378602"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367865"; gene_name "TMEM52"; +chr1 havana exon 1917937 1918162 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000470931"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00001810932"; gene_name "TMEM52"; +chr1 havana transcript 1917937 1919270 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000470931"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "TMEM52"; +chr1 havana three_prime_utr 1917937 1918162 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000470931"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "TMEM52"; +chr1 havana stop_codon 1917953 1917955 0 - 0 gene_id "ENSG00000178821"; transcript_id "ENST00000378598"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "TMEM52"; +chr1 havana CDS 1917956 1918071 0 - 2 gene_id "ENSG00000178821"; transcript_id "ENST00000378598"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367861"; gene_name "TMEM52"; +chr1 havana transcript 1918099 1919269 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000602604"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; gene_name "TMEM52"; +chr1 havana exon 1918099 1918162 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000602604"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003350147"; gene_name "TMEM52"; +chr1 havana exon 1918253 1918934 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000602604"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003428438"; gene_name "TMEM52"; +chr1 havana exon 1918253 1918431 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000470931"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00003652520"; gene_name "TMEM52"; +chr1 havana three_prime_utr 1918253 1918431 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000470931"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "TMEM52"; +chr1 ensembl_havana CDS 1918253 1918431 0 - 1 gene_id "ENSG00000178821"; transcript_id "ENST00000310991"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS35"; protein_id "ENSP00000311122"; gene_name "TMEM52"; +chr1 ensembl_havana exon 1918253 1918431 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000310991"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS35"; exon_id "ENSE00003675447"; gene_name "TMEM52"; +chr1 ensembl_havana exon 1918253 1918797 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000378602"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001858191"; gene_name "TMEM52"; +chr1 ensembl_havana CDS 1918253 1918556 0 - 0 gene_id "ENSG00000178821"; transcript_id "ENST00000378602"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367865"; gene_name "TMEM52"; +chr1 havana transcript 1918386 1919269 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000416272"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "TMEM52"; +chr1 havana exon 1918386 1918431 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000416272"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001682091"; gene_name "TMEM52"; +chr1 havana CDS 1918386 1918431 0 - 1 gene_id "ENSG00000178821"; transcript_id "ENST00000416272"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000409669"; gene_name "TMEM52"; +chr1 ensembl_havana start_codon 1918554 1918556 0 - 0 gene_id "ENSG00000178821"; transcript_id "ENST00000378602"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "TMEM52"; +chr1 ensembl_havana five_prime_utr 1918557 1918797 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000378602"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "TMEM52"; +chr1 havana CDS 1918893 1918934 0 - 2 gene_id "ENSG00000178821"; transcript_id "ENST00000378598"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367861"; gene_name "TMEM52"; +chr1 havana exon 1918893 1918934 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000378598"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003599669"; gene_name "TMEM52"; +chr1 havana CDS 1918893 1918934 0 - 1 gene_id "ENSG00000178821"; transcript_id "ENST00000416272"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000409669"; gene_name "TMEM52"; +chr1 havana exon 1918893 1918934 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000416272"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003634508"; gene_name "TMEM52"; +chr1 ensembl_havana exon 1918893 1918934 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000310991"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS35"; exon_id "ENSE00003634508"; gene_name "TMEM52"; +chr1 havana exon 1918893 1919088 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000470931"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00001937932"; gene_name "TMEM52"; +chr1 havana three_prime_utr 1918893 1919040 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000470931"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "TMEM52"; +chr1 ensembl_havana CDS 1918893 1918934 0 - 1 gene_id "ENSG00000178821"; transcript_id "ENST00000310991"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS35"; protein_id "ENSP00000311122"; gene_name "TMEM52"; +chr1 havana stop_codon 1919041 1919043 0 - 0 gene_id "ENSG00000178821"; transcript_id "ENST00000470931"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "TMEM52"; +chr1 havana CDS 1919044 1919088 0 - 0 gene_id "ENSG00000178821"; transcript_id "ENST00000470931"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; protein_id "ENSP00000473350"; gene_name "TMEM52"; +chr1 havana exon 1919045 1919269 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000416272"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001767147"; gene_name "TMEM52"; +chr1 havana exon 1919045 1919258 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000378598"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001736550"; gene_name "TMEM52"; +chr1 havana CDS 1919045 1919265 0 - 0 gene_id "ENSG00000178821"; transcript_id "ENST00000416272"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000409669"; gene_name "TMEM52"; +chr1 havana CDS 1919045 1919258 0 - 0 gene_id "ENSG00000178821"; transcript_id "ENST00000378598"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367861"; gene_name "TMEM52"; +chr1 ensembl_havana exon 1919045 1919088 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000310991"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS35"; exon_id "ENSE00003473336"; gene_name "TMEM52"; +chr1 ensembl_havana CDS 1919045 1919088 0 - 0 gene_id "ENSG00000178821"; transcript_id "ENST00000310991"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS35"; protein_id "ENSP00000311122"; gene_name "TMEM52"; +chr1 havana exon 1919045 1919088 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000602604"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003561172"; gene_name "TMEM52"; +chr1 havana exon 1919182 1919269 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000602604"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003343061"; gene_name "TMEM52"; +chr1 havana CDS 1919182 1919265 0 - 0 gene_id "ENSG00000178821"; transcript_id "ENST00000470931"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; protein_id "ENSP00000473350"; gene_name "TMEM52"; +chr1 havana exon 1919182 1919270 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000470931"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00003293243"; gene_name "TMEM52"; +chr1 ensembl_havana CDS 1919182 1919265 0 - 0 gene_id "ENSG00000178821"; transcript_id "ENST00000310991"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS35"; protein_id "ENSP00000311122"; gene_name "TMEM52"; +chr1 ensembl_havana exon 1919182 1919273 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000310991"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS35"; exon_id "ENSE00001239803"; gene_name "TMEM52"; +chr1 havana start_codon 1919263 1919265 0 - 0 gene_id "ENSG00000178821"; transcript_id "ENST00000470931"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "TMEM52"; +chr1 ensembl_havana start_codon 1919263 1919265 0 - 0 gene_id "ENSG00000178821"; transcript_id "ENST00000310991"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS35"; gene_name "TMEM52"; +chr1 havana start_codon 1919263 1919265 0 - 0 gene_id "ENSG00000178821"; transcript_id "ENST00000416272"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "TMEM52"; +chr1 havana five_prime_utr 1919266 1919270 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000470931"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "TMEM52"; +chr1 ensembl_havana five_prime_utr 1919266 1919273 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000310991"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS35"; gene_name "TMEM52"; +chr1 havana five_prime_utr 1919266 1919269 0 - -1 gene_id "ENSG00000178821"; transcript_id "ENST00000416272"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "TMEM52"; +chr1 ensembl transcript 2184461 2194775 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000400919"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72686"; gene_name "FAAP20"; +chr1 ensembl exon 2184461 2185513 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000400919"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72686"; exon_id "ENSE00003475992"; gene_name "FAAP20"; +chr1 ensembl three_prime_utr 2184461 2185277 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000400919"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72686"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2184464 2185513 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000469733"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001817609"; gene_name "FAAP20"; +chr1 ensembl_havana transcript 2184464 2207733 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000469733"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; gene_name "FAAP20"; +chr1 havana three_prime_utr 2184478 2185513 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000414253"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "FAAP20"; +chr1 havana exon 2184478 2185513 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000414253"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00003589214"; gene_name "FAAP20"; +chr1 havana transcript 2184478 2194775 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000414253"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "FAAP20"; +chr1 ensembl_havana three_prime_utr 2184478 2185513 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000428120"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2184478 2185513 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000428120"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00003589214"; gene_name "FAAP20"; +chr1 ensembl_havana transcript 2184478 2194741 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000428120"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "FAAP20"; +chr1 havana exon 2185175 2185513 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000400918"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72687"; exon_id "ENSE00001635485"; gene_name "FAAP20"; +chr1 havana transcript 2185175 2194751 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000400918"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72687"; gene_name "FAAP20"; +chr1 havana three_prime_utr 2185175 2185470 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000400918"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72687"; gene_name "FAAP20"; +chr1 ensembl stop_codon 2185278 2185280 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000400919"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72686"; gene_name "FAAP20"; +chr1 ensembl CDS 2185281 2185513 0 - 2 gene_id "ENSG00000162585"; transcript_id "ENST00000400919"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72686"; protein_id "ENSP00000383710"; gene_name "FAAP20"; +chr1 havana stop_codon 2185471 2185473 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000400918"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72687"; gene_name "FAAP20"; +chr1 havana CDS 2185474 2185513 0 - 1 gene_id "ENSG00000162585"; transcript_id "ENST00000400918"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72687"; protein_id "ENSP00000383709"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2186004 2186249 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000428120"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00003459358"; gene_name "FAAP20"; +chr1 ensembl_havana three_prime_utr 2186004 2186249 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000428120"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "FAAP20"; +chr1 havana three_prime_utr 2186004 2186249 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000414253"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "FAAP20"; +chr1 havana exon 2186004 2186249 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000414253"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00003459358"; gene_name "FAAP20"; +chr1 havana exon 2186838 2187206 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000414253"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00003626371"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2186838 2187206 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000428120"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00003526713"; gene_name "FAAP20"; +chr1 ensembl_havana three_prime_utr 2186838 2187206 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000428120"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "FAAP20"; +chr1 havana three_prime_utr 2186838 2187157 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000414253"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "FAAP20"; +chr1 havana stop_codon 2187158 2187160 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000414253"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "FAAP20"; +chr1 havana CDS 2187161 2187206 0 - 1 gene_id "ENSG00000162585"; transcript_id "ENST00000414253"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; protein_id "ENSP00000410450"; gene_name "FAAP20"; +chr1 havana transcript 2189544 2194108 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000497675"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; gene_name "FAAP20"; +chr1 havana exon 2189544 2193910 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000497675"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001862783"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2189548 2189781 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000487186"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003569320"; gene_name "FAAP20"; +chr1 havana exon 2189548 2189781 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000378543"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS57965"; exon_id "ENSE00003681657"; gene_name "FAAP20"; +chr1 havana three_prime_utr 2189548 2189776 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000378543"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS57965"; gene_name "FAAP20"; +chr1 havana three_prime_utr 2189548 2189708 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000378546"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS38"; gene_name "FAAP20"; +chr1 havana exon 2189548 2189781 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000401813"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003569320"; gene_name "FAAP20"; +chr1 havana exon 2189548 2189781 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000378546"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS38"; exon_id "ENSE00003483048"; gene_name "FAAP20"; +chr1 havana transcript 2189548 2194774 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000378546"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS38"; gene_name "FAAP20"; +chr1 havana transcript 2189548 2194750 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000378543"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS57965"; gene_name "FAAP20"; +chr1 havana transcript 2189548 2199907 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000401813"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; gene_name "FAAP20"; +chr1 ensembl_havana transcript 2189548 2212720 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000487186"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; gene_name "FAAP20"; +chr1 havana exon 2189569 2189781 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000476803"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001951400"; gene_name "FAAP20"; +chr1 havana transcript 2189569 2194213 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000476803"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; gene_name "FAAP20"; +chr1 havana three_prime_utr 2189580 2189781 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000440825"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "FAAP20"; +chr1 havana transcript 2189580 2194739 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000440825"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "FAAP20"; +chr1 havana exon 2189580 2189781 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000440825"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00002033745"; gene_name "FAAP20"; +chr1 havana stop_codon 2189709 2189711 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000378546"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS38"; gene_name "FAAP20"; +chr1 havana CDS 2189712 2189781 0 - 1 gene_id "ENSG00000162585"; transcript_id "ENST00000378546"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS38"; protein_id "ENSP00000367808"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2189713 2189781 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000428120"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00003636009"; gene_name "FAAP20"; +chr1 havana CDS 2189713 2189781 0 - 1 gene_id "ENSG00000162585"; transcript_id "ENST00000414253"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; protein_id "ENSP00000410450"; gene_name "FAAP20"; +chr1 ensembl_havana three_prime_utr 2189713 2189781 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000428120"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "FAAP20"; +chr1 havana exon 2189713 2189781 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000414253"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00003529933"; gene_name "FAAP20"; +chr1 havana stop_codon 2189777 2189779 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000378543"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS57965"; gene_name "FAAP20"; +chr1 havana CDS 2189780 2189781 0 - 2 gene_id "ENSG00000162585"; transcript_id "ENST00000378543"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS57965"; protein_id "ENSP00000367804"; gene_name "FAAP20"; +chr1 havana exon 2191901 2192975 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000420515"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001602311"; gene_name "FAAP20"; +chr1 havana transcript 2191901 2194748 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000420515"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "FAAP20"; +chr1 havana three_prime_utr 2191901 2192857 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000420515"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "FAAP20"; +chr1 havana exon 2192647 2192975 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000440825"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00001720216"; gene_name "FAAP20"; +chr1 havana three_prime_utr 2192647 2192857 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000440825"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2192845 2192975 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000428120"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00003630334"; gene_name "FAAP20"; +chr1 ensembl_havana three_prime_utr 2192845 2192857 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000428120"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "FAAP20"; +chr1 ensembl_havana stop_codon 2192858 2192860 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000428120"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "FAAP20"; +chr1 havana stop_codon 2192858 2192860 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000440825"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "FAAP20"; +chr1 havana stop_codon 2192858 2192860 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000420515"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "FAAP20"; +chr1 ensembl_havana CDS 2192861 2192975 0 - 1 gene_id "ENSG00000162585"; transcript_id "ENST00000428120"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; protein_id "ENSP00000405430"; gene_name "FAAP20"; +chr1 havana CDS 2192861 2192975 0 - 1 gene_id "ENSG00000162585"; transcript_id "ENST00000440825"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; protein_id "ENSP00000410740"; gene_name "FAAP20"; +chr1 havana CDS 2192861 2192975 0 - 1 gene_id "ENSG00000162585"; transcript_id "ENST00000420515"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000409721"; gene_name "FAAP20"; +chr1 havana exon 2193639 2193910 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000476803"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003481862"; gene_name "FAAP20"; +chr1 havana CDS 2193639 2193910 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000378546"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS38"; protein_id "ENSP00000367808"; gene_name "FAAP20"; +chr1 havana CDS 2193639 2193910 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000414253"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; protein_id "ENSP00000410450"; gene_name "FAAP20"; +chr1 havana CDS 2193639 2193910 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000400918"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72687"; protein_id "ENSP00000383709"; gene_name "FAAP20"; +chr1 havana exon 2193639 2193910 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000414253"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00003510741"; gene_name "FAAP20"; +chr1 havana exon 2193639 2193910 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000378546"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS38"; exon_id "ENSE00003510741"; gene_name "FAAP20"; +chr1 ensembl exon 2193639 2193910 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000400919"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72686"; exon_id "ENSE00003548540"; gene_name "FAAP20"; +chr1 ensembl CDS 2193639 2193910 0 - 1 gene_id "ENSG00000162585"; transcript_id "ENST00000400919"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72686"; protein_id "ENSP00000383710"; gene_name "FAAP20"; +chr1 havana exon 2193639 2193910 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000400918"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72687"; exon_id "ENSE00003510741"; gene_name "FAAP20"; +chr1 havana exon 2193639 2193910 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000440825"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00003510741"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2193639 2193910 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000487186"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003481862"; gene_name "FAAP20"; +chr1 havana CDS 2193639 2193910 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000420515"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000409721"; gene_name "FAAP20"; +chr1 havana exon 2193639 2193910 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000378543"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS57965"; exon_id "ENSE00003548540"; gene_name "FAAP20"; +chr1 havana CDS 2193639 2193910 0 - 1 gene_id "ENSG00000162585"; transcript_id "ENST00000378543"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS57965"; protein_id "ENSP00000367804"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2193639 2193910 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000428120"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00003510741"; gene_name "FAAP20"; +chr1 havana CDS 2193639 2193910 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000440825"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; protein_id "ENSP00000410740"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2193639 2193910 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000469733"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003481862"; gene_name "FAAP20"; +chr1 havana exon 2193639 2193910 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000420515"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003510741"; gene_name "FAAP20"; +chr1 havana exon 2193639 2193910 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000401813"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003481862"; gene_name "FAAP20"; +chr1 ensembl_havana CDS 2193639 2193910 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000428120"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; protein_id "ENSP00000405430"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2193998 2194133 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000487186"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003634783"; gene_name "FAAP20"; +chr1 havana exon 2193998 2194133 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000414253"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00003467961"; gene_name "FAAP20"; +chr1 havana exon 2193998 2194108 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000497675"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001841545"; gene_name "FAAP20"; +chr1 havana exon 2193998 2194133 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000378546"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS38"; exon_id "ENSE00003467961"; gene_name "FAAP20"; +chr1 havana CDS 2193998 2194133 0 - 1 gene_id "ENSG00000162585"; transcript_id "ENST00000378546"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS38"; protein_id "ENSP00000367808"; gene_name "FAAP20"; +chr1 havana CDS 2193998 2194133 0 - 1 gene_id "ENSG00000162585"; transcript_id "ENST00000414253"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; protein_id "ENSP00000410450"; gene_name "FAAP20"; +chr1 havana exon 2193998 2194213 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000476803"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001816369"; gene_name "FAAP20"; +chr1 havana CDS 2193998 2194133 0 - 1 gene_id "ENSG00000162585"; transcript_id "ENST00000400918"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72687"; protein_id "ENSP00000383709"; gene_name "FAAP20"; +chr1 ensembl_havana CDS 2193998 2194133 0 - 1 gene_id "ENSG00000162585"; transcript_id "ENST00000428120"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; protein_id "ENSP00000405430"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2193998 2194133 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000428120"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00003467961"; gene_name "FAAP20"; +chr1 havana exon 2193998 2194133 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000420515"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003467961"; gene_name "FAAP20"; +chr1 havana exon 2193998 2194133 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000400918"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72687"; exon_id "ENSE00003467961"; gene_name "FAAP20"; +chr1 havana CDS 2193998 2194133 0 - 1 gene_id "ENSG00000162585"; transcript_id "ENST00000420515"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000409721"; gene_name "FAAP20"; +chr1 havana exon 2193998 2194133 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000401813"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003634783"; gene_name "FAAP20"; +chr1 havana CDS 2194688 2194748 0 - 2 gene_id "ENSG00000162585"; transcript_id "ENST00000420515"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000409721"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2194688 2194741 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000428120"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00003618179"; gene_name "FAAP20"; +chr1 ensembl_havana CDS 2194688 2194741 0 - 1 gene_id "ENSG00000162585"; transcript_id "ENST00000428120"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; protein_id "ENSP00000405430"; gene_name "FAAP20"; +chr1 havana exon 2194688 2194748 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000420515"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001545345"; gene_name "FAAP20"; +chr1 ensembl CDS 2194688 2194749 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000400919"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72686"; protein_id "ENSP00000383710"; gene_name "FAAP20"; +chr1 havana CDS 2194688 2194749 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000378546"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS38"; protein_id "ENSP00000367808"; gene_name "FAAP20"; +chr1 havana exon 2194688 2194774 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000378546"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS38"; exon_id "ENSE00001822711"; gene_name "FAAP20"; +chr1 havana CDS 2194688 2194749 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000400918"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72687"; protein_id "ENSP00000383709"; gene_name "FAAP20"; +chr1 havana exon 2194688 2194775 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000414253"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00002226200"; gene_name "FAAP20"; +chr1 havana CDS 2194688 2194749 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000414253"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; protein_id "ENSP00000410450"; gene_name "FAAP20"; +chr1 havana CDS 2194688 2194749 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000378543"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS57965"; protein_id "ENSP00000367804"; gene_name "FAAP20"; +chr1 havana exon 2194688 2194750 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000378543"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS57965"; exon_id "ENSE00001477870"; gene_name "FAAP20"; +chr1 havana CDS 2194688 2194739 0 - 1 gene_id "ENSG00000162585"; transcript_id "ENST00000440825"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; protein_id "ENSP00000410740"; gene_name "FAAP20"; +chr1 ensembl exon 2194688 2194775 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000400919"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72686"; exon_id "ENSE00002226200"; gene_name "FAAP20"; +chr1 havana exon 2194688 2194751 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000400918"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72687"; exon_id "ENSE00001816144"; gene_name "FAAP20"; +chr1 havana exon 2194688 2194739 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000440825"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; exon_id "ENSE00001720995"; gene_name "FAAP20"; +chr1 havana start_codon 2194747 2194749 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000400918"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72687"; gene_name "FAAP20"; +chr1 ensembl start_codon 2194747 2194749 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000400919"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72686"; gene_name "FAAP20"; +chr1 havana start_codon 2194747 2194749 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000414253"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "FAAP20"; +chr1 havana start_codon 2194747 2194749 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000378543"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS57965"; gene_name "FAAP20"; +chr1 havana start_codon 2194747 2194749 0 - 0 gene_id "ENSG00000162585"; transcript_id "ENST00000378546"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS38"; gene_name "FAAP20"; +chr1 havana five_prime_utr 2194750 2194775 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000414253"; gene_biotype "protein_coding"; transcript_biotype "nonsense_mediated_decay"; gene_name "FAAP20"; +chr1 havana five_prime_utr 2194750 2194751 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000400918"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72687"; gene_name "FAAP20"; +chr1 havana five_prime_utr 2194750 2194750 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000378543"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS57965"; gene_name "FAAP20"; +chr1 ensembl five_prime_utr 2194750 2194775 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000400919"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS72686"; gene_name "FAAP20"; +chr1 havana five_prime_utr 2194750 2194774 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000378546"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS38"; gene_name "FAAP20"; +chr1 havana exon 2198007 2199907 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000401813"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00002040955"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2198007 2198142 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000469733"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003615416"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2198007 2198142 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000487186"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003615416"; gene_name "FAAP20"; +chr1 havana exon 2198063 2198142 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000514625"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00002044438"; gene_name "FAAP20"; +chr1 havana transcript 2198063 2203882 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000514625"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2198754 2201225 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000487186"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001853635"; gene_name "FAAP20"; +chr1 havana exon 2201050 2201225 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000514625"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001859055"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2201050 2201225 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000469733"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001859055"; gene_name "FAAP20"; +chr1 havana exon 2203436 2203882 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000514625"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00002034769"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2203436 2203630 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000469733"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001916683"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2203564 2203630 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000487186"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001937728"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2206305 2206424 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000469733"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001845014"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2206515 2206667 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000469733"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001908868"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2207556 2207733 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000469733"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001934415"; gene_name "FAAP20"; +chr1 havana exon 2212171 2212458 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000420964"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001714381"; gene_name "FAAP20"; +chr1 havana transcript 2212171 2212574 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000420964"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2212372 2212458 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000487186"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001821386"; gene_name "FAAP20"; +chr1 havana exon 2212549 2212574 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000420964"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001724829"; gene_name "FAAP20"; +chr1 ensembl_havana exon 2212549 2212720 0 - -1 gene_id "ENSG00000162585"; transcript_id "ENST00000487186"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001927358"; gene_name "FAAP20"; +chr1 havana transcript 3630767 3650058 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "WRAP73"; +chr1 ensembl_havana three_prime_utr 3630767 3630974 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; gene_name "WRAP73"; +chr1 havana exon 3630767 3631657 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001755234"; gene_name "WRAP73"; +chr1 havana three_prime_utr 3630767 3631397 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "WRAP73"; +chr1 ensembl_havana transcript 3630767 3650073 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; gene_name "WRAP73"; +chr1 ensembl_havana exon 3630767 3631117 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; exon_id "ENSE00001697450"; gene_name "WRAP73"; +chr1 ensembl_havana stop_codon 3630975 3630977 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; gene_name "WRAP73"; +chr1 ensembl_havana CDS 3630978 3631117 0 - 2 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; protein_id "ENSP00000270708"; gene_name "WRAP73"; +chr1 havana stop_codon 3631398 3631400 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "WRAP73"; +chr1 havana CDS 3631401 3631657 0 - 2 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367573"; gene_name "WRAP73"; +chr1 ensembl_havana exon 3631466 3631657 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; exon_id "ENSE00001797222"; gene_name "WRAP73"; +chr1 ensembl_havana CDS 3631466 3631657 0 - 2 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; protein_id "ENSP00000270708"; gene_name "WRAP73"; +chr1 havana transcript 3631886 3639625 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000471223"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; gene_name "WRAP73"; +chr1 havana exon 3631886 3637098 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000471223"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001862304"; gene_name "WRAP73"; +chr1 havana CDS 3632213 3632338 0 - 2 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000416192"; gene_name "WRAP73"; +chr1 ensembl_havana exon 3632213 3632338 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; exon_id "ENSE00003789737"; gene_name "WRAP73"; +chr1 ensembl_havana CDS 3632213 3632338 0 - 2 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; protein_id "ENSP00000270708"; gene_name "WRAP73"; +chr1 havana CDS 3632213 3632338 0 - 2 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367573"; gene_name "WRAP73"; +chr1 havana transcript 3632213 3650026 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "WRAP73"; +chr1 havana exon 3632213 3632338 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003789737"; gene_name "WRAP73"; +chr1 havana exon 3632213 3632338 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003789737"; gene_name "WRAP73"; +chr1 havana exon 3632766 3633503 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000497940"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001852362"; gene_name "WRAP73"; +chr1 havana transcript 3632766 3637057 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000497940"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; gene_name "WRAP73"; +chr1 havana transcript 3633310 3635450 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000469643"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; gene_name "WRAP73"; +chr1 havana exon 3633310 3633503 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000469643"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001924010"; gene_name "WRAP73"; +chr1 havana CDS 3633398 3633503 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000416192"; gene_name "WRAP73"; +chr1 havana exon 3633398 3633503 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001659258"; gene_name "WRAP73"; +chr1 havana CDS 3633398 3633503 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367573"; gene_name "WRAP73"; +chr1 havana exon 3633398 3633503 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001659258"; gene_name "WRAP73"; +chr1 ensembl_havana exon 3633398 3633503 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; exon_id "ENSE00001659258"; gene_name "WRAP73"; +chr1 ensembl_havana CDS 3633398 3633503 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; protein_id "ENSP00000270708"; gene_name "WRAP73"; +chr1 havana exon 3634916 3635074 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000494884"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001813324"; gene_name "WRAP73"; +chr1 havana transcript 3634916 3635433 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000494884"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; gene_name "WRAP73"; +chr1 havana exon 3634997 3635074 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003685083"; gene_name "WRAP73"; +chr1 havana CDS 3634997 3635074 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367573"; gene_name "WRAP73"; +chr1 ensembl_havana CDS 3634997 3635074 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; protein_id "ENSP00000270708"; gene_name "WRAP73"; +chr1 havana exon 3634997 3635074 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000497940"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003653006"; gene_name "WRAP73"; +chr1 havana CDS 3634997 3635074 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000416192"; gene_name "WRAP73"; +chr1 havana exon 3634997 3635074 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003685083"; gene_name "WRAP73"; +chr1 ensembl_havana exon 3634997 3635074 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; exon_id "ENSE00003685083"; gene_name "WRAP73"; +chr1 havana exon 3634997 3635074 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000469643"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003653006"; gene_name "WRAP73"; +chr1 havana CDS 3635014 3635074 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000465916"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000463084"; gene_name "WRAP73"; +chr1 havana transcript 3635014 3652761 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000465916"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "WRAP73"; +chr1 havana exon 3635014 3635074 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000465916"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001866903"; gene_name "WRAP73"; +chr1 ensembl_havana CDS 3635160 3635294 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; protein_id "ENSP00000270708"; gene_name "WRAP73"; +chr1 ensembl_havana exon 3635160 3635294 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; exon_id "ENSE00003492457"; gene_name "WRAP73"; +chr1 havana exon 3635160 3635433 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000494884"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001896684"; gene_name "WRAP73"; +chr1 havana CDS 3635160 3635294 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367573"; gene_name "WRAP73"; +chr1 havana exon 3635160 3635294 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003492457"; gene_name "WRAP73"; +chr1 havana CDS 3635160 3635294 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000465916"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000463084"; gene_name "WRAP73"; +chr1 havana exon 3635160 3635294 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000465916"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003492457"; gene_name "WRAP73"; +chr1 havana exon 3635160 3635294 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000497940"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003669982"; gene_name "WRAP73"; +chr1 havana exon 3635160 3635450 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000469643"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001839399"; gene_name "WRAP73"; +chr1 havana CDS 3635272 3635294 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000419924"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389738"; gene_name "WRAP73"; +chr1 havana exon 3635272 3635294 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000419924"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003387437"; gene_name "WRAP73"; +chr1 havana transcript 3635272 3650063 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000419924"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "WRAP73"; +chr1 havana exon 3635944 3636030 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000465916"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003480267"; gene_name "WRAP73"; +chr1 ensembl_havana CDS 3635944 3636030 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; protein_id "ENSP00000270708"; gene_name "WRAP73"; +chr1 havana exon 3635944 3636030 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000497940"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003485438"; gene_name "WRAP73"; +chr1 havana exon 3635944 3636030 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003480267"; gene_name "WRAP73"; +chr1 ensembl_havana exon 3635944 3636030 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; exon_id "ENSE00003480267"; gene_name "WRAP73"; +chr1 havana CDS 3635944 3636030 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000416192"; gene_name "WRAP73"; +chr1 havana exon 3635944 3636030 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003480267"; gene_name "WRAP73"; +chr1 havana CDS 3635944 3636030 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000465916"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000463084"; gene_name "WRAP73"; +chr1 havana CDS 3635944 3636030 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367573"; gene_name "WRAP73"; +chr1 havana CDS 3636995 3637098 0 - 2 gene_id "ENSG00000116213"; transcript_id "ENST00000419924"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389738"; gene_name "WRAP73"; +chr1 havana exon 3636995 3637057 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000497940"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001857368"; gene_name "WRAP73"; +chr1 havana exon 3636995 3637098 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000419924"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00000734306"; gene_name "WRAP73"; +chr1 havana exon 3636995 3637098 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000465916"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00000734306"; gene_name "WRAP73"; +chr1 havana exon 3636995 3637098 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00000734306"; gene_name "WRAP73"; +chr1 havana CDS 3636995 3637098 0 - 2 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000416192"; gene_name "WRAP73"; +chr1 havana exon 3636995 3637098 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00000734306"; gene_name "WRAP73"; +chr1 havana CDS 3636995 3637098 0 - 2 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367573"; gene_name "WRAP73"; +chr1 ensembl_havana CDS 3636995 3637098 0 - 2 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; protein_id "ENSP00000270708"; gene_name "WRAP73"; +chr1 ensembl_havana exon 3636995 3637098 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; exon_id "ENSE00000734306"; gene_name "WRAP73"; +chr1 havana CDS 3636995 3637098 0 - 2 gene_id "ENSG00000116213"; transcript_id "ENST00000465916"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000463084"; gene_name "WRAP73"; +chr1 havana CDS 3638750 3638822 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000416192"; gene_name "WRAP73"; +chr1 havana exon 3638750 3638822 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00000734303"; gene_name "WRAP73"; +chr1 havana exon 3638750 3638822 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000465916"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00000734303"; gene_name "WRAP73"; +chr1 havana CDS 3638750 3638822 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000419924"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389738"; gene_name "WRAP73"; +chr1 havana exon 3638750 3638822 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000419924"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00000734303"; gene_name "WRAP73"; +chr1 havana exon 3638750 3639625 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000471223"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001854631"; gene_name "WRAP73"; +chr1 havana CDS 3638750 3638822 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000465916"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000463084"; gene_name "WRAP73"; +chr1 havana CDS 3638750 3638822 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367573"; gene_name "WRAP73"; +chr1 ensembl_havana CDS 3638750 3638822 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; protein_id "ENSP00000270708"; gene_name "WRAP73"; +chr1 ensembl_havana exon 3638750 3638822 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; exon_id "ENSE00000734303"; gene_name "WRAP73"; +chr1 havana exon 3638750 3638822 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00000734303"; gene_name "WRAP73"; +chr1 havana exon 3646666 3646782 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000465916"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00000734299"; gene_name "WRAP73"; +chr1 havana CDS 3646666 3646782 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000416192"; gene_name "WRAP73"; +chr1 havana exon 3646666 3646782 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00000734299"; gene_name "WRAP73"; +chr1 havana exon 3646666 3646782 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00000734299"; gene_name "WRAP73"; +chr1 havana CDS 3646666 3646782 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000419924"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389738"; gene_name "WRAP73"; +chr1 havana exon 3646666 3646782 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000419924"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00000734299"; gene_name "WRAP73"; +chr1 havana CDS 3646666 3646782 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367573"; gene_name "WRAP73"; +chr1 ensembl_havana exon 3646666 3646782 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; exon_id "ENSE00000734299"; gene_name "WRAP73"; +chr1 ensembl_havana CDS 3646666 3646782 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; protein_id "ENSP00000270708"; gene_name "WRAP73"; +chr1 havana CDS 3646666 3646782 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000465916"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000463084"; gene_name "WRAP73"; +chr1 havana exon 3647246 3647560 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000479331"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001931622"; gene_name "WRAP73"; +chr1 havana transcript 3647246 3650061 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000479331"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; gene_name "WRAP73"; +chr1 havana CDS 3647408 3647431 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000465916"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000463084"; gene_name "WRAP73"; +chr1 havana exon 3647408 3647560 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003566716"; gene_name "WRAP73"; +chr1 ensembl_havana CDS 3647408 3647560 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; protein_id "ENSP00000270708"; gene_name "WRAP73"; +chr1 havana exon 3647408 3647560 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000465916"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003677298"; gene_name "WRAP73"; +chr1 havana CDS 3647408 3647560 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367573"; gene_name "WRAP73"; +chr1 havana CDS 3647408 3647560 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000416192"; gene_name "WRAP73"; +chr1 ensembl_havana exon 3647408 3647560 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; exon_id "ENSE00003566716"; gene_name "WRAP73"; +chr1 havana exon 3647408 3647560 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003566716"; gene_name "WRAP73"; +chr1 havana CDS 3647408 3647560 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000419924"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389738"; gene_name "WRAP73"; +chr1 havana exon 3647408 3647560 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000419924"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003566716"; gene_name "WRAP73"; +chr1 havana start_codon 3647429 3647431 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000465916"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "WRAP73"; +chr1 havana five_prime_utr 3647432 3647560 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000465916"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "WRAP73"; +chr1 havana exon 3649931 3650058 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001870155"; gene_name "WRAP73"; +chr1 havana CDS 3649931 3649999 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000416192"; gene_name "WRAP73"; +chr1 havana exon 3649931 3650063 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000419924"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001477063"; gene_name "WRAP73"; +chr1 havana CDS 3649931 3649999 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000419924"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389738"; gene_name "WRAP73"; +chr1 havana exon 3649931 3650026 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001680820"; gene_name "WRAP73"; +chr1 ensembl_havana exon 3649931 3650073 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; exon_id "ENSE00001748742"; gene_name "WRAP73"; +chr1 ensembl_havana CDS 3649931 3649999 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; protein_id "ENSP00000270708"; gene_name "WRAP73"; +chr1 havana exon 3649931 3650061 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000479331"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001836154"; gene_name "WRAP73"; +chr1 havana CDS 3649931 3649999 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367573"; gene_name "WRAP73"; +chr1 ensembl_havana start_codon 3649997 3649999 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; gene_name "WRAP73"; +chr1 havana start_codon 3649997 3649999 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "WRAP73"; +chr1 havana start_codon 3649997 3649999 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000419924"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "WRAP73"; +chr1 havana start_codon 3649997 3649999 0 - 0 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "WRAP73"; +chr1 havana five_prime_utr 3650000 3650026 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000424367"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "WRAP73"; +chr1 havana five_prime_utr 3650000 3650063 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000419924"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "WRAP73"; +chr1 havana five_prime_utr 3650000 3650058 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000378322"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "WRAP73"; +chr1 ensembl_havana five_prime_utr 3650000 3650073 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000270708"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS48"; gene_name "WRAP73"; +chr1 havana five_prime_utr 3652713 3652761 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000465916"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "WRAP73"; +chr1 havana exon 3652713 3652761 0 - -1 gene_id "ENSG00000116213"; transcript_id "ENST00000465916"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001858739"; gene_name "WRAP73"; +chr1 havana transcript 6412418 6424670 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377837"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 havana exon 6412418 6413282 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377837"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001475277"; gene_name "HES2"; +chr1 havana three_prime_utr 6412418 6413192 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377837"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 havana exon 6413000 6413282 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377836"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001475269"; gene_name "HES2"; +chr1 havana three_prime_utr 6413000 6413192 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377836"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 havana transcript 6413000 6419903 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377836"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 havana transcript 6413050 6416631 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000471190"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; gene_name "HES2"; +chr1 havana exon 6413050 6413282 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000471190"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001890428"; gene_name "HES2"; +chr1 havana stop_codon 6413193 6413195 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000377836"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 havana stop_codon 6413193 6413195 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000377837"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 havana CDS 6413196 6413282 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000377836"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367067"; gene_name "HES2"; +chr1 havana CDS 6413196 6413282 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000377837"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367068"; gene_name "HES2"; +chr1 ensembl_havana three_prime_utr 6415232 6418872 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377834"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS30574"; gene_name "HES2"; +chr1 ensembl_havana exon 6415232 6419153 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377834"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS30574"; exon_id "ENSE00001475263"; gene_name "HES2"; +chr1 ensembl_havana transcript 6415232 6419919 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377834"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS30574"; gene_name "HES2"; +chr1 havana exon 6416516 6416631 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000471190"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001948071"; gene_name "HES2"; +chr1 havana three_prime_utr 6418414 6419060 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000487437"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 havana transcript 6418414 6419907 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000487437"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 havana exon 6418414 6419153 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000487437"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001854189"; gene_name "HES2"; +chr1 havana exon 6418849 6419340 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000489730"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001914446"; gene_name "HES2"; +chr1 havana transcript 6418849 6419917 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000489730"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 havana three_prime_utr 6418849 6419232 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000489730"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 ensembl_havana stop_codon 6418873 6418875 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000377834"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS30574"; gene_name "HES2"; +chr1 ensembl_havana CDS 6418876 6419153 0 - 2 gene_id "ENSG00000069812"; transcript_id "ENST00000377834"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS30574"; protein_id "ENSP00000367065"; gene_name "HES2"; +chr1 havana stop_codon 6419061 6419063 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000487437"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 havana CDS 6419064 6419153 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000487437"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000465248"; gene_name "HES2"; +chr1 havana stop_codon 6419233 6419235 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000489730"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 havana CDS 6419236 6419340 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000489730"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000465270"; gene_name "HES2"; +chr1 ensembl_havana CDS 6419241 6419340 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000377834"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS30574"; protein_id "ENSP00000367065"; gene_name "HES2"; +chr1 ensembl_havana exon 6419241 6419340 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377834"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS30574"; exon_id "ENSE00000734533"; gene_name "HES2"; +chr1 havana exon 6419607 6419702 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000487437"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00002817476"; gene_name "HES2"; +chr1 ensembl_havana exon 6419607 6419702 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377834"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS30574"; exon_id "ENSE00002817476"; gene_name "HES2"; +chr1 ensembl_havana CDS 6419607 6419702 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000377834"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS30574"; protein_id "ENSP00000367065"; gene_name "HES2"; +chr1 havana CDS 6419607 6419702 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000487437"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000465248"; gene_name "HES2"; +chr1 havana exon 6419607 6419702 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000489730"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00002817476"; gene_name "HES2"; +chr1 havana exon 6419607 6419702 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377837"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00002817476"; gene_name "HES2"; +chr1 havana CDS 6419607 6419702 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000377837"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367068"; gene_name "HES2"; +chr1 havana CDS 6419607 6419702 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000377836"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367067"; gene_name "HES2"; +chr1 havana exon 6419607 6419702 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377836"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00002817476"; gene_name "HES2"; +chr1 havana CDS 6419607 6419702 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000489730"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000465270"; gene_name "HES2"; +chr1 havana CDS 6419776 6419820 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000489730"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000465270"; gene_name "HES2"; +chr1 havana exon 6419776 6419907 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000487437"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001916716"; gene_name "HES2"; +chr1 havana CDS 6419776 6419820 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000487437"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000465248"; gene_name "HES2"; +chr1 ensembl_havana CDS 6419776 6419820 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000377834"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS30574"; protein_id "ENSP00000367065"; gene_name "HES2"; +chr1 ensembl_havana exon 6419776 6419919 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377834"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS30574"; exon_id "ENSE00001475267"; gene_name "HES2"; +chr1 havana CDS 6419776 6419820 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000377836"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367067"; gene_name "HES2"; +chr1 havana exon 6419776 6419903 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377836"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001475271"; gene_name "HES2"; +chr1 havana exon 6419776 6419917 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000489730"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001835288"; gene_name "HES2"; +chr1 havana exon 6419776 6419843 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377837"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001475281"; gene_name "HES2"; +chr1 havana CDS 6419776 6419820 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000377837"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000367068"; gene_name "HES2"; +chr1 havana start_codon 6419818 6419820 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000377836"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 havana start_codon 6419818 6419820 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000489730"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 havana start_codon 6419818 6419820 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000377837"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 havana start_codon 6419818 6419820 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000487437"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 ensembl_havana start_codon 6419818 6419820 0 - 0 gene_id "ENSG00000069812"; transcript_id "ENST00000377834"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS30574"; gene_name "HES2"; +chr1 ensembl_havana five_prime_utr 6419821 6419919 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377834"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS30574"; gene_name "HES2"; +chr1 havana five_prime_utr 6419821 6419843 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377837"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 havana five_prime_utr 6419821 6419907 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000487437"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 havana five_prime_utr 6419821 6419903 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377836"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 havana five_prime_utr 6419821 6419917 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000489730"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 havana five_prime_utr 6424478 6424670 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377837"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "HES2"; +chr1 havana exon 6424478 6424670 0 - -1 gene_id "ENSG00000069812"; transcript_id "ENST00000377837"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001150483"; gene_name "HES2"; +chr1 havana transcript 9148011 9182392 0 - -1 gene_id "ENSG00000228526"; transcript_id "ENST00000635687"; gene_biotype "lincRNA"; transcript_biotype "lincRNA"; gene_name "MIR34AHG"; +chr1 havana exon 9148011 9151835 0 - -1 gene_id "ENSG00000228526"; transcript_id "ENST00000635687"; gene_biotype "lincRNA"; transcript_biotype "lincRNA"; exon_id "ENSE00003790229"; gene_name "MIR34AHG"; +chr1 ensembl transcript 9151668 9151777 0 - -1 gene_id "ENSG00000228526"; transcript_id "ENST00000385130"; gene_biotype "lincRNA"; transcript_biotype "miRNA"; gene_name "MIR34AHG"; +chr1 ensembl exon 9151668 9151777 0 - -1 gene_id "ENSG00000228526"; transcript_id "ENST00000385130"; gene_biotype "lincRNA"; transcript_biotype "miRNA"; exon_id "ENSE00001500136"; gene_name "MIR34AHG"; +chr1 havana exon 9182007 9182392 0 - -1 gene_id "ENSG00000228526"; transcript_id "ENST00000635687"; gene_biotype "lincRNA"; transcript_biotype "lincRNA"; exon_id "ENSE00003787977"; gene_name "MIR34AHG"; +chr1 havana transcript 9182007 9183750 0 - -1 gene_id "ENSG00000228526"; transcript_id "ENST00000437157"; gene_biotype "lincRNA"; transcript_biotype "lincRNA"; gene_name "MIR34AHG"; +chr1 havana exon 9182007 9182295 0 - -1 gene_id "ENSG00000228526"; transcript_id "ENST00000437157"; gene_biotype "lincRNA"; transcript_biotype "lincRNA"; exon_id "ENSE00001658885"; gene_name "MIR34AHG"; +chr1 havana exon 9183631 9183750 0 - -1 gene_id "ENSG00000228526"; transcript_id "ENST00000437157"; gene_biotype "lincRNA"; transcript_biotype "lincRNA"; exon_id "ENSE00001670416"; gene_name "MIR34AHG"; diff --git a/pygtftk/data/mini_real_10M/ids_minus.txt b/pygtftk/data/mini_real_10M/ids_minus.txt new file mode 100644 index 00000000..a968df50 --- /dev/null +++ b/pygtftk/data/mini_real_10M/ids_minus.txt @@ -0,0 +1,47 @@ +ENST00000338370 +ENST00000338338 +ENST00000321751 +ENST00000378853 +ENST00000489799 +ENST00000496905 +ENST00000378602 +ENST00000310991 +ENST00000378598 +ENST00000470931 +ENST00000602604 +ENST00000416272 +ENST00000400919 +ENST00000469733 +ENST00000414253 +ENST00000428120 +ENST00000400918 +ENST00000497675 +ENST00000487186 +ENST00000378543 +ENST00000378546 +ENST00000401813 +ENST00000476803 +ENST00000440825 +ENST00000420515 +ENST00000514625 +ENST00000420964 +ENST00000378322 +ENST00000270708 +ENST00000471223 +ENST00000424367 +ENST00000497940 +ENST00000469643 +ENST00000494884 +ENST00000465916 +ENST00000419924 +ENST00000479331 +ENST00000377837 +ENST00000377836 +ENST00000471190 +ENST00000377834 +ENST00000487437 +ENST00000489730 +ENST00000635687 +ENST00000385130 +ENST00000635405 +ENST00000437157 diff --git a/pygtftk/data/mini_real_10M/ids_minus_exon.txt b/pygtftk/data/mini_real_10M/ids_minus_exon.txt new file mode 100644 index 00000000..fdbb151b --- /dev/null +++ b/pygtftk/data/mini_real_10M/ids_minus_exon.txt @@ -0,0 +1,133 @@ +ENSE00001611509 +ENSE00001790281 +ENSE00001842703 +ENSE00001629775 +ENSE00001922199 +ENSE00001821535 +ENSE00001789693 +ENSE00001896016 +ENSE00001223521 +ENSE00001921648 +ENSE00001479025 +ENSE00001479027 +ENSE00001697866 +ENSE00001478064 +ENSE00001754010 +ENSE00001478051 +ENSE00001810932 +ENSE00003350147 +ENSE00003428438 +ENSE00003652520 +ENSE00003675447 +ENSE00001858191 +ENSE00001682091 +ENSE00003599669 +ENSE00003634508 +ENSE00001937932 +ENSE00001767147 +ENSE00001736550 +ENSE00003473336 +ENSE00003561172 +ENSE00003343061 +ENSE00003293243 +ENSE00001239803 +ENSE00003475992 +ENSE00001817609 +ENSE00003589214 +ENSE00001635485 +ENSE00003459358 +ENSE00003626371 +ENSE00003526713 +ENSE00001862783 +ENSE00003569320 +ENSE00003681657 +ENSE00003483048 +ENSE00001951400 +ENSE00002033745 +ENSE00003636009 +ENSE00003529933 +ENSE00001602311 +ENSE00001720216 +ENSE00003630334 +ENSE00003481862 +ENSE00003510741 +ENSE00003548540 +ENSE00003634783 +ENSE00003467961 +ENSE00001841545 +ENSE00001816369 +ENSE00003618179 +ENSE00001545345 +ENSE00001822711 +ENSE00002226200 +ENSE00001477870 +ENSE00001816144 +ENSE00001720995 +ENSE00002040955 +ENSE00003615416 +ENSE00002044438 +ENSE00001853635 +ENSE00001859055 +ENSE00002034769 +ENSE00001916683 +ENSE00001937728 +ENSE00001845014 +ENSE00001908868 +ENSE00001934415 +ENSE00001714381 +ENSE00001821386 +ENSE00001724829 +ENSE00001927358 +ENSE00001755234 +ENSE00001697450 +ENSE00001797222 +ENSE00001862304 +ENSE00003789737 +ENSE00001852362 +ENSE00001924010 +ENSE00001659258 +ENSE00001813324 +ENSE00003685083 +ENSE00003653006 +ENSE00001866903 +ENSE00003492457 +ENSE00001896684 +ENSE00003669982 +ENSE00001839399 +ENSE00003387437 +ENSE00003480267 +ENSE00003485438 +ENSE00001857368 +ENSE00000734306 +ENSE00000734303 +ENSE00001854631 +ENSE00000734299 +ENSE00001931622 +ENSE00003566716 +ENSE00003677298 +ENSE00001870155 +ENSE00001477063 +ENSE00001680820 +ENSE00001748742 +ENSE00001836154 +ENSE00001858739 +ENSE00001475277 +ENSE00001475269 +ENSE00001890428 +ENSE00001475263 +ENSE00001948071 +ENSE00001854189 +ENSE00001914446 +ENSE00000734533 +ENSE00002817476 +ENSE00001916716 +ENSE00001475267 +ENSE00001475271 +ENSE00001835288 +ENSE00001475281 +ENSE00001150483 +ENSE00003790229 +ENSE00001500136 +ENSE00003787977 +ENSE00001658885 +ENSE00001670416 diff --git a/pygtftk/data/mini_real_10M/ids_plus.gtf b/pygtftk/data/mini_real_10M/ids_plus.gtf new file mode 100644 index 00000000..5a257963 --- /dev/null +++ b/pygtftk/data/mini_real_10M/ids_plus.gtf @@ -0,0 +1,468 @@ +chr1 havana five_prime_utr 1001145 1001263 0 + -1 gene_id "ENSG00000187608"; transcript_id "ENST00000624652"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "ISG15"; +chr1 havana transcript 1001145 1014435 0 + -1 gene_id "ENSG00000187608"; transcript_id "ENST00000624652"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "ISG15"; +chr1 havana exon 1001145 1001263 0 + -1 gene_id "ENSG00000187608"; transcript_id "ENST00000624652"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003755319"; gene_name "ISG15"; +chr1 havana exon 1008194 1008279 0 + -1 gene_id "ENSG00000187608"; transcript_id "ENST00000624652"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003755395"; gene_name "ISG15"; +chr1 havana five_prime_utr 1008194 1008279 0 + -1 gene_id "ENSG00000187608"; transcript_id "ENST00000624652"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "ISG15"; +chr1 ensembl_havana five_prime_utr 1013423 1013573 0 + -1 gene_id "ENSG00000187608"; transcript_id "ENST00000379389"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS6"; gene_name "ISG15"; +chr1 ensembl_havana exon 1013423 1013576 0 + -1 gene_id "ENSG00000187608"; transcript_id "ENST00000379389"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS6"; exon_id "ENSE00001480807"; gene_name "ISG15"; +chr1 ensembl_havana transcript 1013423 1014540 0 + -1 gene_id "ENSG00000187608"; transcript_id "ENST00000379389"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS6"; gene_name "ISG15"; +chr1 ensembl_havana CDS 1013574 1013576 0 + 0 gene_id "ENSG00000187608"; transcript_id "ENST00000379389"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS6"; protein_id "ENSP00000368699"; gene_name "ISG15"; +chr1 ensembl_havana start_codon 1013574 1013576 0 + 0 gene_id "ENSG00000187608"; transcript_id "ENST00000379389"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS6"; gene_name "ISG15"; +chr1 ensembl_havana exon 1013984 1014540 0 + -1 gene_id "ENSG00000187608"; transcript_id "ENST00000379389"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS6"; exon_id "ENSE00001480799"; gene_name "ISG15"; +chr1 havana exon 1013984 1014435 0 + -1 gene_id "ENSG00000187608"; transcript_id "ENST00000624652"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003756535"; gene_name "ISG15"; +chr1 havana five_prime_utr 1013984 1014004 0 + -1 gene_id "ENSG00000187608"; transcript_id "ENST00000624652"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "ISG15"; +chr1 ensembl_havana CDS 1013984 1014475 0 + 0 gene_id "ENSG00000187608"; transcript_id "ENST00000379389"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS6"; protein_id "ENSP00000368699"; gene_name "ISG15"; +chr1 havana start_codon 1014005 1014007 0 + 0 gene_id "ENSG00000187608"; transcript_id "ENST00000624652"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "ISG15"; +chr1 havana CDS 1014005 1014435 0 + 0 gene_id "ENSG00000187608"; transcript_id "ENST00000624652"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000485313"; gene_name "ISG15"; +chr1 ensembl_havana stop_codon 1014476 1014478 0 + 0 gene_id "ENSG00000187608"; transcript_id "ENST00000379389"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS6"; gene_name "ISG15"; +chr1 ensembl_havana three_prime_utr 1014479 1014540 0 + -1 gene_id "ENSG00000187608"; transcript_id "ENST00000379389"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS6"; gene_name "ISG15"; +chr1 havana transcript 2425980 2479804 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000609981"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PLCH2"; +chr1 havana exon 2425980 2426037 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000609981"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001648978"; gene_name "PLCH2"; +chr1 havana five_prime_utr 2425980 2426037 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000609981"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PLCH2"; +chr1 havana exon 2430338 2430629 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000609981"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001621165"; gene_name "PLCH2"; +chr1 havana five_prime_utr 2430338 2430514 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000609981"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PLCH2"; +chr1 havana start_codon 2430515 2430517 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000609981"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PLCH2"; +chr1 havana CDS 2430515 2430629 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000609981"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000476436"; gene_name "PLCH2"; +chr1 havana exon 2467459 2467662 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001780479"; gene_name "PLCH2"; +chr1 havana five_prime_utr 2467459 2467619 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PLCH2"; +chr1 havana transcript 2467459 2505526 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PLCH2"; +chr1 havana CDS 2467620 2467662 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 havana start_codon 2467620 2467622 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PLCH2"; +chr1 havana transcript 2476315 2505525 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PLCH2"; +chr1 havana five_prime_utr 2476315 2476588 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PLCH2"; +chr1 ensembl five_prime_utr 2476315 2476588 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; gene_name "PLCH2"; +chr1 ensembl exon 2476315 2476712 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00003473982"; gene_name "PLCH2"; +chr1 havana exon 2476315 2476712 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003473982"; gene_name "PLCH2"; +chr1 ensembl transcript 2476315 2505525 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; gene_name "PLCH2"; +chr1 havana CDS 2476589 2476712 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana start_codon 2476589 2476591 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PLCH2"; +chr1 ensembl start_codon 2476589 2476591 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; gene_name "PLCH2"; +chr1 ensembl CDS 2476589 2476712 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 havana CDS 2478476 2478622 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 havana CDS 2478476 2478622 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana exon 2478476 2478622 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003499259"; gene_name "PLCH2"; +chr1 havana exon 2478476 2478622 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000609981"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003499259"; gene_name "PLCH2"; +chr1 havana exon 2478476 2478622 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003499259"; gene_name "PLCH2"; +chr1 ensembl exon 2478476 2478622 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00003499259"; gene_name "PLCH2"; +chr1 ensembl CDS 2478476 2478622 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 havana CDS 2478476 2478622 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000609981"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000476436"; gene_name "PLCH2"; +chr1 havana transcript 2479090 2505530 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; gene_name "PLCH2"; +chr1 havana exon 2479090 2479978 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001477669"; gene_name "PLCH2"; +chr1 havana exon 2479734 2479804 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000609981"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001477672"; gene_name "PLCH2"; +chr1 havana exon 2479734 2479978 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001400676"; gene_name "PLCH2"; +chr1 ensembl exon 2479734 2479977 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00001477687"; gene_name "PLCH2"; +chr1 havana CDS 2479734 2479804 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000609981"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000476436"; gene_name "PLCH2"; +chr1 havana exon 2479734 2479978 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001400676"; gene_name "PLCH2"; +chr1 havana CDS 2479734 2479978 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana CDS 2479734 2479978 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 ensembl CDS 2479734 2479977 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 havana transcript 2479888 2505276 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PLCH2"; +chr1 havana exon 2479888 2479978 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001376863"; gene_name "PLCH2"; +chr1 havana CDS 2479888 2479978 0 + 1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000278878"; gene_name "PLCH2"; +chr1 ensembl CDS 2480183 2480312 0 + 1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 ensembl exon 2480183 2480312 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00001477685"; gene_name "PLCH2"; +chr1 havana exon 2480184 2480312 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003553212"; gene_name "PLCH2"; +chr1 havana exon 2480184 2480312 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003553212"; gene_name "PLCH2"; +chr1 havana CDS 2480184 2480312 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 havana CDS 2480184 2480312 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000278878"; gene_name "PLCH2"; +chr1 havana exon 2480184 2480312 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003470263"; gene_name "PLCH2"; +chr1 havana CDS 2480184 2480312 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana exon 2480184 2480312 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003553212"; gene_name "PLCH2"; +chr1 havana exon 2484448 2484618 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003472793"; gene_name "PLCH2"; +chr1 havana CDS 2484448 2484618 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana exon 2484448 2484618 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003472793"; gene_name "PLCH2"; +chr1 havana exon 2484448 2484618 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003647310"; gene_name "PLCH2"; +chr1 havana CDS 2484448 2484618 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000278878"; gene_name "PLCH2"; +chr1 havana exon 2484448 2484618 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003472793"; gene_name "PLCH2"; +chr1 ensembl exon 2484448 2484618 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00003472793"; gene_name "PLCH2"; +chr1 ensembl CDS 2484448 2484618 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 havana CDS 2484448 2484618 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 ensembl CDS 2486907 2487000 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 havana exon 2486907 2487000 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003465003"; gene_name "PLCH2"; +chr1 havana exon 2486907 2487000 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003465003"; gene_name "PLCH2"; +chr1 havana CDS 2486907 2487000 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000278878"; gene_name "PLCH2"; +chr1 ensembl exon 2486907 2487000 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00003465003"; gene_name "PLCH2"; +chr1 havana exon 2486907 2487000 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003649862"; gene_name "PLCH2"; +chr1 havana CDS 2486907 2487000 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana exon 2486907 2487000 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003465003"; gene_name "PLCH2"; +chr1 havana CDS 2486907 2487000 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 havana exon 2487173 2487376 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003688902"; gene_name "PLCH2"; +chr1 havana CDS 2487173 2487376 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 havana CDS 2487173 2487376 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000278878"; gene_name "PLCH2"; +chr1 havana exon 2487173 2487376 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003533538"; gene_name "PLCH2"; +chr1 havana exon 2487173 2487376 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003688902"; gene_name "PLCH2"; +chr1 havana CDS 2487173 2487376 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana exon 2487173 2487376 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003688902"; gene_name "PLCH2"; +chr1 ensembl exon 2487173 2487376 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00003688902"; gene_name "PLCH2"; +chr1 ensembl CDS 2487173 2487376 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 havana CDS 2487598 2487718 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 havana CDS 2487598 2487718 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana CDS 2487598 2487718 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000278878"; gene_name "PLCH2"; +chr1 havana exon 2487598 2487718 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003546186"; gene_name "PLCH2"; +chr1 havana exon 2487598 2487718 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003552203"; gene_name "PLCH2"; +chr1 havana exon 2487598 2487718 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003552203"; gene_name "PLCH2"; +chr1 ensembl CDS 2487598 2487718 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 ensembl exon 2487598 2487718 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00003552203"; gene_name "PLCH2"; +chr1 havana exon 2487598 2487718 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003552203"; gene_name "PLCH2"; +chr1 ensembl exon 2489207 2489378 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00003472855"; gene_name "PLCH2"; +chr1 havana exon 2489207 2489378 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003472855"; gene_name "PLCH2"; +chr1 havana exon 2489207 2489378 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003472855"; gene_name "PLCH2"; +chr1 havana CDS 2489207 2489378 0 + 1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 ensembl CDS 2489207 2489378 0 + 1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 havana CDS 2489207 2489378 0 + 1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 havana exon 2489207 2489378 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003605114"; gene_name "PLCH2"; +chr1 havana exon 2489207 2489378 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003472855"; gene_name "PLCH2"; +chr1 havana CDS 2489207 2489378 0 + 1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000278878"; gene_name "PLCH2"; +chr1 havana exon 2489760 2489867 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003517403"; gene_name "PLCH2"; +chr1 havana CDS 2489760 2489867 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000278878"; gene_name "PLCH2"; +chr1 havana exon 2489760 2489867 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003517403"; gene_name "PLCH2"; +chr1 ensembl CDS 2489760 2489867 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 ensembl exon 2489760 2489867 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00003517403"; gene_name "PLCH2"; +chr1 havana CDS 2489760 2489867 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana exon 2489760 2489867 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003517403"; gene_name "PLCH2"; +chr1 havana CDS 2489760 2489867 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 havana exon 2489760 2489867 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003655153"; gene_name "PLCH2"; +chr1 havana exon 2491192 2491335 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003582994"; gene_name "PLCH2"; +chr1 ensembl CDS 2491192 2491335 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 havana CDS 2491192 2491335 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 havana CDS 2491192 2491335 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana exon 2491192 2491335 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003582994"; gene_name "PLCH2"; +chr1 havana exon 2491192 2491335 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003582994"; gene_name "PLCH2"; +chr1 havana CDS 2491192 2491335 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000278878"; gene_name "PLCH2"; +chr1 havana exon 2491192 2491335 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003543912"; gene_name "PLCH2"; +chr1 ensembl exon 2491192 2491335 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00003582994"; gene_name "PLCH2"; +chr1 havana CDS 2494856 2494948 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000278878"; gene_name "PLCH2"; +chr1 ensembl exon 2494856 2494948 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00003684947"; gene_name "PLCH2"; +chr1 ensembl CDS 2494856 2494948 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 havana exon 2494856 2494948 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003557083"; gene_name "PLCH2"; +chr1 havana CDS 2494856 2494948 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 havana exon 2494856 2494948 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003684947"; gene_name "PLCH2"; +chr1 havana exon 2494856 2494948 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003684947"; gene_name "PLCH2"; +chr1 havana exon 2494856 2494948 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003684947"; gene_name "PLCH2"; +chr1 havana CDS 2494856 2494948 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana CDS 2495488 2495570 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana exon 2495488 2495570 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003535221"; gene_name "PLCH2"; +chr1 havana exon 2495488 2495570 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003534549"; gene_name "PLCH2"; +chr1 ensembl CDS 2495488 2495570 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 havana exon 2495488 2495570 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003535221"; gene_name "PLCH2"; +chr1 havana CDS 2495488 2495570 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 ensembl exon 2495488 2495570 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00003535221"; gene_name "PLCH2"; +chr1 havana CDS 2495488 2495570 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000278878"; gene_name "PLCH2"; +chr1 havana exon 2495488 2495570 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003535221"; gene_name "PLCH2"; +chr1 havana CDS 2496607 2496704 0 + 1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 havana exon 2496607 2496704 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003559057"; gene_name "PLCH2"; +chr1 havana exon 2496607 2496704 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003559057"; gene_name "PLCH2"; +chr1 havana CDS 2496607 2496704 0 + 1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 ensembl exon 2496607 2496704 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00003559057"; gene_name "PLCH2"; +chr1 ensembl CDS 2496607 2496704 0 + 1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 havana CDS 2496607 2496704 0 + 1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000278878"; gene_name "PLCH2"; +chr1 havana exon 2496607 2496704 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003559057"; gene_name "PLCH2"; +chr1 havana exon 2496607 2496704 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003650873"; gene_name "PLCH2"; +chr1 ensembl exon 2496828 2497010 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00003516954"; gene_name "PLCH2"; +chr1 havana exon 2496828 2497010 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003534507"; gene_name "PLCH2"; +chr1 havana CDS 2496828 2497010 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000278878"; gene_name "PLCH2"; +chr1 ensembl CDS 2496828 2497010 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 havana exon 2496828 2497010 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003516954"; gene_name "PLCH2"; +chr1 havana CDS 2496828 2497010 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana exon 2496828 2497010 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003516954"; gene_name "PLCH2"; +chr1 havana exon 2496828 2497010 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003516954"; gene_name "PLCH2"; +chr1 havana CDS 2496828 2497010 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 havana exon 2497502 2497609 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003616922"; gene_name "PLCH2"; +chr1 havana CDS 2497502 2497609 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 ensembl CDS 2497502 2497609 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 havana exon 2497502 2497609 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003591218"; gene_name "PLCH2"; +chr1 ensembl exon 2497502 2497609 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00003616922"; gene_name "PLCH2"; +chr1 havana exon 2497502 2497609 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003616922"; gene_name "PLCH2"; +chr1 havana CDS 2497502 2497609 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana exon 2497782 2498647 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000473964"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001940753"; gene_name "PLCH2"; +chr1 havana transcript 2497782 2505528 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000473964"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; gene_name "PLCH2"; +chr1 havana CDS 2498523 2498647 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000278878"; gene_name "PLCH2"; +chr1 havana exon 2498523 2498647 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003653363"; gene_name "PLCH2"; +chr1 havana CDS 2498523 2498647 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana CDS 2498523 2498647 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 havana exon 2498523 2498647 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003653363"; gene_name "PLCH2"; +chr1 havana exon 2498523 2498647 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003541907"; gene_name "PLCH2"; +chr1 havana exon 2498523 2498647 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003653363"; gene_name "PLCH2"; +chr1 ensembl exon 2498523 2498647 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00003653363"; gene_name "PLCH2"; +chr1 ensembl CDS 2498523 2498647 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 havana exon 2498647 2498828 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000462379"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001923708"; gene_name "PLCH2"; +chr1 havana transcript 2498647 2505528 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000462379"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; gene_name "PLCH2"; +chr1 havana CDS 2498744 2498828 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000278878"; gene_name "PLCH2"; +chr1 havana exon 2498744 2498828 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003492751"; gene_name "PLCH2"; +chr1 havana CDS 2498744 2498828 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 havana exon 2498744 2498828 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003466854"; gene_name "PLCH2"; +chr1 havana exon 2498744 2498828 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003492751"; gene_name "PLCH2"; +chr1 havana CDS 2498744 2498828 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana exon 2498744 2498828 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000473964"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003466854"; gene_name "PLCH2"; +chr1 ensembl CDS 2498744 2498828 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 havana exon 2498744 2498828 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003492751"; gene_name "PLCH2"; +chr1 ensembl exon 2498744 2498828 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00003492751"; gene_name "PLCH2"; +chr1 ensembl CDS 2499084 2499230 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 havana exon 2499084 2499230 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000473964"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003571083"; gene_name "PLCH2"; +chr1 havana exon 2499084 2499230 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000462379"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003571083"; gene_name "PLCH2"; +chr1 havana CDS 2499084 2499230 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 havana exon 2499084 2499230 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003685158"; gene_name "PLCH2"; +chr1 ensembl exon 2499084 2499230 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00003685158"; gene_name "PLCH2"; +chr1 havana CDS 2499084 2499230 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000278878"; gene_name "PLCH2"; +chr1 havana exon 2499084 2499230 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003685158"; gene_name "PLCH2"; +chr1 havana exon 2499084 2499230 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003571083"; gene_name "PLCH2"; +chr1 havana CDS 2499084 2499230 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana exon 2499084 2499230 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003685158"; gene_name "PLCH2"; +chr1 havana exon 2499641 2499720 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003658295"; gene_name "PLCH2"; +chr1 havana exon 2499641 2499720 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003658295"; gene_name "PLCH2"; +chr1 havana CDS 2499641 2499720 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000278878"; gene_name "PLCH2"; +chr1 havana exon 2499641 2505528 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000473964"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001826643"; gene_name "PLCH2"; +chr1 ensembl exon 2499641 2499720 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00003658295"; gene_name "PLCH2"; +chr1 havana CDS 2499641 2499720 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana exon 2499641 2499720 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000462379"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003609797"; gene_name "PLCH2"; +chr1 havana exon 2499641 2499720 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003658295"; gene_name "PLCH2"; +chr1 havana CDS 2499641 2499720 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 ensembl CDS 2499641 2499720 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 havana exon 2499641 2499720 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003609797"; gene_name "PLCH2"; +chr1 havana exon 2502112 2502409 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003596489"; gene_name "PLCH2"; +chr1 havana exon 2502112 2505530 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000343889"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001432737"; gene_name "PLCH2"; +chr1 havana CDS 2502112 2502910 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 havana exon 2502112 2502910 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001697293"; gene_name "PLCH2"; +chr1 havana CDS 2502112 2502409 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000278878"; gene_name "PLCH2"; +chr1 havana CDS 2502112 2502409 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana exon 2502112 2502409 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000462379"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003540997"; gene_name "PLCH2"; +chr1 havana exon 2502112 2502409 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003596489"; gene_name "PLCH2"; +chr1 ensembl exon 2502112 2502409 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00003596489"; gene_name "PLCH2"; +chr1 ensembl CDS 2502112 2502409 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 havana CDS 2503617 2503624 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000397289"; gene_name "PLCH2"; +chr1 havana exon 2503617 2505526 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001701479"; gene_name "PLCH2"; +chr1 havana exon 2503617 2503643 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000462379"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001834994"; gene_name "PLCH2"; +chr1 havana stop_codon 2503625 2503627 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PLCH2"; +chr1 havana three_prime_utr 2503628 2505526 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000449969"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PLCH2"; +chr1 havana exon 2503922 2505528 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000462379"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00001887073"; gene_name "PLCH2"; +chr1 havana exon 2503922 2505276 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001783927"; gene_name "PLCH2"; +chr1 havana CDS 2503922 2505210 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000278878"; gene_name "PLCH2"; +chr1 havana exon 2503922 2505525 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001420069"; gene_name "PLCH2"; +chr1 ensembl CDS 2503922 2505210 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; protein_id "ENSP00000367747"; gene_name "PLCH2"; +chr1 ensembl exon 2503922 2505525 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; exon_id "ENSE00001420069"; gene_name "PLCH2"; +chr1 havana CDS 2503922 2505210 0 + 2 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000389803"; gene_name "PLCH2"; +chr1 havana stop_codon 2505211 2505213 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PLCH2"; +chr1 havana stop_codon 2505211 2505213 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PLCH2"; +chr1 ensembl stop_codon 2505211 2505213 0 + 0 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; gene_name "PLCH2"; +chr1 havana three_prime_utr 2505214 2505525 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000419816"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PLCH2"; +chr1 ensembl three_prime_utr 2505214 2505525 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000378486"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS59959"; gene_name "PLCH2"; +chr1 havana three_prime_utr 2505214 2505276 0 + -1 gene_id "ENSG00000149527"; transcript_id "ENST00000278878"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PLCH2"; +chr1 havana transcript 3069168 3434342 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PRDM16"; +chr1 havana exon 3069168 3069296 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00002048533"; gene_name "PRDM16"; +chr1 havana five_prime_utr 3069168 3069259 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PRDM16"; +chr1 havana transcript 3069183 3186591 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000607632"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; gene_name "PRDM16"; +chr1 havana exon 3069183 3069296 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000607632"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003700259"; gene_name "PRDM16"; +chr1 havana transcript 3069197 3435421 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; gene_name "PRDM16"; +chr1 havana exon 3069197 3069296 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; exon_id "ENSE00001222906"; gene_name "PRDM16"; +chr1 havana five_prime_utr 3069197 3069259 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; gene_name "PRDM16"; +chr1 havana transcript 3069211 3434342 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PRDM16"; +chr1 havana five_prime_utr 3069211 3069259 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PRDM16"; +chr1 ensembl_havana transcript 3069211 3438621 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; gene_name "PRDM16"; +chr1 ensembl_havana exon 3069211 3069296 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; exon_id "ENSE00001598723"; gene_name "PRDM16"; +chr1 ensembl_havana five_prime_utr 3069211 3069259 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; gene_name "PRDM16"; +chr1 havana exon 3069211 3069296 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001598723"; gene_name "PRDM16"; +chr1 havana start_codon 3069260 3069262 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; gene_name "PRDM16"; +chr1 havana CDS 3069260 3069296 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; protein_id "ENSP00000367643"; gene_name "PRDM16"; +chr1 ensembl_havana start_codon 3069260 3069262 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; gene_name "PRDM16"; +chr1 havana CDS 3069260 3069296 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000421400"; gene_name "PRDM16"; +chr1 havana start_codon 3069260 3069262 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PRDM16"; +chr1 ensembl_havana CDS 3069260 3069296 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; protein_id "ENSP00000270722"; gene_name "PRDM16"; +chr1 havana CDS 3069260 3069296 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000426975"; gene_name "PRDM16"; +chr1 havana start_codon 3069260 3069262 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PRDM16"; +chr1 havana exon 3186125 3186591 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000607632"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003695128"; gene_name "PRDM16"; +chr1 havana exon 3186125 3186474 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001754112"; gene_name "PRDM16"; +chr1 havana CDS 3186125 3186474 0 + 2 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; protein_id "ENSP00000367643"; gene_name "PRDM16"; +chr1 havana exon 3186125 3186474 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; exon_id "ENSE00001754112"; gene_name "PRDM16"; +chr1 ensembl_havana CDS 3186125 3186474 0 + 2 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; protein_id "ENSP00000270722"; gene_name "PRDM16"; +chr1 ensembl_havana exon 3186125 3186474 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; exon_id "ENSE00001754112"; gene_name "PRDM16"; +chr1 havana CDS 3186125 3186474 0 + 2 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000421400"; gene_name "PRDM16"; +chr1 havana CDS 3186125 3186474 0 + 2 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000426975"; gene_name "PRDM16"; +chr1 havana exon 3186125 3186474 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001754112"; gene_name "PRDM16"; +chr1 havana exon 3237931 3238095 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000512462"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00002087812"; gene_name "PRDM16"; +chr1 havana transcript 3237931 3433925 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000512462"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; gene_name "PRDM16"; +chr1 havana exon 3244087 3244137 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003480863"; gene_name "PRDM16"; +chr1 havana CDS 3244087 3244137 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000421400"; gene_name "PRDM16"; +chr1 havana exon 3244087 3244137 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000512462"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003516886"; gene_name "PRDM16"; +chr1 havana exon 3244087 3244137 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003480863"; gene_name "PRDM16"; +chr1 havana CDS 3244087 3244137 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000426975"; gene_name "PRDM16"; +chr1 havana CDS 3244087 3244137 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; protein_id "ENSP00000367643"; gene_name "PRDM16"; +chr1 havana exon 3244087 3244137 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; exon_id "ENSE00003480863"; gene_name "PRDM16"; +chr1 ensembl_havana exon 3244087 3244137 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; exon_id "ENSE00003480863"; gene_name "PRDM16"; +chr1 ensembl_havana CDS 3244087 3244137 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; protein_id "ENSP00000270722"; gene_name "PRDM16"; +chr1 havana CDS 3244132 3244137 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000463591"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000476002"; gene_name "PRDM16"; +chr1 havana transcript 3244132 3386918 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000463591"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PRDM16"; +chr1 havana exon 3244132 3244137 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000463591"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001882136"; gene_name "PRDM16"; +chr1 havana CDS 3385149 3385286 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000426975"; gene_name "PRDM16"; +chr1 havana exon 3385149 3385286 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00002034212"; gene_name "PRDM16"; +chr1 havana exon 3385149 3385286 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00002034212"; gene_name "PRDM16"; +chr1 havana CDS 3385149 3385286 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000421400"; gene_name "PRDM16"; +chr1 havana CDS 3385152 3385286 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; protein_id "ENSP00000367643"; gene_name "PRDM16"; +chr1 havana exon 3385152 3385286 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000463591"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003695725"; gene_name "PRDM16"; +chr1 havana CDS 3385152 3385286 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000463591"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000476002"; gene_name "PRDM16"; +chr1 ensembl_havana exon 3385152 3385286 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; exon_id "ENSE00003695725"; gene_name "PRDM16"; +chr1 ensembl_havana CDS 3385152 3385286 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; protein_id "ENSP00000270722"; gene_name "PRDM16"; +chr1 havana exon 3385152 3385286 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000512462"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003662380"; gene_name "PRDM16"; +chr1 havana exon 3385152 3385286 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; exon_id "ENSE00003695725"; gene_name "PRDM16"; +chr1 havana CDS 3386676 3386693 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000463591"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000476002"; gene_name "PRDM16"; +chr1 havana exon 3386676 3386918 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000463591"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001846205"; gene_name "PRDM16"; +chr1 havana stop_codon 3386694 3386696 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000463591"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PRDM16"; +chr1 havana three_prime_utr 3386697 3386918 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000463591"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PRDM16"; +chr1 havana CDS 3396491 3396593 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000425796"; gene_name "PRDM16"; +chr1 havana exon 3396491 3396593 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000512462"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003697266"; gene_name "PRDM16"; +chr1 ensembl_havana CDS 3396491 3396593 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; protein_id "ENSP00000270722"; gene_name "PRDM16"; +chr1 havana CDS 3396491 3396593 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; protein_id "ENSP00000367643"; gene_name "PRDM16"; +chr1 havana exon 3396491 3396593 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; exon_id "ENSE00003700221"; gene_name "PRDM16"; +chr1 havana CDS 3396491 3396593 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000426975"; gene_name "PRDM16"; +chr1 havana exon 3396491 3396593 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003700221"; gene_name "PRDM16"; +chr1 ensembl_havana exon 3396491 3396593 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; exon_id "ENSE00003700221"; gene_name "PRDM16"; +chr1 havana exon 3396491 3396593 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003700221"; gene_name "PRDM16"; +chr1 havana CDS 3396491 3396593 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000421400"; gene_name "PRDM16"; +chr1 havana transcript 3396491 3434293 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PRDM16"; +chr1 havana exon 3396491 3396593 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003700221"; gene_name "PRDM16"; +chr1 havana exon 3402791 3402998 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003696962"; gene_name "PRDM16"; +chr1 havana exon 3402791 3402998 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003696962"; gene_name "PRDM16"; +chr1 havana CDS 3402791 3402998 0 + 2 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000425796"; gene_name "PRDM16"; +chr1 havana exon 3402791 3402998 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000512462"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003701239"; gene_name "PRDM16"; +chr1 havana exon 3402791 3402998 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003696962"; gene_name "PRDM16"; +chr1 havana CDS 3402791 3402998 0 + 2 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000426975"; gene_name "PRDM16"; +chr1 havana exon 3402791 3402998 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; exon_id "ENSE00003696962"; gene_name "PRDM16"; +chr1 havana CDS 3402791 3402998 0 + 2 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; protein_id "ENSP00000367643"; gene_name "PRDM16"; +chr1 havana CDS 3402791 3402998 0 + 2 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000421400"; gene_name "PRDM16"; +chr1 ensembl_havana exon 3402791 3402998 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; exon_id "ENSE00003696962"; gene_name "PRDM16"; +chr1 ensembl_havana CDS 3402791 3402998 0 + 2 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; protein_id "ENSP00000270722"; gene_name "PRDM16"; +chr1 ensembl_havana exon 3404739 3404886 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; exon_id "ENSE00003700688"; gene_name "PRDM16"; +chr1 ensembl_havana CDS 3404739 3404886 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; protein_id "ENSP00000270722"; gene_name "PRDM16"; +chr1 havana exon 3404739 3404886 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; exon_id "ENSE00003700688"; gene_name "PRDM16"; +chr1 havana CDS 3404739 3404886 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000425796"; gene_name "PRDM16"; +chr1 havana CDS 3404739 3404886 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000426975"; gene_name "PRDM16"; +chr1 havana CDS 3404739 3404886 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000421400"; gene_name "PRDM16"; +chr1 havana exon 3404739 3404886 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003700688"; gene_name "PRDM16"; +chr1 havana exon 3404739 3404886 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003700688"; gene_name "PRDM16"; +chr1 havana CDS 3404739 3404886 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; protein_id "ENSP00000367643"; gene_name "PRDM16"; +chr1 havana exon 3404739 3404886 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000512462"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003700436"; gene_name "PRDM16"; +chr1 havana exon 3404739 3404886 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003700688"; gene_name "PRDM16"; +chr1 havana exon 3405495 3405648 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003700645"; gene_name "PRDM16"; +chr1 havana exon 3405495 3405648 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003700645"; gene_name "PRDM16"; +chr1 havana CDS 3405495 3405648 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000421400"; gene_name "PRDM16"; +chr1 havana CDS 3405495 3405648 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; protein_id "ENSP00000367643"; gene_name "PRDM16"; +chr1 havana exon 3405495 3405648 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; exon_id "ENSE00003700645"; gene_name "PRDM16"; +chr1 ensembl_havana exon 3405495 3405648 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; exon_id "ENSE00003700645"; gene_name "PRDM16"; +chr1 havana exon 3405495 3405648 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000512462"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003695760"; gene_name "PRDM16"; +chr1 havana exon 3405495 3405648 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003700645"; gene_name "PRDM16"; +chr1 havana CDS 3405495 3405648 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000426975"; gene_name "PRDM16"; +chr1 ensembl_havana CDS 3405495 3405648 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; protein_id "ENSP00000270722"; gene_name "PRDM16"; +chr1 havana CDS 3405495 3405648 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000425796"; gene_name "PRDM16"; +chr1 ensembl_havana CDS 3411384 3412800 0 + 2 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; protein_id "ENSP00000270722"; gene_name "PRDM16"; +chr1 ensembl_havana exon 3411384 3412800 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; exon_id "ENSE00003695658"; gene_name "PRDM16"; +chr1 havana CDS 3411384 3412800 0 + 2 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000426975"; gene_name "PRDM16"; +chr1 havana exon 3411384 3412800 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003695658"; gene_name "PRDM16"; +chr1 havana CDS 3411384 3412800 0 + 2 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000425796"; gene_name "PRDM16"; +chr1 havana exon 3411384 3412800 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003695658"; gene_name "PRDM16"; +chr1 havana exon 3411384 3412800 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000512462"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003699089"; gene_name "PRDM16"; +chr1 havana CDS 3411384 3412800 0 + 2 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000421400"; gene_name "PRDM16"; +chr1 havana exon 3411384 3412800 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003695658"; gene_name "PRDM16"; +chr1 havana exon 3411384 3412800 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; exon_id "ENSE00003695658"; gene_name "PRDM16"; +chr1 havana CDS 3411384 3412800 0 + 2 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; protein_id "ENSP00000367643"; gene_name "PRDM16"; +chr1 havana exon 3414560 3414647 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000512462"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003702178"; gene_name "PRDM16"; +chr1 havana exon 3414560 3414647 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003701451"; gene_name "PRDM16"; +chr1 ensembl_havana exon 3414560 3414647 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; exon_id "ENSE00003701451"; gene_name "PRDM16"; +chr1 havana CDS 3414560 3414647 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000426975"; gene_name "PRDM16"; +chr1 ensembl_havana CDS 3414560 3414647 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; protein_id "ENSP00000270722"; gene_name "PRDM16"; +chr1 havana CDS 3414560 3414647 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; protein_id "ENSP00000367643"; gene_name "PRDM16"; +chr1 havana exon 3414560 3414647 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; exon_id "ENSE00003701451"; gene_name "PRDM16"; +chr1 havana exon 3414563 3414647 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001582537"; gene_name "PRDM16"; +chr1 havana CDS 3414563 3414647 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000421400"; gene_name "PRDM16"; +chr1 havana exon 3414563 3414647 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001582537"; gene_name "PRDM16"; +chr1 havana CDS 3414563 3414647 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000425796"; gene_name "PRDM16"; +chr1 havana exon 3417828 3417997 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; exon_id "ENSE00003699052"; gene_name "PRDM16"; +chr1 havana CDS 3417828 3417997 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; protein_id "ENSP00000367643"; gene_name "PRDM16"; +chr1 havana exon 3417828 3417997 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003699052"; gene_name "PRDM16"; +chr1 havana exon 3417828 3417997 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003699052"; gene_name "PRDM16"; +chr1 havana CDS 3417828 3417997 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000426975"; gene_name "PRDM16"; +chr1 havana exon 3417828 3417997 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003699052"; gene_name "PRDM16"; +chr1 havana CDS 3417828 3417997 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000425796"; gene_name "PRDM16"; +chr1 ensembl_havana CDS 3417828 3417997 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; protein_id "ENSP00000270722"; gene_name "PRDM16"; +chr1 ensembl_havana exon 3417828 3417997 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; exon_id "ENSE00003699052"; gene_name "PRDM16"; +chr1 havana CDS 3417828 3417997 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000421400"; gene_name "PRDM16"; +chr1 havana exon 3417828 3417997 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000512462"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003701293"; gene_name "PRDM16"; +chr1 ensembl_havana CDS 3418667 3418744 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; protein_id "ENSP00000270722"; gene_name "PRDM16"; +chr1 havana exon 3418667 3418744 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000512462"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003697785"; gene_name "PRDM16"; +chr1 ensembl_havana exon 3418667 3418744 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; exon_id "ENSE00003698430"; gene_name "PRDM16"; +chr1 havana CDS 3418667 3418744 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; protein_id "ENSP00000367643"; gene_name "PRDM16"; +chr1 havana exon 3418667 3418744 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; exon_id "ENSE00003698430"; gene_name "PRDM16"; +chr1 havana exon 3418667 3418744 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003698430"; gene_name "PRDM16"; +chr1 havana exon 3418667 3418744 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003698430"; gene_name "PRDM16"; +chr1 havana CDS 3418667 3418744 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000421400"; gene_name "PRDM16"; +chr1 havana CDS 3418667 3418744 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000425796"; gene_name "PRDM16"; +chr1 havana exon 3418667 3418744 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003698430"; gene_name "PRDM16"; +chr1 havana CDS 3418667 3418744 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000426975"; gene_name "PRDM16"; +chr1 havana transcript 3424919 3434095 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378389"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; gene_name "PRDM16"; +chr1 havana exon 3424919 3425059 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378389"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001905893"; gene_name "PRDM16"; +chr1 havana exon 3425216 3425750 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000606170"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003697875"; gene_name "PRDM16"; +chr1 havana transcript 3425216 3426072 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000606170"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; gene_name "PRDM16"; +chr1 havana exon 3425581 3425750 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003699796"; gene_name "PRDM16"; +chr1 havana exon 3425581 3425750 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; exon_id "ENSE00003699796"; gene_name "PRDM16"; +chr1 havana CDS 3425581 3425750 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000425796"; gene_name "PRDM16"; +chr1 havana exon 3425581 3425750 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003699796"; gene_name "PRDM16"; +chr1 havana CDS 3425581 3425750 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000426975"; gene_name "PRDM16"; +chr1 havana exon 3425581 3425750 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000512462"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003701636"; gene_name "PRDM16"; +chr1 havana exon 3425581 3425750 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378389"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003701636"; gene_name "PRDM16"; +chr1 ensembl_havana CDS 3425581 3425750 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; protein_id "ENSP00000270722"; gene_name "PRDM16"; +chr1 havana CDS 3425581 3425750 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; protein_id "ENSP00000367643"; gene_name "PRDM16"; +chr1 ensembl_havana exon 3425581 3425750 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; exon_id "ENSE00003699796"; gene_name "PRDM16"; +chr1 havana exon 3425581 3425750 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003699796"; gene_name "PRDM16"; +chr1 havana CDS 3425581 3425750 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000421400"; gene_name "PRDM16"; +chr1 havana exon 3426051 3426225 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; exon_id "ENSE00003701891"; gene_name "PRDM16"; +chr1 ensembl_havana exon 3426051 3426225 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; exon_id "ENSE00003701891"; gene_name "PRDM16"; +chr1 havana exon 3426051 3426225 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003701891"; gene_name "PRDM16"; +chr1 havana exon 3426051 3426225 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000512462"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003696062"; gene_name "PRDM16"; +chr1 havana exon 3426051 3426072 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000606170"; gene_biotype "protein_coding"; transcript_biotype "retained_intron"; exon_id "ENSE00003700534"; gene_name "PRDM16"; +chr1 havana exon 3426051 3426225 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378389"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003696062"; gene_name "PRDM16"; +chr1 havana exon 3426051 3426225 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003701891"; gene_name "PRDM16"; +chr1 havana CDS 3426051 3426225 0 + 2 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000421400"; gene_name "PRDM16"; +chr1 havana CDS 3426051 3426225 0 + 2 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; protein_id "ENSP00000367643"; gene_name "PRDM16"; +chr1 havana CDS 3426051 3426225 0 + 2 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000425796"; gene_name "PRDM16"; +chr1 havana CDS 3426051 3426225 0 + 2 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000426975"; gene_name "PRDM16"; +chr1 havana exon 3426051 3426225 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003701891"; gene_name "PRDM16"; +chr1 ensembl_havana CDS 3426051 3426225 0 + 2 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; protein_id "ENSP00000270722"; gene_name "PRDM16"; +chr1 havana exon 3430872 3431108 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003698226"; gene_name "PRDM16"; +chr1 ensembl_havana exon 3430872 3431108 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; exon_id "ENSE00003698226"; gene_name "PRDM16"; +chr1 ensembl_havana CDS 3430872 3431108 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; protein_id "ENSP00000270722"; gene_name "PRDM16"; +chr1 havana exon 3430872 3431108 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003698226"; gene_name "PRDM16"; +chr1 havana exon 3430872 3431108 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; exon_id "ENSE00003698226"; gene_name "PRDM16"; +chr1 havana CDS 3430872 3431108 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000421400"; gene_name "PRDM16"; +chr1 havana exon 3430872 3431108 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003698226"; gene_name "PRDM16"; +chr1 havana CDS 3430872 3431108 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000425796"; gene_name "PRDM16"; +chr1 havana exon 3430872 3431108 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378389"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003697832"; gene_name "PRDM16"; +chr1 havana exon 3430872 3431108 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000512462"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003697832"; gene_name "PRDM16"; +chr1 havana CDS 3430872 3431108 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000426975"; gene_name "PRDM16"; +chr1 havana CDS 3430872 3431108 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; protein_id "ENSP00000367643"; gene_name "PRDM16"; +chr1 havana exon 3431966 3432140 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00003700833"; gene_name "PRDM16"; +chr1 havana CDS 3431966 3432140 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; protein_id "ENSP00000367643"; gene_name "PRDM16"; +chr1 havana exon 3431966 3432140 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; exon_id "ENSE00003700833"; gene_name "PRDM16"; +chr1 havana exon 3431966 3432140 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000512462"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00003698886"; gene_name "PRDM16"; +chr1 havana CDS 3431966 3432140 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000425796"; gene_name "PRDM16"; +chr1 ensembl_havana CDS 3431966 3432140 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; protein_id "ENSP00000270722"; gene_name "PRDM16"; +chr1 ensembl_havana exon 3431966 3432140 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; exon_id "ENSE00003700833"; gene_name "PRDM16"; +chr1 havana exon 3433677 3434342 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00002081080"; gene_name "PRDM16"; +chr1 havana exon 3433677 3433925 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000512462"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00002068021"; gene_name "PRDM16"; +chr1 havana CDS 3433677 3433686 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000426975"; gene_name "PRDM16"; +chr1 ensembl_havana CDS 3433677 3433808 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; protein_id "ENSP00000270722"; gene_name "PRDM16"; +chr1 havana CDS 3433677 3433808 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000425796"; gene_name "PRDM16"; +chr1 havana CDS 3433677 3433686 0 + 1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; protein_id "ENSP00000421400"; gene_name "PRDM16"; +chr1 ensembl_havana exon 3433677 3438621 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; exon_id "ENSE00001759023"; gene_name "PRDM16"; +chr1 havana exon 3433677 3434095 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378389"; gene_biotype "protein_coding"; transcript_biotype "processed_transcript"; exon_id "ENSE00001875784"; gene_name "PRDM16"; +chr1 havana exon 3433677 3434342 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00002081080"; gene_name "PRDM16"; +chr1 havana exon 3433677 3434293 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; exon_id "ENSE00001477317"; gene_name "PRDM16"; +chr1 havana stop_codon 3433687 3433689 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PRDM16"; +chr1 havana stop_codon 3433687 3433689 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PRDM16"; +chr1 havana three_prime_utr 3433690 3434342 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000511072"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PRDM16"; +chr1 havana three_prime_utr 3433690 3434342 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000514189"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PRDM16"; +chr1 havana exon 3433734 3435421 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; exon_id "ENSE00001477303"; gene_name "PRDM16"; +chr1 havana CDS 3433734 3433808 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; protein_id "ENSP00000367643"; gene_name "PRDM16"; +chr1 ensembl_havana stop_codon 3433809 3433811 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; gene_name "PRDM16"; +chr1 havana stop_codon 3433809 3433811 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PRDM16"; +chr1 havana stop_codon 3433809 3433811 0 + 0 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; gene_name "PRDM16"; +chr1 havana three_prime_utr 3433812 3434293 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000509860"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; gene_name "PRDM16"; +chr1 ensembl_havana three_prime_utr 3433812 3438621 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000270722"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS41236"; gene_name "PRDM16"; +chr1 havana three_prime_utr 3433812 3435421 0 + -1 gene_id "ENSG00000142611"; transcript_id "ENST00000378391"; gene_biotype "protein_coding"; transcript_biotype "protein_coding"; ccds_id "CCDS44048"; gene_name "PRDM16"; diff --git a/pygtftk/data/mini_real_10M/ids_plus.txt b/pygtftk/data/mini_real_10M/ids_plus.txt new file mode 100644 index 00000000..a730067e --- /dev/null +++ b/pygtftk/data/mini_real_10M/ids_plus.txt @@ -0,0 +1,21 @@ +ENST00000624697 +ENST00000624652 +ENST00000379389 +ENST00000609981 +ENST00000449969 +ENST00000419816 +ENST00000378486 +ENST00000343889 +ENST00000278878 +ENST00000473964 +ENST00000462379 +ENST00000511072 +ENST00000607632 +ENST00000378391 +ENST00000514189 +ENST00000270722 +ENST00000512462 +ENST00000463591 +ENST00000509860 +ENST00000378389 +ENST00000606170 diff --git a/pygtftk/data/mini_real_10M/ids_plus_exon.txt b/pygtftk/data/mini_real_10M/ids_plus_exon.txt new file mode 100644 index 00000000..1d99501e --- /dev/null +++ b/pygtftk/data/mini_real_10M/ids_plus_exon.txt @@ -0,0 +1,111 @@ +ENSE00003759395 +ENSE00003755319 +ENSE00003755395 +ENSE00001480807 +ENSE00001480799 +ENSE00003756535 +ENSE00001648978 +ENSE00001621165 +ENSE00001780479 +ENSE00003473982 +ENSE00003499259 +ENSE00001477669 +ENSE00001477672 +ENSE00001400676 +ENSE00001477687 +ENSE00001376863 +ENSE00001477685 +ENSE00003553212 +ENSE00003470263 +ENSE00003472793 +ENSE00003647310 +ENSE00003465003 +ENSE00003649862 +ENSE00003688902 +ENSE00003533538 +ENSE00003546186 +ENSE00003552203 +ENSE00003472855 +ENSE00003605114 +ENSE00003517403 +ENSE00003655153 +ENSE00003582994 +ENSE00003543912 +ENSE00003684947 +ENSE00003557083 +ENSE00003535221 +ENSE00003534549 +ENSE00003559057 +ENSE00003650873 +ENSE00003516954 +ENSE00003534507 +ENSE00003616922 +ENSE00003591218 +ENSE00001940753 +ENSE00003653363 +ENSE00003541907 +ENSE00001923708 +ENSE00003492751 +ENSE00003466854 +ENSE00003571083 +ENSE00003685158 +ENSE00003658295 +ENSE00001826643 +ENSE00003609797 +ENSE00003596489 +ENSE00001432737 +ENSE00001697293 +ENSE00003540997 +ENSE00001701479 +ENSE00001834994 +ENSE00001887073 +ENSE00001783927 +ENSE00001420069 +ENSE00002048533 +ENSE00003700259 +ENSE00001222906 +ENSE00001598723 +ENSE00003695128 +ENSE00001754112 +ENSE00002087812 +ENSE00003480863 +ENSE00003516886 +ENSE00001882136 +ENSE00002034212 +ENSE00003695725 +ENSE00003662380 +ENSE00001846205 +ENSE00003697266 +ENSE00003700221 +ENSE00003696962 +ENSE00003701239 +ENSE00003700688 +ENSE00003700436 +ENSE00003700645 +ENSE00003695760 +ENSE00003695658 +ENSE00003699089 +ENSE00003702178 +ENSE00003701451 +ENSE00001582537 +ENSE00003699052 +ENSE00003701293 +ENSE00003697785 +ENSE00003698430 +ENSE00001905893 +ENSE00003697875 +ENSE00003699796 +ENSE00003701636 +ENSE00003701891 +ENSE00003696062 +ENSE00003700534 +ENSE00003698226 +ENSE00003697832 +ENSE00003700833 +ENSE00003698886 +ENSE00002081080 +ENSE00002068021 +ENSE00001759023 +ENSE00001875784 +ENSE00001477317 +ENSE00001477303 diff --git a/pygtftk/data/mini_real_10M/mini_real_10M.gtf.gz b/pygtftk/data/mini_real_10M/mini_real_10M.gtf.gz new file mode 100644 index 00000000..b1c4b930 Binary files /dev/null and b/pygtftk/data/mini_real_10M/mini_real_10M.gtf.gz differ diff --git a/pygtftk/data/mini_real_10M/observed_sequence_minus_exon_no_rv.fa b/pygtftk/data/mini_real_10M/observed_sequence_minus_exon_no_rv.fa new file mode 100644 index 00000000..2d2bf89b --- /dev/null +++ b/pygtftk/data/mini_real_10M/observed_sequence_minus_exon_no_rv.fa @@ -0,0 +1,1063 @@ +>ENSE00001611509 Reversed: +AAAGGCTGAGTCCTCTGAGAATTTATTACTACGGATCACAGCAGCAACGGGCGGGAAGGG +CGGCGCCAGACTCATTTGCCCCGCAGGTAGATCTTGGGGGTCTGCCAGCCTTCGGGGGCT +TCCTTTAGCCCCGCCTTCAGCCAGATGCGCCTCAGGTCTTTCTCGAACTTGAT +>ENSE00001790281 Reversed: +AGGCTGAGTCCTCTGAGAATTTATTACTACGGATCACAGCAGCAACGGGCGGGAAGGGCG +GCGCCAGACTCATTTGCCCCGCAGGTAGATCTTGGGGGTCTGCCAGCCTTCGGGGGCTTC +CTTTAGCCCCGCCTTCAGCCAGATGCGCCTCAGGTCTTTCTCGAACTTGAT +>ENSE00001842703 Reversed: +GAGTCCTCTGAGAATTTATTACTACGGATCACAGCAGCAACGGGCGGGAAGGGCGGCGCC +AGACTCATTTGCCCCGCAGGTAGATCTTGGGGGTCTGCCAGCCTTCGGGGGCTTCCTTTA +GCCCCGCCTTCAGCCAGATGCGCCTCAGGTCTTTCTCGAACTTGAT +>ENSE00001629775 Reversed: +CTGCTTGCGTCTCAGGCGTCCCTCCTGGACCTTCCTCCGCAGGAACCGCGTCTTCTTCAC +CAGCTTCCGGTACTTGTGGTGGTTCATCTTCCGCCGGCGGATCTTCAGCACGTTTTTGCA +CTGAATTTGAGGCGCATCCGCGACGCCTTCATCCCCCTGCTCGGCCCCTTCCCCTATCTG +GCTGGGCGGACACTGGTAGGATTGCGGTGGAGCCACAGTCCCTGCGGTCCCGGTATCCAG +TCTGGGCAGGAAGCAGCGGGCCGTGAGCCAGCTCTCCAGGGGGCTGACGGACATCTTCCT +GGGGACCAGCATCTCCTCCAGCTCCAGCTGGGCCCCCTTGCGAGGGAGAGAGGCCGCCCT +ACCTGGGCCGGCCGGCGATGTGCTGTAAAGGGGCCCGCAGACCCGGCTGCCCAGCACTCC +AGAGACGGGCCAAGGCGGGCGGCCGC +>ENSE00001922199 Reversed: +GGCAGGAAGCAGCGGGCCGTGAGCCAGCTCTCCAGGGGGCTGACGGACATCTTCCTGGGG +ACCAGCATCTCCTCCAGCTCCAGCTGGGCCCCCTTGCGAGGGAGAGAGGCCGCCCTACCT +GGGCCGGCCGGCGATGTGCTGTAAAGGGGCCCGCAGACCCGGCTGCCCAGCACTCCAGAG +ACGGGCCAAGGCGGGCGGCCGCCTGCAGAAAACCAGACGCCACGGTCACCGCTCGCGAGA +CCACACAGGCCCGTCGGGTTGAGGAGCAGCAGGTTCGTCCCAGCGAGGATCCCCCGCACC +TCATTCCTGGCCTGAACCCCTGAGGTTCCCTCTGTGAGCATCGGAAGCTTAGAGGGGAAA +GAGTGTGTGTGTGGCCACCGGCCCTGCCCCAGCGGAGCTGCTGAGACCCGCACTCCTAAC +CAGGTGTGCATCCTCCCATCCGCCCCCGCGCGGCTTCCTACCTGCCCAAGGAACGGCCCT +CAACAGCTGGGAAGTCAGGCGCCCCAGGAGCATGGTCTGTGGGCGGCGGCCACAGGTCCC +AGGGGAG +>ENSE00001821535 Reversed: +GCGGCCGCCTGCAGAAAACCAGACGCCACGGTCACCGCTCGCGAGACCACACAGGCCCGT +CGGGTTGAGGAGCAGCAGGTTCGTCCCAGCGAGGATCCCCCGCACCTCATTCCTGGCCTG +AACCCCTGAGGTTCCCTCTGTGAGCATCGGAAG +>ENSE00001789693 Reversed: +CTGCCCAAGGAACGGCCCTCAACAGCTGGGAAGTCAGGCGCCCCAGGAGCATGGTCTGTG +GGCGGCGGCCACAGGTCCCAGGGGAG +>ENSE00001896016 Reversed: +CTGCCCAAGGAACGGCCCTCAACAGCTGGGAAGTCAGGCGCCCCAGGAGCATGGTCTGTG +GGCGGCGGCCACAGGTCCCAGGGGAGCTGGAACACAAGTGCCCGTTCAGGTCAGGCGGCA +GCGCCTTCAGTAGTCGCGGGCGGGCCGGGACTGGGGCGTCTGGTCCCGCCGCGACCCTCG +CTTCCCTTCTCCCTCCGCCACCCCAACCCACAAGGAGGACTTTGCTTCCAACACAGCTCG +CGCCCCGAGGCTCCCAAGCCCCCGACGCGGGCGGTGTCGCGCTCGGACGCACCGAAAGGT +CCCAGAACGGGGAGGCCGGCCCCCTCCCCGGGTTCACCCCCGCGCGAATCGCGTTGCCTG +GCGCCCGGACCCTCTCGGCTGGACCCCGGGCCCGCCTGCCGCAGCGCCCGGCGCCCTCAG +GCCTCCCGCTGACCCTTCCCAAGCCCGACCTCGAC +>ENSE00001223521 Reversed: +CTGCCCAAGGAACGGCCCTCAACAGCTGGGAAGTCAGGCGCCCCAGGAGCATGGTCTGTG +GGCGGCGGCCACAGGTCCCAGGGGAGCTGGAACACAAGTGCCCGTTCAGGTCAGGCGGCA +GCGCCTTCAGTAGTCGCGGGCGGGCCGGGACTGGGGCGTCTGGTCCCGCCGCGACCCTCG +CTTCCCTTCTCCCTCCGCCACCCCAACCCACAAGGAGGACTTTGCTTCCAACACAGCTCG +CGCCCCGAGGCTCCCAAGCCCCCGACGCGGGCGGTGTCGCGCTCGGACGCACCGAAAGGT +CCCAGAACGGGGAGGCCGGCCCCCTCCCCGGGTTCACCCCCGCGCGAATCGCGTTGCCTG +GCGCCCGGACCCTCTCGGCTGGACCCCGGGCCCGCCTGCCGCAGCGCCCGGCGCCCTCAG +GCCTCCCGCTGACCCTTCCCAAGCCCGACCTCG +>ENSE00001921648 Reversed: +CGAAAGGTCCCAGAACGGGGAGGCCGGCCCCCTCCCCGGGTTCACCCCCGCGCGAATCGC +GTTGCCTGGCGCCCGGACCCTCTCGGCTGGACCCCGGGCCCGCCTGCCGCAGCGCCCGGC +GCCCTCAGGCCTCCCGCTGACCCTTCCC +>ENSE00001479025 Reversed: +CGAAAGGTCCCAGAACGGGGAGGCCGGCCCCCTCCCCGGGTTCACCCCCGCGCGAATCGC +GTTGCCTGGCGCCCGGACCCTCTCGGCTGGACCCCGGGCCCGCCTGCCGCAGCGCCCGGC +GCCCTCAGGCCTCCCGCTGACCCTTCCCAAGCCCGACCTCGACGCGGCTCAAATTGA +>ENSE00001479027 Reversed: +CCTCTCGGCTGGACCCCGGGCCCGCCTGCCGCAGCGCCCGGCGCCCTCAGGCCTCCCGCT +GACCCTTCCCAAGCCCGACCTCGACGCGGCTCAAA +>ENSE00001697866 Reversed: +CTCGACGCGGCTCAAATTGACCGTTCTGCGGCCGCCCTCGGGCACTTCCGGTCCGTCCCC +AAGTCGGCCCCGATCGGCAGCGGCCACCCGGCGGTTCCTACGCACAGCGCCCGCTGGCGT +CCTCGCGGCCCCCGATTCTGCATTGGCTCAGGCCCCGCCGGGCCCGAAAGGCGACGGTTT +CCGGTTAGTGGAATCACGGTCCCAGTCCTCGCGCGGTTCCTCAGCTCCGCCTGGTCCCTT +ACGGAGGCAAAAAACTACATTTCCCACAATCCCAGGGGGTGCGGGCCCTGGATATACCCG +CAGGTCCAGAATCGTTTCCGGACCACCCAGGGGCCGGATTCC +>ENSE00001478064 Reversed: +ACCACTTAAATACAAACTTTATTCTCTCTCCAAGAAGATGCAGACGTCACAGGTGGCCCT +GAGCTCCCACCCGAGGCTTAGGCCCAAGGGGCCTCTTCCAGGCTGAGGGCCTGCTGGGGC +TGGGCCAGGGGCTGAGGCTGAAAGCAGCAGCCTGCCTAGTGGGTGACGCCAGGGGCCGGT +GTAACATGGCACCGAGGTTGGGGCCACAGCAATGTGTGGGACGGTGGGGTGGGCTGGGGC +CCTTGGCTCCAAGCATTAGTTCTCCAAGCTCTGGTCCGTTCTCCTACCTCCTTCAAGGGG +CACCAGGGCTACAAGGTGGTAGTTGAGTATTGGGGCCCGACTCCTGGGGCACTGGAGTGG +TCTCTAGGCCCGAGGCCCCAAGGAGAGGGCTGGGTTTCTGGGAGAGTGCTGGTCCTTCCT +CTCTGGGCTTGGCCATCTTGACAGCTTCATCGTAGGAGGGTGGAGGCTCCGGGGTGTACA +GGCTGTAGGCAGGAGGAGCCATGGAGTCCAGGTCCAGCTCCCCAAAGGGCAGGGGCAACC +GCATGCCCAGTGGGTACTGCACGGAGCTGTAGG +>ENSE00001754010 Reversed: +CCACTTAAATACAAACTTTATTCTCTCTCCAAGAAGATGCAGACGTCACAGGTGGCCCTG +AGCTCCCACCCGAGGCTTAGGCCCAAGGGGCCTCTTCCAGGCTGAGGGCCTGCTGGGGCT +GGGCCAGGGGCTGAGGCTGAAAGCAGCAGCCTGCCTAGTGGGTGACGCCAGGGGCCGGTG +TAACATGGCACCGAGGTTGGGGCCACAGCAATGTGTGGGACGGTGGGGTGGGCTGGGGCC +CTTGGCTCCAAGCATTAGTTCTCCAAGCTCTGGTCCGTTCTCCTACCTCCTTCAAGGGGC +ACCAGGGCTACAAGGTGGTAGTTGAGTATTGGGGCCCGACTCCTGGGGCACTGGAGTGGT +CTCTAGGCCCGAGGCCCCAAGGAGAGGGCTGGGTTTCTGGGAGAGTGCTGGTCCTTCCTC +TCTGGGCTTGGCCATCTTGACAGCTTCATCGTAGGAGGGTGGAGGCTCCGGGGTGTACAG +GCTGTAGGCAGGAGGAGCCATGGAGTCCAGGTCCAGCTCCCCAAAGGGCAGGGGCAACCG +CATGCCCAGTGGGTACTGCACGGAGCTGTAGG +>ENSE00001478051 Reversed: +TTAGTTCTCCAAGCTCTGGTCCGTTCTCCTACCTCCTTCAAGGGGCACCAGGGCTACAAG +GTGGTAGTTGAGTATTGGGGCCCGACTCCTGGGGCACTGGAGTGGTCTCTAGGCCCGAGG +CCCCAAGGAGAGGGCTGGGTTTCTGGGAGAGTGCTGGTCCTTCCTCTCTGGGCTTGGCCA +TCTTGACAGCTTCATCGTAGGAGGGTGGAGGCTCCGGGGTGTACAGG +>ENSE00001810932 Reversed: +GGCACTGGAGTGGTCTCTAGGCCCGAGGCCCCAAGGAGAGGGCTGGGTTTCTGGGAGAGT +GCTGGTCCTTCCTCTCTGGGCTTGGCCATCTTGACAGCTTCATCGTAGGAGGGTGGAGGC +TCCGGGGTGTACAGGCTGTAGGCAGGAGGAGCCATGGAGTCCAGGTCCAGCTCCCCAAAG +GGCAGGGGCAACCGCATGCCCAGTGGGTACTGCACGGAGCTGTAGG +>ENSE00003350147 Reversed: +AGGTCCAGCTCCCCAAAGGGCAGGGGCAACCGCATGCCCAGTGGGTACTGCACGGAGCTG +TAGG +>ENSE00003428438 Reversed: +AGGTCACAGTGCTGTGTACAGGGCTGTCACTGTCCATAGGGATGACTGCCACGTCGCAGG +GCTGCCGTGCTGGTGGCAGATGTGGCTGGGCCTGTGCCTGCTTCCGGAGGCAGCAGAACC +GGACACAACCAGCTGTGACACCACACAGCAGAAGCAGGAGGACCGCCAGCAGGATGAGCC +TAGGAGAGCAAGGCTCTACCACTGGACTGACCCTCGGCCACCGGGCACCTGCACCCTGGG +GAATGTCGTGGCACAACCACCGAAGACAGGTTAACAGGATAAAAAGCAGACAATGTCTCT +CCATGTCGGAGACCGCCGTGGCCAGAGCCTGGCCTCGGGCTGCTGGGCCTGCCCTGGCTA +TCTCTCCTGGGCTGGCCAGGGGTGGCCTTGGGCTCACTCCCAGGACTCGCTGTCCTCAGC +GAGTGCCCCACTGCTGAGCGGGATCGTAGGGGACTCCCGCGGAGGCCAGGCGGGAGAGGT +GGGAGGGAAGGTCCTGCTTGCTCCAGGTCAGTTCCCGCCAGCGGCCGGGACTGGGCGACA +GCGGAGGCGGCCTGGTGAGGTAAGGGCCTGGCGGGCCTGGCCCCGGTGACCCCCGCCCCA +GAACCGTCGGACGCACGGCTCCGCCGCGGCCTCCACTTACCCCACGTGCCACAGGCTGCT +CCAGCGGGCCTGGGGCGGGCAC +>ENSE00003652520 Reversed: +AGGTCACAGTGCTGTGTACAGGGCTGTCACTGTCCATAGGGATGACTGCCACGTCGCAGG +GCTGCCGTGCTGGTGGCAGATGTGGCTGGGCCTGTGCCTGCTTCCGGAGGCAGCAGAACC +GGACACAACCAGCTGTGACACCACACAGCAGAAGCAGGAGGACCGCCAGCAGGATGAGC +>ENSE00003675447 Reversed: +AGGTCACAGTGCTGTGTACAGGGCTGTCACTGTCCATAGGGATGACTGCCACGTCGCAGG +GCTGCCGTGCTGGTGGCAGATGTGGCTGGGCCTGTGCCTGCTTCCGGAGGCAGCAGAACC +GGACACAACCAGCTGTGACACCACACAGCAGAAGCAGGAGGACCGCCAGCAGGATGAGC +>ENSE00001858191 Reversed: +AGGTCACAGTGCTGTGTACAGGGCTGTCACTGTCCATAGGGATGACTGCCACGTCGCAGG +GCTGCCGTGCTGGTGGCAGATGTGGCTGGGCCTGTGCCTGCTTCCGGAGGCAGCAGAACC +GGACACAACCAGCTGTGACACCACACAGCAGAAGCAGGAGGACCGCCAGCAGGATGAGCC +TAGGAGAGCAAGGCTCTACCACTGGACTGACCCTCGGCCACCGGGCACCTGCACCCTGGG +GAATGTCGTGGCACAACCACCGAAGACAGGTTAACAGGATAAAAAGCAGACAATGTCTCT +CCATGTCGGAGACCGCCGTGGCCAGAGCCTGGCCTCGGGCTGCTGGGCCTGCCCTGGCTA +TCTCTCCTGGGCTGGCCAGGGGTGGCCTTGGGCTCACTCCCAGGACTCGCTGTCCTCAGC +GAGTGCCCCACTGCTGAGCGGGATCGTAGGGGACTCCCGCGGAGGCCAGGCGGGAGAGGT +GGGAGGGAAGGTCCTGCTTGCTCCAGGTCAGTTCCCGCCAGCGGCCGGGACTGGGCGACA +GCGGA +>ENSE00001682091 Reversed: +TGTGACACCACACAGCAGAAGCAGGAGGACCGCCAGCAGGATGAGC +>ENSE00003599669 Reversed: +CCCACGTGCCACAGGCTGCTCCAGCGGGCCTGGGGCGGGCAC +>ENSE00003634508 Reversed: +CCCACGTGCCACAGGCTGCTCCAGCGGGCCTGGGGCGGGCAC +>ENSE00001937932 Reversed: +CCCACGTGCCACAGGCTGCTCCAGCGGGCCTGGGGCGGGCACCTGTGGGGACGGCGGCAC +CTGGAGCAGGCGGGGCATGGGACGGCCGACCTCGCCACCCGTGCCTCCCCATAGGGCGGG +GCCAGGCCCCGGCTCCCTCCCCCCCGACTTACTGGTCCGAGGGGTCGCAGCTGCCGTCCG +CGAAGCCCAGCGCCAC +>ENSE00001767147 Reversed: +TGGTCCGAGGGGTCGCAGCTGCCGTCCGCGAAGCCCAGCGCCACCTGTGGGGACAAGGGT +GAGCCCGGGAGGGGCGTGGTCCGAGCAGGGACCCGCCCCGCGGTGGCCGAACCGAGAGAG +AACGCCGCCCGACCCACCTGCGGCAGCGGCAGGAGCGGCAGGAGCGGCAGGAGCGGCAGC +AGCAGCCGCAGTCCGCGGGCGGCCAGCGGCCCCCGGGCCATGCTC +>ENSE00001736550 Reversed: +TGGTCCGAGGGGTCGCAGCTGCCGTCCGCGAAGCCCAGCGCCACCTGTGGGGACAAGGGT +GAGCCCGGGAGGGGCGTGGTCCGAGCAGGGACCCGCCCCGCGGTGGCCGAACCGAGAGAG +AACGCCGCCCGACCCACCTGCGGCAGCGGCAGGAGCGGCAGGAGCGGCAGGAGCGGCAGC +AGCAGCCGCAGTCCGCGGGCGGCCAGCGGCCCCC +>ENSE00003473336 Reversed: +TGGTCCGAGGGGTCGCAGCTGCCGTCCGCGAAGCCCAGCGCCAC +>ENSE00003561172 Reversed: +TGGTCCGAGGGGTCGCAGCTGCCGTCCGCGAAGCCCAGCGCCAC +>ENSE00003343061 Reversed: +CTGCGGCAGCGGCAGGAGCGGCAGGAGCGGCAGGAGCGGCAGCAGCAGCCGCAGTCCGCG +GGCGGCCAGCGGCCCCCGGGCCATGCTC +>ENSE00003293243 Reversed: +CTGCGGCAGCGGCAGGAGCGGCAGGAGCGGCAGGAGCGGCAGCAGCAGCCGCAGTCCGCG +GGCGGCCAGCGGCCCCCGGGCCATGCTCT +>ENSE00001239803 Reversed: +CTGCGGCAGCGGCAGGAGCGGCAGGAGCGGCAGGAGCGGCAGCAGCAGCCGCAGTCCGCG +GGCGGCCAGCGGCCCCCGGGCCATGCTCTGAG +>ENSE00003475992 Reversed: +AGGCAGATTGAAATGCTGACTTTCTCACTGTTTCATTTTGTGATTGAAGTGCGTGCAAAA +CACTCAATCTGGTAGGGATGATGCCCGCGCGGAGCTGACCCTTCTCCTATTGTTTTTCCA +AGCTGGAGAAGAAGCAGGCGCTCCCTCCATTCCAGCCACAGATCACAGACGACTACGGTC +TGGACAACTTTGACACACAGTTCACCAGCGAGCCCGTGCAGCTGACCCCAGACGATGAGT +GAGTCCCACTGGGTGCGGGTCCCTGGAGCACCCCTCGGGCAGCCCCATGGCAGGCCGGCA +CCTTGGGCAGCTGGTGACCCAGCCTGCCCTTGAGTCCCACCCGCCTGGTGTCATCTCTCC +AGTGGGCGTTGGGGGAGGATTCTTATGCGAACGTGACTCCGCTTCCCCCAAGGGAATGAA +CACACGGTCACCCCCCTCCCCCCTGCCACCTTTGCCCACAGGGATGCCATAAAGAGGATC +GACCAGTCAGAGTTCGAAGGCTTTGAGTATATCAACCCATTATTGCTGTCCACCGAGGAG +TCGGTGTGAGGCCGCGTGCGTCTCTGTCGTGGACACGCGTGATTGACCCTTTAACTGTAT +CCTTAACCACCGCATATGCATGCCAGGCTGGGCACGGCTCCGAGGGCGGCCAGGGACAGA +CGCTTGCGCCGAGACCGCAGAGGGAAGCGTCAGCGGGCGCTGCTGGGAGCAGAACAGTCC +CTCACACCTGGGCCCGGGCAGGCCAGCTTCGTGCTGGAGGAACTTGCTGCTGTGCCTGCG +TCGCGGCGGATCCGCGGGGACCCTGCCGAGGGGGCTGTCATGCGGTTTCCAAGGTGCACA +TTTTCCACGGAAACAGAACTCGATGCACTGACCTGCTCCGCCAGGAAAGTGAGCGTGTAG +CGTCCTGAGGAATAAAATGTTCCGATGATGTGGAAGCTCCTCTGATGCCTTTTTTCCGTG +AGTGGCGCCTGCCCCACATCTCAGACGCAACCCACACGTAGGGGGGCAGCTTAGGAGCCA +GCGGGACACAGGTGGGGGCGGGAGTTGAAGTAC +>ENSE00001817609 Reversed: +CAGATTGAAATGCTGACTTTCTCACTGTTTCATTTTGTGATTGAAGTGCGTGCAAAACAC +TCAATCTGGTAGGGATGATGCCCGCGCGGAGCTGACCCTTCTCCTATTGTTTTTCCAAGC +TGGAGAAGAAGCAGGCGCTCCCTCCATTCCAGCCACAGATCACAGACGACTACGGTCTGG +ACAACTTTGACACACAGTTCACCAGCGAGCCCGTGCAGCTGACCCCAGACGATGAGTGAG +TCCCACTGGGTGCGGGTCCCTGGAGCACCCCTCGGGCAGCCCCATGGCAGGCCGGCACCT +TGGGCAGCTGGTGACCCAGCCTGCCCTTGAGTCCCACCCGCCTGGTGTCATCTCTCCAGT +GGGCGTTGGGGGAGGATTCTTATGCGAACGTGACTCCGCTTCCCCCAAGGGAATGAACAC +ACGGTCACCCCCCTCCCCCCTGCCACCTTTGCCCACAGGGATGCCATAAAGAGGATCGAC +CAGTCAGAGTTCGAAGGCTTTGAGTATATCAACCCATTATTGCTGTCCACCGAGGAGTCG +GTGTGAGGCCGCGTGCGTCTCTGTCGTGGACACGCGTGATTGACCCTTTAACTGTATCCT +TAACCACCGCATATGCATGCCAGGCTGGGCACGGCTCCGAGGGCGGCCAGGGACAGACGC +TTGCGCCGAGACCGCAGAGGGAAGCGTCAGCGGGCGCTGCTGGGAGCAGAACAGTCCCTC +ACACCTGGGCCCGGGCAGGCCAGCTTCGTGCTGGAGGAACTTGCTGCTGTGCCTGCGTCG +CGGCGGATCCGCGGGGACCCTGCCGAGGGGGCTGTCATGCGGTTTCCAAGGTGCACATTT +TCCACGGAAACAGAACTCGATGCACTGACCTGCTCCGCCAGGAAAGTGAGCGTGTAGCGT +CCTGAGGAATAAAATGTTCCGATGATGTGGAAGCTCCTCTGATGCCTTTTTTCCGTGAGT +GGCGCCTGCCCCACATCTCAGACGCAACCCACACGTAGGGGGGCAGCTTAGGAGCCAGCG +GGACACAGGTGGGGGCGGGAGTTGAAGTAC +>ENSE00003589214 Reversed: +GACTTTCTCACTGTTTCATTTTGTGATTGAAGTGCGTGCAAAACACTCAATCTGGTAGGG +ATGATGCCCGCGCGGAGCTGACCCTTCTCCTATTGTTTTTCCAAGCTGGAGAAGAAGCAG +GCGCTCCCTCCATTCCAGCCACAGATCACAGACGACTACGGTCTGGACAACTTTGACACA +CAGTTCACCAGCGAGCCCGTGCAGCTGACCCCAGACGATGAGTGAGTCCCACTGGGTGCG +GGTCCCTGGAGCACCCCTCGGGCAGCCCCATGGCAGGCCGGCACCTTGGGCAGCTGGTGA +CCCAGCCTGCCCTTGAGTCCCACCCGCCTGGTGTCATCTCTCCAGTGGGCGTTGGGGGAG +GATTCTTATGCGAACGTGACTCCGCTTCCCCCAAGGGAATGAACACACGGTCACCCCCCT +CCCCCCTGCCACCTTTGCCCACAGGGATGCCATAAAGAGGATCGACCAGTCAGAGTTCGA +AGGCTTTGAGTATATCAACCCATTATTGCTGTCCACCGAGGAGTCGGTGTGAGGCCGCGT +GCGTCTCTGTCGTGGACACGCGTGATTGACCCTTTAACTGTATCCTTAACCACCGCATAT +GCATGCCAGGCTGGGCACGGCTCCGAGGGCGGCCAGGGACAGACGCTTGCGCCGAGACCG +CAGAGGGAAGCGTCAGCGGGCGCTGCTGGGAGCAGAACAGTCCCTCACACCTGGGCCCGG +GCAGGCCAGCTTCGTGCTGGAGGAACTTGCTGCTGTGCCTGCGTCGCGGCGGATCCGCGG +GGACCCTGCCGAGGGGGCTGTCATGCGGTTTCCAAGGTGCACATTTTCCACGGAAACAGA +ACTCGATGCACTGACCTGCTCCGCCAGGAAAGTGAGCGTGTAGCGTCCTGAGGAATAAAA +TGTTCCGATGATGTGGAAGCTCCTCTGATGCCTTTTTTCCGTGAGTGGCGCCTGCCCCAC +ATCTCAGACGCAACCCACACGTAGGGGGGCAGCTTAGGAGCCAGCGGGACACAGGTGGGG +GCGGGAGTTGAAGTAC +>ENSE00001635485 Reversed: +CAGTCCCTCACACCTGGGCCCGGGCAGGCCAGCTTCGTGCTGGAGGAACTTGCTGCTGTG +CCTGCGTCGCGGCGGATCCGCGGGGACCCTGCCGAGGGGGCTGTCATGCGGTTTCCAAGG +TGCACATTTTCCACGGAAACAGAACTCGATGCACTGACCTGCTCCGCCAGGAAAGTGAGC +GTGTAGCGTCCTGAGGAATAAAATGTTCCGATGATGTGGAAGCTCCTCTGATGCCTTTTT +TCCGTGAGTGGCGCCTGCCCCACATCTCAGACGCAACCCACACGTAGGGGGGCAGCTTAG +GAGCCAGCGGGACACAGGTGGGGGCGGGAGTTGAAGTAC +>ENSE00003459358 Reversed: +CCCTCAGGTGAAGGCACAGCTGTCCAGAGCTGAGGCTTCCTAGAGGCAGGGCTGCCAGCT +GCCAGGTGTCAGGTGTGGCAGAGCCGTCTTCTGAGCTCCCTGGGAGAGGGGGTCGCGCCA +CCTCATGCCTCTGAGTGAGGCCTGGTGCACAGGTGTGGAAATTGCCACGCAGCCCTCTTG +GCCAGGCGCAGAGACCCCAGGCCTCCATGACTCAGGGGCCGCTCCACCCCATTGTGCGGC +TGGTGG +>ENSE00003626371 Reversed: +CTAAATACTGCCGTGTTGCCAGTAGCGTGCCGGTTACCAGTTTGGCCGTTCTTGTACACA +ATATGTGAGTAATGCTGTGCTCATCAGAGGGGAGACTTTTATATTCAGTAATTTGTTTTA +TAAATTAAAGTGAAGGATGTATTGAAGTGTGGTTTGAAAAATCCTGATATTTGCTAATGG +CTCCGGTCACGACGGTGTCTTTTGGAAGTGGTTCTCGAAAACTCTGGTGACTTGGGGGCT +GCACAGTGGGCCTGCGTGGGCGTGGTGCGGGGCAACTGCCCATGGAGCCCGTGGCTGGCC +GGCTCTCCTGTGGATGACACTCACCCTTGACTGCCAGGGTCATTCAAAGTCTTGCACATC +CATGAAAGA +>ENSE00003526713 Reversed: +CTAAATACTGCCGTGTTGCCAGTAGCGTGCCGGTTACCAGTTTGGCCGTTCTTGTACACA +ATATGTGAGTAATGCTGTGCTCATCAGAGGGGAGACTTTTATATTCAGTAATTTGTTTTA +TAAATTAAAGTGAAGGATGTATTGAAGTGTGGTTTGAAAAATCCTGATATTTGCTAATGG +CTCCGGTCACGACGGTGTCTTTTGGAAGTGGTTCTCGAAAACTCTGGTGACTTGGGGGCT +GCACAGTGGGCCTGCGTGGGCGTGGTGCGGGGCAACTGCCCATGGAGCCCGTGGCTGGCC +GGCTCTCCTGTGGATGACACTCACCCTTGACTGCCAGGGTCATTCAAAGTCTTGCACATC +CATGAAAGA +>ENSE00001862783 Reversed: +GACGTTTCATCACAACACAGAGACAGACAGGAGCCCGCCCTGCTTTAATGCGCATGCGGG +GGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAG +AGCGTGTCCGGGCGCCGCACTCTGCGCAGGGCTCTTGGATGGCGCTCACCACGTCACGTC +TTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGCCT +GCAAGGGAGGGGCCACACTCACTCGGCCACCTCCGCGGCATGCTGGCCGCAGAGAGCACC +GTCTGGACCTCCGGGCCCTCTCTGCTCCTGCCGCTGGAGAGGATCCGGCTGGTCAGAAAC +AAGGGACGGGGCCACCCCAGGGGCTCATGCACCCGGCAGACCACGGTAACCGCCAGTGGT +GTTTCCACACCGTGCCCGTGAGGAGGCCACGCCAGGCCCCTGCGTCCGAGCTGGGGGTGG +GGAAGCTGTGTCTCAACAAGCCTCTCTATGGGATTCTGGCGCCTGCTCAGCTTGAGAACG +CGCTCATCGTGGAGCCCGGCAGACAGGCGGCCTGACCCGGAGAAAAGGCAGGACGGCGGG +TGGCCTGCCAGGGAGAGCCGCCGCGGCTGCGTCTACAGGAGGCAGAAGAGTAAACATGGC +TGGGCAGTGGATGTGCAGCTCACGTCAGAGAATTGGTGTTTCTGGCGAGGAGGGACCAAG +CCTCACCACGGAGAAGGACGCCGTCACCGGCGTGCAGGCTGCCAACCTGCCACTCTGGGA +GGCCCCACGCGGCCCCTGCACCTCTCAGGAGGGCGCTGGCGCTGGGATGGTGGCCGGCCA +GGCAGGGGTGGCAGGAGAAAACCCATCCGAGTCCTGCAGGTCAGCGCCCTGGGCATCCAG +TGGGGCCGGGAGGGGTGTCTGAGCGCAGCCACCTTCTATCCCCGGCCTCATGTGGCCCCA +TCAGCCCAACTGGAGCGGCTGGAAATGACCATCACCAGGCCTGGCCAAGGTGTGGCCCTG +GAAGCCAGGACAGTTGACTTCCGGCCATGACTCCCGGAGAGTGCCGGAGCTGGCGTGCTC +AGCAGAGCTGCCGGGGACGATGTCCCGGGGCTGAGTGGGCGGCTTCAGCCTAGACTTGGG +CCTAGATCTTGCTGGAGGCCAAGTGGTCAGTGTCCCATCAGAGTGACCATCCCTCACACG +CCACTGCTGGGGGACACACCCCCACTGAGCGGCCAAGTCCACAGGACACGTGTCCCTGTG +TCCACCTGTCAGCCACACCGCCCCTCGCTCCCCTACAGCCTCTGCCCTCAGACCAGTCCA +CGGCGCGCCGTTTTACCCTTGGGCTTTGCTGTGTCCCTTCCTTTGGCTCCTGTGCCCCGT +CTGTGTGGCCACTGCAACCCTCAAGTCCCCCTCTCCAGACCATAGCTGGACCCCCACTCC +CGGGGCTGGCTCCAGCAGCCATCAGCTGCCTTCTCACTCTGGCAGAGCCCACCCAGTGCC +TTCTGAAGCCCCCGAGGGTCACTCAGTCTGAGACTTTCCGGCTTCTGCCCATCCTGGGAA +CCAGCCCCTCCCTCCAGAAGCTTTCTCTAAGGTTGCCAGAAGGTGCTAAGATCTGAACCG +AGGTCATCTTGTCCCGGGGTTTCCAGGCAGCGTCCCTTGTTTGGGGGCCCTCTGAGATGC +CTTCAGACCCCCGCCTGTGGCGGAAGAGCTTTGTCCTGGCCTGATCTGCCCTGTCCGTGA +CGCTTCTGCTCAGTAGCTGAGCACGCCCTGTGGTGTGGACAGGCCAGCCCGGCTGCAGGA +CAGTGGGGGCTCAGTCCAGAAGCCTCTGGTGGCTTCTGCGTGTGGGCAGGGGAGCAGGGC +TGCAGGGTGGGCTGGCACCTGGCAGCGTGAGGGGCCTCAGGGCTGTTAAAATCCCAACGA +CCGGCCGGGCGCGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCCGAGACGGGCG +GATCACCTGAGATCAGTTCAAGACCAGCCTGACCAACATGGTGAAACCCTGTCTCTACTA +AAAATACAAAAATTAGCCAGGTGTGGTGACGCCTGTAATCCCAGCTACTCAGGAGACTGA +GGCAGGAGAATCGCTTGAACCCGGGAGGCAGATGTTGCAGTGAGCCGAGATCATGCCACT +GCACTCCAGCCTGGGCGACAGAGCGAGACACCGTCTCAAAAAAAAAAAAAAATCCCAGTG +ACCAACCCAGGGCCTCGCCACATCAACAGAGACAAAACGCAGCTCTGGCTCTCAACATCC +TCACCCCTCACCAGGTGCCCAGCTTCCCATCCACCCACGTGACCCGCAGGTGTCTGAAAA +TGCACAAAATGTCCAAATAGGACCACAAGAAGATCTTAAAGACACAAAGAACATTCTACA +TAGTTTGTCAAATCCAGCATTTGACGGTCCTCTGGGTGACCCGGAGAACACCAAGGCTGT +GAGAAATGGGAGGCCTCCTGGCAGCTCCACTCCCCAGACCCGCCTCTGCCAGGGCTCCAG +GCTCAGCAGGCGCCTGTGCGGGACAGGGCGACGGTTCAAGACCAAGTCCGGCTGTTAGAC +CAGACCCTCCAATCCAGGCGGCCTCCCTGCTGGGGTCCTGTGCGGTCAGGAGTCCCAGGG +CATCCCAGGGTGGCTGTGCAAACCCTTGTTCCCAAAGATATGGGGCTTGTCCCCCAGCTA +GCCTGCCCATGCGGTGGCCACAGCCTCGGGTGAGTTCCGGTTCCAAAGTACCGGCTCTCC +CTTACGATCAAGTGTTCGAATGTGCTTGAAGCATTCCAGACACACCAAGGCCTGGACCTG +ACTTCATTGACGCCTACTTAGGAAAAATTGAGGCAGTCTGCCAAGCTTTCAGCAACTGCT +TAAAAAGCTCAAAATGGCAAGTTTTTCCTCGTGAACGTCCTTGTCTTCAGAAGTCTTTTT +TTAGACTATCTGGAAAAGCAGGCGATGCAAAGACAAAAGCCCCTCCCCGGGGGGCGGGGG +GCAGCACCCTGACAGCAACAAGGATCTCAGAGCTTCAGCCAAGAGCATGGATTTCTCCCC +AGGGCTCCCAACAGTACCCTCTGTCCGTGATTCAGGGTCTTACTCTGTCACCCAGGCTGG +AGTGCAGTGGTGCAATCATACTTCACTACAGCCTCCAATTCCTGGCTCAAGGGAATCCTC +CCACTTCAGCCTCCAGAGTAGCTAGGACCACAGGCACGCGCCACCACGCCCAGGCATGTA +AAGATGGGATCTTGCCATGTTGCCCAGGCTGGTCTCAAACTCCTGGGCTCCAGCAACCCA +CCTGCCTCAGCCTCTCAAAGGGCTGGGATTACAGGCGTGAGCCACCGTGCCCGGCCTTTT +CTTTTGTTGTTGTTGTTGTTGGCTGCCAACTTTGGACTCCGGTGCCTTCGCATTCCCGAG +CTGTTTTTGCTTCTGGAAGACCAGGGGCATCAGGCATGACTGAAGGACCTGGTCTCCATA +AGCTCTGAAACCTGCCGCCCATTAACTCAACCAAAAGTTACGAACCAGCATCATTCACAC +CACCCCAGCCCCAGGACCTGCTCCGGAGGCCAAGGGCCCAGAGGTCGCCAGACACAAGGC +CAGGCACTGGGCAGTTTGGGTTATCTTGTTAGCAAAACTGGGTTCCATTCCCCTTTACTT +AAAAAATACATAAAAATATACGTTGGGTTTCAAAAATAAGAAAAAGCATCTCCAGACAAA +AAAGACGATCTTCATTTTTAAAACCCATGACGCACTCTCGGGAAGGTGTTCCTGTGCTCT +GGGCCTGGGGACGCTGGTGCCACCAGATTCCAGGATGGCCAGGTGGACCCGGGGCCAGTG +CTCCCAGCCTTCCTTCTGTGCTGTTCTGTGGGCCCCCAGCCTGCCCTGCCCACAGAGCAC +GGCAAGCAGGTGGACCCCAGACCCGTGACAGAGAGCCACCTGGACATGCCAGGCCACAGC +ACTGGGCCACCTTTCCAGTGTGAAACAGGGCTTTAAAAGCCAGCGCTGAGCTCGGCCACC +TCTTGACCTTCTGAACGGCTGTGGTTTCCAAACACGGATGGATAACCGGGCCGGGCGCAG +GGGTGGCCTACTCACCTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCC +GCGGCACCCTCCACAGACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCC +GGGCGCTGGGGCAGGGACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGC +CGGTAGGAACGGCCCGGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTG +GGTCCGACAGTGAAGACTTCAGTGGGCTCCGGGCCGCACCTGGGCTC +>ENSE00003569320 Reversed: +TTTCATCACAACACAGAGACAGACAGGAGCCCGCCCTGCTTTAATGCGCATGCGGGGGAG +CCGAGAGGCGGGGCTGCTGGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGAGCG +TGTCCGGGCGCCGCACTCTGCGCAGGGCTCTTGGATGGCGCTCACCACGTCACGTCTTCT +GTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGC +>ENSE00003681657 Reversed: +TTTCATCACAACACAGAGACAGACAGGAGCCCGCCCTGCTTTAATGCGCATGCGGGGGAG +CCGAGAGGCGGGGCTGCTGGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGAGCG +TGTCCGGGCGCCGCACTCTGCGCAGGGCTCTTGGATGGCGCTCACCACGTCACGTCTTCT +GTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGC +>ENSE00003483048 Reversed: +TTTCATCACAACACAGAGACAGACAGGAGCCCGCCCTGCTTTAATGCGCATGCGGGGGAG +CCGAGAGGCGGGGCTGCTGGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGAGCG +TGTCCGGGCGCCGCACTCTGCGCAGGGCTCTTGGATGGCGCTCACCACGTCACGTCTTCT +GTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGCTGGGTCAGC +>ENSE00001951400 Reversed: +GACAGGAGCCCGCCCTGCTTTAATGCGCATGCGGGGGAGCCGAGAGGCGGGGCTGCTGGC +GGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGAGCGTGTCCGGGCGCCGCACTCTGC +GCAGGGCTCTTGGATGGCGCTCACCACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGG +GCCAGGTGGCTGTCAACATCCAGCTGGGTCAGC +>ENSE00002033745 Reversed: +GCCCTGCTTTAATGCGCATGCGGGGGAGCCGAGAGGCGGGGCTGCTGGCGGGGGAGCCGA +GAGGCGGGGCTGCTGGCGGGGGAGAGCGTGTCCGGGCGCCGCACTCTGCGCAGGGCTCTT +GGATGGCGCTCACCACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCT +GTCAACATCCAGCTGGGTCAGC +>ENSE00003636009 Reversed: +CACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGC +TGGGTCAGC +>ENSE00003529933 Reversed: +CACGTCACGTCTTCTGTGCTTTCGGCCAAGCACTGGGCCAGGTGGCTGTCAACATCCAGC +TGGGTCAGC +>ENSE00001602311 Reversed: +TAGGACCACAAGAAGATCTTAAAGACACAAAGAACATTCTACATAGTTTGTCAAATCCAG +CATTTGACGGTCCTCTGGGTGACCCGGAGAACACCAAGGCTGTGAGAAATGGGAGGCCTC +CTGGCAGCTCCACTCCCCAGACCCGCCTCTGCCAGGGCTCCAGGCTCAGCAGGCGCCTGT +GCGGGACAGGGCGACGGTTCAAGACCAAGTCCGGCTGTTAGACCAGACCCTCCAATCCAG +GCGGCCTCCCTGCTGGGGTCCTGTGCGGTCAGGAGTCCCAGGGCATCCCAGGGTGGCTGT +GCAAACCCTTGTTCCCAAAGATATGGGGCTTGTCCCCCAGCTAGCCTGCCCATGCGGTGG +CCACAGCCTCGGGTGAGTTCCGGTTCCAAAGTACCGGCTCTCCCTTACGATCAAGTGTTC +GAATGTGCTTGAAGCATTCCAGACACACCAAGGCCTGGACCTGACTTCATTGACGCCTAC +TTAGGAAAAATTGAGGCAGTCTGCCAAGCTTTCAGCAACTGCTTAAAAAGCTCAAAATGG +CAAGTTTTTCCTCGTGAACGTCCTTGTCTTCAGAAGTCTTTTTTTAGACTATCTGGAAAA +GCAGGCGATGCAAAGACAAAAGCCCCTCCCCGGGGGGCGGGGGGCAGCACCCTGACAGCA +ACAAGGATCTCAGAGCTTCAGCCAAGAGCATGGATTTCTCCCCAGGGCTCCCAACAGTAC +CCTCTGTCCGTGATTCAGGGTCTTACTCTGTCACCCAGGCTGGAGTGCAGTGGTGCAATC +ATACTTCACTACAGCCTCCAATTCCTGGCTCAAGGGAATCCTCCCACTTCAGCCTCCAGA +GTAGCTAGGACCACAGGCACGCGCCACCACGCCCAGGCATGTAAAGATGGGATCTTGCCA +TGTTGCCCAGGCTGGTCTCAAACTCCTGGGCTCCAGCAACCCACCTGCCTCAGCCTCTCA +AAGGGCTGGGATTACAGGCGTGAGCCACCGTGCCCGGCCTTTTCTTTTGTTGTTGTTGTT +GTTGGCTGCCAACTTTGGACTCCGGTGCCTTCGCATTCCCGAGCTGTTTTTGCTT +>ENSE00001720216 Reversed: +TCTGTCACCCAGGCTGGAGTGCAGTGGTGCAATCATACTTCACTACAGCCTCCAATTCCT +GGCTCAAGGGAATCCTCCCACTTCAGCCTCCAGAGTAGCTAGGACCACAGGCACGCGCCA +CCACGCCCAGGCATGTAAAGATGGGATCTTGCCATGTTGCCCAGGCTGGTCTCAAACTCC +TGGGCTCCAGCAACCCACCTGCCTCAGCCTCTCAAAGGGCTGGGATTACAGGCGTGAGCC +ACCGTGCCCGGCCTTTTCTTTTGTTGTTGTTGTTGTTGGCTGCCAACTTTGGACTCCGGT +GCCTTCGCATTCCCGAGCTGTTTTTGCTT +>ENSE00003630334 Reversed: +CTGCCTCAGCCTCTCAAAGGGCTGGGATTACAGGCGTGAGCCACCGTGCCCGGCCTTTTC +TTTTGTTGTTGTTGTTGTTGGCTGCCAACTTTGGACTCCGGTGCCTTCGCATTCCCGAGC +TGTTTTTGCTT +>ENSE00003481862 Reversed: +CTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACA +GACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGG +GACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCC +GGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAG +ACTTCAGTGGGCTCCGGGCCGCACCTGGGCTC +>ENSE00003510741 Reversed: +CTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACA +GACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGG +GACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCC +GGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAG +ACTTCAGTGGGCTCCGGGCCGCACCTGGGCTC +>ENSE00003548540 Reversed: +CTGGGGGCGAACTCCTTCTGGCACATGGGGCAGCTGCGCAGGGCCGCGGCACCCTCCACA +GACGGCTGCTGCTCCACCCTGGGGGCCCTGCAGGGATCAGGTGCCGGGCGCTGGGGCAGG +GACCTGGCGGGGGATTCCAGGTGCCCTCCTGCCCCGTGAAGCAGCCGGTAGGAACGGCCC +GGGCCCCACAGGTCCGGCGGAAAGGGTGTCCAGGAAAAGGTCTTGGGTCCGACAGTGAAG +ACTTCAGTGGGCTCCGGGCCGCACCTGGGCTC +>ENSE00003634783 Reversed: +CTGTCCTGGGAAGGCGGGCAGTGAAGGCACCTCGTGATCCAGGATCAGCTCCGGGCTCAC +CGTGCGCAGTAGCTCGGCCCAGAGCCGCTCCCGCTCATCACCCCCCAGGAGAAACCAGGG +GCGGCCGCCAGAAGGC +>ENSE00003467961 Reversed: +CTGTCCTGGGAAGGCGGGCAGTGAAGGCACCTCGTGATCCAGGATCAGCTCCGGGCTCAC +CGTGCGCAGTAGCTCGGCCCAGAGCCGCTCCCGCTCATCACCCCCCAGGAGAAACCAGGG +GCGGCCGCCAGAAGGC +>ENSE00001841545 Reversed: +CTGTCCTGGGAAGGCGGGCAGTGAAGGCACCTCGTGATCCAGGATCAGCTCCGGGCTCAC +CGTGCGCAGTAGCTCGGCCCAGAGCCGCTCCCGCTCATCACCCCCCAGGAG +>ENSE00001816369 Reversed: +CTGTCCTGGGAAGGCGGGCAGTGAAGGCACCTCGTGATCCAGGATCAGCTCCGGGCTCAC +CGTGCGCAGTAGCTCGGCCCAGAGCCGCTCCCGCTCATCACCCCCCAGGAGAAACCAGGG +GCGGCCGCCAGAAGGCCTGGGGCAGACAGAGAGGGCAGACAGGGGGTACTCAGTAGCGGA +AACGCTATGGTGGGGAGACCCGGGAGGGCCTGGGGC +>ENSE00003618179 Reversed: +CCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCGCC +>ENSE00001545345 Reversed: +CCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCGCCGCCTCC +A +>ENSE00001822711 Reversed: +CCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCGCCGCCTCC +ATCCAAGCCCGCGCCGGGCGGAAGTGA +>ENSE00002226200 Reversed: +CCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCGCCGCCTCC +ATCCAAGCCCGCGCCGGGCGGAAGTGAG +>ENSE00001477870 Reversed: +CCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCGCCGCCTCC +ATC +>ENSE00001816144 Reversed: +CCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCGCCGCCTCC +ATCC +>ENSE00001720995 Reversed: +CCGCCCGCCGGGCGCGGCCTCCGGCGGCTCAACCCCAGCCGCGGCCTCCGCG +>ENSE00002040955 Reversed: +CTTGTCCTGCCTGTCCTCAAGTTATCAGCATGACACAGCGGTGCTGGTGATGGTGATGGT +GGAGGTTTCAAAGTTGAACCTGATGAAAACGCTCCACTTCTTCGGAGCCATCTGCTGCTG +TGGTGACGGAGTTTTGCTTTATTGGAAAATAATTTCTGGTTGGGACTGACACGTGCACAG +TGGAAATGAGTTTTTTCTAAGCCAAAATTCATGTTTACAAAAGAACGTTTCAGCTGTGGG +AGTTTGCATCCCAGGCAGAGCAGAAGGTGATCGAGTGGGTGGGGGCATCAGAGCCACCCA +TCTCCTACTCCCGCACCTGCAGACCGGTGGGCTAGGAGGCCCCTTACCCTCTGTGGCAAA +AAAGGACACATTTATGGATGATGAATCAGGCCCCAGCCCACTGAGCTGGTTTCAGAAGCC +AGGCTGGCCGTAGGTCAGGGAGCCAGGCCTCTCCAACTCCTTCCACCGCGGAAGAACAAG +TGTCCCAGCCACTGGCATCCTCAGAGTCACCCAAATGTTCATCTCTGCCCAGCGCTGACA +CCCTGCAAATCAGGCTAAGACAGCGGTGACGGGCCCTGAGGCTGGCAGGCCTAAGCAGCC +CGGTGGCCGTGCACCCTCCCAATTTCCAAATGAGACCTGTGGCCGACAGGCACCCTGGGC +ACATGCTGAAGGCACTGGGCTGCCTCCACCCCTTCCCATGTGGCTAAATGGCCCAGCACC +CACACACGGTGCCCTGGCAGTGCTCACCTGCTGGCAAGGACAGCCAAAAGGCCCGGGCAG +CCTTCTGACGCAGCCAGGAACTGGGCTGTGCTCCACCACACCTGCTGGCCCGTGGATGCC +AGGCAGGCACGCCCACCCATAGCCAGATGTGGTGGCATTTATGGGATACGGGAGTGCCAG +GCAGACAGGCTGTGAGAGACAGTTGCCTGGGAAACATCGCCAGATCTTTGGGGCAGCAGA +GCAGGTGCTCGGGCCCACACATGGGGTGCAAGAGTAGGGGTGTGCCTTGGTGCCCTTGGG +CACCGACAGCCTCCTCACAGCCTCAGTGGCGGGGTCATGGCACAGGCCTGCCCCTGACCC +CAAGAACCAGAAAGCCAGGAGCAGCTGGGGAGGGCCCTGGCCCGGGAGAGACAGCGGTCC +TGTTTCTGAACCCCATCCCAGCCATGGCCTGTGTCTGGGCCAGCATCCCCGACCAGACAG +GGCCAGCCGCCCTCTCTCAAAGTCCCCAGCACCCCTTCAAGCAGTATCCGGTTCACACCC +TCCCACAGCCTGTCCTCCATCCCCACGTGTCGGGCTCAGCTTCCGCACCACTCAGCCCCC +ACCCAGGGGCGGGCTTTTATCAGCCCCAGATCCTGCTCTGACGTCCCCCCGCCCGGAGAA +GCTTCCCCAGCCCAGCCCAGCCCAGCCCAGCCCAGGCTTCTCTCTCCACCCCACTGCCCT +GCTGGGAAATTGTGAGCTCAGATGCTGATTGGTCTACCCAGGAGGGCGGTCCTGTGTGCT +CTGTTCCCTGGGAAGCCTCTCAGAGTGCGCGGCACCAAGGAGCCGGTCAGGGAGTGGAGA +CCTCTCAGGGCACCCCTCCTCTGGGGAAGGCAAGTCACAGAAACCAAGCTGGAGGAGCAC +TGTGGGTTGAGCAGCGTCTCCGAAGACTCATGTCCACCAGTACCTGAGAAAGTGGCCTCG +CTCGGAAGCAAGGTCTGTGCCGATATAATCAAACCAGGATGAGGCGATACTGGGTTAGGG +TTGGCCCTGAATGCAGTGTGAGCAGTGTTCTTGTAAGAAAAGGAAAATTGTCCGGGTGCA +GTGTCTCACGCCTGCAATCCCAGCACTTTGGGAGGCCGAGGCGGGCAGATCACTTGAGGT +CAGGAGTTCTAGACCAGCCTGGCCAACATAGTGAAACCCCG +>ENSE00003615416 Reversed: +CTTGTCCTGCCTGTCCTCAAGTTATCAGCATGACACAGCGGTGCTGGTGATGGTGATGGT +GGAGGTTTCAAAGTTGAACCTGATGAAAACGCTCCACTTCTTCGGAGCCATCTGCTGCTG +TGGTGACGGAGTTTTG +>ENSE00002044438 Reversed: +TGGTGGAGGTTTCAAAGTTGAACCTGATGAAAACGCTCCACTTCTTCGGAGCCATCTGCT +GCTGTGGTGACGGAGTTTTG +>ENSE00001853635 Reversed: +CTGCTGGCAAGGACAGCCAAAAGGCCCGGGCAGCCTTCTGACGCAGCCAGGAACTGGGCT +GTGCTCCACCACACCTGCTGGCCCGTGGATGCCAGGCAGGCACGCCCACCCATAGCCAGA +TGTGGTGGCATTTATGGGATACGGGAGTGCCAGGCAGACAGGCTGTGAGAGACAGTTGCC +TGGGAAACATCGCCAGATCTTTGGGGCAGCAGAGCAGGTGCTCGGGCCCACACATGGGGT +GCAAGAGTAGGGGTGTGCCTTGGTGCCCTTGGGCACCGACAGCCTCCTCACAGCCTCAGT +GGCGGGGTCATGGCACAGGCCTGCCCCTGACCCCAAGAACCAGAAAGCCAGGAGCAGCTG +GGGAGGGCCCTGGCCCGGGAGAGACAGCGGTCCTGTTTCTGAACCCCATCCCAGCCATGG +CCTGTGTCTGGGCCAGCATCCCCGACCAGACAGGGCCAGCCGCCCTCTCTCAAAGTCCCC +AGCACCCCTTCAAGCAGTATCCGGTTCACACCCTCCCACAGCCTGTCCTCCATCCCCACG +TGTCGGGCTCAGCTTCCGCACCACTCAGCCCCCACCCAGGGGCGGGCTTTTATCAGCCCC +AGATCCTGCTCTGACGTCCCCCCGCCCGGAGAAGCTTCCCCAGCCCAGCCCAGCCCAGCC +CAGCCCAGGCTTCTCTCTCCACCCCACTGCCCTGCTGGGAAATTGTGAGCTCAGATGCTG +ATTGGTCTACCCAGGAGGGCGGTCCTGTGTGCTCTGTTCCCTGGGAAGCCTCTCAGAGTG +CGCGGCACCAAGGAGCCGGTCAGGGAGTGGAGACCTCTCAGGGCACCCCTCCTCTGGGGA +AGGCAAGTCACAGAAACCAAGCTGGAGGAGCACTGTGGGTTGAGCAGCGTCTCCGAAGAC +TCATGTCCACCAGTACCTGAGAAAGTGGCCTCGCTCGGAAGCAAGGTCTGTGCCGATATA +ATCAAACCAGGATGAGGCGATACTGGGTTAGGGTTGGCCCTGAATGCAGTGTGAGCAGTG +TTCTTGTAAGAAAAGGAAAATTGTCCGGGTGCAGTGTCTCACGCCTGCAATCCCAGCACT +TTGGGAGGCCGAGGCGGGCAGATCACTTGAGGTCAGGAGTTCTAGACCAGCCTGGCCAAC +ATAGTGAAACCCCGTCTCTACTAAAAAACACAAAAATTAGCTGGGTGTGGTGGTGGGCGC +CTGTAGTCTCAGCTACTCGGGAGGCTGAGGCAGGAGAATCGCTTGAACCCAGAAGGCAGA +GGTTGCAGTGAGCCAAGATTGTGCCATTTTACTCCAGCCTGGGCAACAGAGCAAGACTCC +GTCTCAAAAAAAAAAGAGAGAGAGAAAGAAAAGGAAAATTGGCCAGGTGCTGTGGCTCAT +GCCTGTAATTTCAGCACTTTGGGAGGCCGAGGCAGGTGGATCATGTGAGGTCAGGAGTTC +GAGACCAGCCTGAAAGACATCGTGAAACCCCATCTCTACTAAAGATACAAAATTAGCTGG +GTGTGGTGGTGGGCACCTGTAATCCCAGCTACTTAGGAGGCTGAGGCAGGAGAATCGCTT +GAACCCAGGAGGCGGAGGTTGCGATAGGCCGAGATCGTGCTGTTGCACTCCAGCCTGGGC +GACAAGAGCAAAACTCTATCTCAAAAAAAAAAAAAAAAAGGTAAGGAAAATTTGGACACA +GAGACACAGGAAGGAGGCTTTGGGGTTGGGGGTGGAGCAGCTGCACGCCAGGGAATGCCG +GGGGCCCGGGGCTGGAAGGGGCAGGCAGCAGCCACCCAGAGCCTTTAGGCGGAGCTCCAC +CCTCCCAACCACTGATTTTGGACACCAGCTGCCTGAACTGTGAGAATATACATGTCACTC +GTTTTAGGCTCCCAGTGTGTGGTCATTTTTTCACAGCAGCCCCAGGAGACACGCAGCAGG +CTCCCGGCTTTCCAAGCCGCCACGCACCAAGTTCAGCTTGAAAACGCTGAGCCCAGCTGG +GTGCGGGGAGCCCTCGGTCTCCTGTCCACCACACCCGGAGCTGAGGAAGAGGCTCCCCCA +TGGGCCAAGAGCTGGAAGGGGGCCCTTGGAGGATCCCCCAAGGTCCTCCAAGTGGGCCAG +GAAACCTCTGCAGGTGGAGAGGGTGGCTGGGACCCCCTCGGGAGTCCCCAGGGAAGGTCT +GGCTTCTCGGCTCTGTAGAATCAGCTTTGTCCCCAGTTCAGCACGTTTTTATGGGAAATC +TGCTGGCTGGGGACAGCCCTTGATGTCCTGAGATGAGATGCTGCCTGGTCCCTGCACCTT +CCAGGACCCAGCTCACCTGTGGCGCACAGGTTTCCACTTGTCATAGGAAACTGTGCTTGG +TGCATCCCCTGTGCAGCCGGCTGTGAACTGTGGGCTCCAACCCTGCTTGGTTTGCTTCAA +CTTTCTGAGTGACGTGCAGACCTTCACAGAGGAGCCGTGGGGTGGCTCCATCCAACGCCT +CCCTCGCTGCCC +>ENSE00001859055 Reversed: +CTGTGGCGCACAGGTTTCCACTTGTCATAGGAAACTGTGCTTGGTGCATCCCCTGTGCAG +CCGGCTGTGAACTGTGGGCTCCAACCCTGCTTGGTTTGCTTCAACTTTCTGAGTGACGTG +CAGACCTTCACAGAGGAGCCGTGGGGTGGCTCCATCCAACGCCTCCCTCGCTGCCC +>ENSE00002034769 Reversed: +CGGTGCAGGCCACCCTGCTGCTCCAGCTCAGTCCAGCACAGGTGTTCTCGCTCTGGGGTT +GGCCTGGCGCTGACCTGTGCACCTGACAGGGAAGGTAGGCAGCTCTGGAGCTGGCTGGTG +CCCCTCACCTGGGGTGGAGCTGGGGCAGGTCCCACATTTCTCAGAAGGACTCCAGGATGC +AGCTGCGTCTGGGGCCTGAGCGGAGGGAAGATATCAGGCTGGGGCCGGCTGCTGGGCCTG +TCCTCTCTGAGTTGCCTCAAATCCCCTGTTCCTTGAGCGGTCCTGGAGCCTGGCCTCAGG +CCTCAGGGCACCACACTACTTGCCTCCAGGGACCAGCCTGTTCACCCCACACCCAGCCCT +GTGACAGAGGTGCTGTCGCGTGGCCCCACTTACAGATGGGTCAACTGAGGCCCGGGGCAT +CTGTCCACTTGTCATGACAGTGAGCGG +>ENSE00001916683 Reversed: +CGGTGCAGGCCACCCTGCTGCTCCAGCTCAGTCCAGCACAGGTGTTCTCGCTCTGGGGTT +GGCCTGGCGCTGACCTGTGCACCTGACAGGGAAGGTAGGCAGCTCTGGAGCTGGCTGGTG +CCCCTCACCTGGGGTGGAGCTGGGGCAGGTCCCACATTTCTCAGAAGGACTCCAGGATGC +AGCTGCGTCTGGGGC +>ENSE00001937728 Reversed: +CTGGGGTGGAGCTGGGGCAGGTCCCACATTTCTCAGAAGGACTCCAGGATGCAGCTGCGT +CTGGGGC +>ENSE00001845014 Reversed: +CTTTTGGAGGGAGTGGCCCAGCTCTCCCGGCCTTTGCCACCCGGCGTCCTGTCCCAGTTT +ATCTGTGTCCAGTCCGATTGATGGGCTCATGGATTGGAAAGCTGTGACAGACGCCCTGGG +>ENSE00001908868 Reversed: +CGTGGGGTGGGTGTGATTCTGAGACTAAGGCTCTGGGGGCCGGGCGTGGTGGCTCACGCC +TGTAATCCCAGCACTTTGGGAGGCCGAGGCGGGCGGATCACGAGGTCAGGAGATCGAGAC +CATCCTGGCTAACACGGTGAAACCCTGTCTCTA +>ENSE00001934415 Reversed: +TGGAAACTCCCTGTCTTGGGGCCGCGCACACCATGCCTGGCAGGAGCTGGAGATGCAGCA +GAGCAGACGCGGCTGCAGGAGCAGCCGTGTTTCCTACAGTGGAGAAGGGGACCCTGGCAG +GAGCACTGCCCAGCCAGGCACGTGGTGCTCAACCCTGTGGGCACTGACCCCACAAAAG +>ENSE00001714381 Reversed: +TGCTGGGATTACAGGCGTGAGCCACTGCGCCAAGAGCAAGCTTCTGATGTAGGGGCTGCG +GGGGGCTTCCCAGGCCAGGCAGGTTGCTGTCTCAGCGCCAGCGTGTAGCCTCCTCCCAGG +ATCCGGAGCAGGAGGGTGGCTGTCTTTTGCGTTCAATCCGCTGGGCTGCTGTGGGGTTCC +CGCAGAGCTGCTCCAAGGGGCCGAGAGAAGGAAGGACGCTGCCCCCAAGGACAGACGGGC +AAGCTGGAGTCAGGAGAGGCGCAGCCGTGGCCCACAGGCCTTGGATCT +>ENSE00001821386 Reversed: +CGAGAGAAGGAAGGACGCTGCCCCCAAGGACAGACGGGCAAGCTGGAGTCAGGAGAGGCG +CAGCCGTGGCCCACAGGCCTTGGATCT +>ENSE00001724829 Reversed: +CTCCAAGGCCTGGGCGGCAGGAAAGG +>ENSE00001927358 Reversed: +CTCCAAGGCCTGGGCGGCAGGAAAGGGAGAGATGACGTCATTGCCGCCTGGAATCTGCTG +TTTGGAGGCGTCGCCATGGAGACCGGAAGGCTCAGGGTGGGTAAAAATAGCAAACCCAAA +AGGGTGTAAGTTCCAAGAACGCGAGTCTCTGAAAAGCGAGGCATCCATGTTC +>ENSE00001755234 Reversed: +TAGTTGTATAAATCAGCAAGTATTTATTTTAAATAATAAAACTACAGTTTTATACCATAC +ATATTTACAAAAATGCTTTGCTATAGAAAAATAGAATCAATCACTGAATCCAGACCACCA +CAGTGGAGAACCTCCTGGTGAAGCTGTGTTTTTTCCCACACTGGAAACACAGAGTAGCCC +TGTTTCTGCACACGTTAGTGCACCGCTGCTACGTGTGGCCGCCCAGCTGTCTGCAGGCTG +TGCCGACCACTGCCTCTGTCTCCAGGAAGCAGAGGCAGAAGTGATCCTTGCTGAGGAGGG +CCATCGAGTCTCCGCTTAAATGCCAGCACAGAGAGAGCACTGCAAAGTCGCCTAGAGAGA +GACAGGTGGCCAGAGGATTACAGCAGGGGAGGCCCAGATTCTGGGGGATGGGCACCCCCT +TGTCCTGCAGGCCAGCACAGTGCCTGGAGTGACCCACATAGGCAGAGCCAGGGTGGAGCC +CCAGAGCTGCCTCAAGTCAGGGAGAGGCTGCTTCTAGCCCATAAAGCTGAGGGCAGCGGG +TCCCCTGTGTGTCCGTCTTGAGGTTTACGCAAAGACTCTGAGGGCAGTTTCCCTGGAGTG +CTGCCGGAGACAGCAGCTGGGCTTCAACAGTTCAGCCCGTGTGATGCCAGACTGCACACA +GCAAGGCTGCCACGTCCGTGGCCTCGGGGATGTGCTTACCTTCCCCAGGCACCTGCACCG +ACATGCAGCCCGCTGGGGACCACAGGTAGAGCCTGCTGCCTCCCGTGCAGATGGCCAGCC +GCGGCTGCTGCGGGTCCCACTGAAATGCGCGCACTGGGGACAGCTGCTCGAGCACCGCGA +ACAGCCTCAGCTTCTGAATGTCCCAGACCCAGACGGCATTGGGAATGTTGT +>ENSE00001697450 Reversed: +TAGTTGTATAAATCAGCAAGTATTTATTTTAAATAATAAAACTACAGTTTTATACCATAC +ATATTTACAAAAATGCTTTGCTATAGAAAAATAGAATCAATCACTGAATCCAGACCACCA +CAGTGGAGAACCTCCTGGTGAAGCTGTGTTTTTTCCCACACTGGAAACACAGAGTAGCCC +TGTTTCTGCACACGTTAGTGCACCGCTGCTACGTGTGGCCGCCCAGCTGTCTGCAGGCTG +TGCCGACCACTGCCTCTGTCTCCAGGAAGCAGAGGCAGAAGTGATCCTTGCTGAGGAGGG +CCATCGAGTCTCCGCTTAAATGCCAGCACAGAGAGAGCACTGCAAAGTCGC +>ENSE00001797222 Reversed: +CTTCCCCAGGCACCTGCACCGACATGCAGCCCGCTGGGGACCACAGGTAGAGCCTGCTGC +CTCCCGTGCAGATGGCCAGCCGCGGCTGCTGCGGGTCCCACTGAAATGCGCGCACTGGGG +ACAGCTGCTCGAGCACCGCGAACAGCCTCAGCTTCTGAATGTCCCAGACCCAGACGGCAT +TGGGAATGTTGT +>ENSE00001862304 Reversed: +TTTTTTTTTTTTTTTTAGCCCTTTACAAATGGAGAAACCCTTAACAAAAGGCGGGCTGCA +GTGTGCCCAGCCCTGCTTTCTACTCAGCAGAGTGGAGCAAGTGAGCAGGGTGGAGGCCTC +CTGACTCATGCGCGGACCTGCGGCTGCTGCAGGACAAAGGCCCAGCGCCTCCAAGGAGCT +TCTGTGAGCACCTCGGCTACTGCAGAAACGTGAAAGGAGGTGACGTGTCGGAAACCCCCA +ACTTCATTTTCTTTTCCAGTCGCTTCTACACCTGGGGCCACAGGACACAGTAAAGGGTGA +GACAGCACCTGCGTCAGCACAACTGACCGTTCCTTGTCGCCAGGAAGTAGCTGTCAGGAC +TAAATGCCAGCATTCCTATGCCGATTTTCGGGTTTGCTCTGTCGGTAACAGGTTTCAGTG +TCTGTAAGGAGACTGGGACAGAGGCGATCTCATCTAGAACACCAACAGGAAGAACACGCC +ATTGTCACCCTTTCGGGAAGTACGCACGCGGCTGAGAGGCTGCTGTGCCTGCATCGGGCA +TCGCGAACCCAGCTCCTCTGTTCAAAGGGGAGGAAAGTGCGGCCCAAGGGCAGGAAGAGC +TAAGCAAAGCCTGGCAGCCGCAGCGAGGGGCCTGCCCGCAAGTGCCCCGGATGAGAGTGG +CACCATCACCTGCCAGGCCCGACTAGGTGGGGGGTGGACCCCACGTGCCAGGGGCTGACT +GGAGAGGGACATGGACAGGTCCTAGCTGCAATCTCAGCAGCTCCAACTCCTCAGCACTTT +TCTGTCGACTACCAGCATCTGAGTTCACAATCCCTTCCACCTCAGCGTCAGTACCCTTAG +ACTTTCCGGCTGTGGAAGAACCATCATCACAGCAGAAGCAGGGGCTGTGGAACAAGGACG +CCCCTGGGCTCCTGGGGAGCGCCTCCTGTGTGCCAGGCTGCACCTGTCCTGACCCCCATC +CTGAGCACACACCGAGCCCCGGGGTGGGCCCGTCGGCACTTGGGGCACCGCTTCCTCTAC +CTGCAACCTTCAGATGCCCTCATGCCCCTGTGGGATGGGTGCTTTTACTATGCCCATTTC +AGCGATGAGGAAACAGACACATAGGAAATGCCCAGAGTCAAGAGGCTGCATCAGAACCGG +GCCTCAAGCCGGAGACAGCGCTCGGGAGCACCGCCGGGTTCCAGACCCACTCTGAGCGCC +ACCCACGGAAAAGTGTTTCTTTGAAAAACATCATTCTCGGAGCTCCGGAAAAACATCCCC +TCGGAGCTCCCGCTGTCAGATCCGGGTCTCCAGGGCTCATATTCAGTAACAGAAGCCGCA +CCTTCACGGCCCACTGCGCAATTCAGACCCTAGTCAACCTCCAGCCAACAGGCTGAGGGG +CACACTGGCTGGAAGCATGGAAGGGAAAAAAAGTTTTTTTTTTTAAACATAAGGAACATC +CGAAGTTTATCTGGACAACGAGGAATCTTGCATTAAAAAAGGAAAACAAATGACATCACA +TGTGCTACTTACATTTACTCTCTGAGCTCGGGAGAGGGCCGGCCCCGGCCCGGGGCGGCG +GGAAGGAGAGGCAGCCCAGTCCCAGCTGTGGGCTCTTCTCGGCCTCCTTATACACCACCT +GAAAGACACAAGGTGGCCACGCCCGGCTCAGGACAGGGACCCGGAAGCCAAGGATGGACG +TGGCAAATGCCCATGACAGCGCATGGTCAACAGGTGTGCCTGCCATGACAGCTGGTCCTG +CTGCCACCGGGAGAGACGGAAGCACGAACCCCGCAGTCCCGAGAGCTGAGATCACCCAGC +CACCCTCTCTCGTGTCCTGCTGAGGAGCCCACCCTTTGAGACACAGGCAGCAAATGTGTG +CCCTGTGATTACAGACGGGAGACCACTGCAGCCACCATCATCCAGCAAGGGAGTGGGCTC +AGCCTTCCCTCCGTGATAAGAGGATACAGAGAACACTTGCACCAACACAGCAGAGGCCCC +GGGAGCAGCAGACACAGACCCGAGGTGGGGGCATCTGTGCCCGAGAGCCTGGCAAGCAAA +GGACAGCGGCCCAGGCTCAGTGGAAGGCGGGCAGCCCCTACGCCCCTGAAGAGCCCCAGG +TAAGGGAGTCACCTGGCCTGGTTCATGCCTTTAAAGCATGCTCTGCTGCTGTGTGGCGAA +GGGATTTGGAGAATGCAGGAATCACAGGCAAACCTTCAGGACCTGTGTGGCCAGCCCTGC +TCGGGCTCACCTGTCCAGACACCCTGGCCTCCAGCCACACAAGCCACTGGCCACGTCAGG +AGGCCCCTCTGCCTGAAACACCCTTTCTGCCCAGACACCGCGCAGCTCCTCCTCCTGGTC +TTCACTTAAACACCCCTCCAGGATGCATCCCCGGCAGTGGCTGATCTGGCATGCGCAGCC +CCAGCCACTCACTGGCCTCTTCATCGAATCCAAGCCGCCTTTCACTCAGCTCTGTCGGTT +ACAGGTCAACACCAGGAGGGCAGCATTTGTCTCTGGCTCCCAGCGCAGTGCCCGCTGCAC +ACATGGATGCGTGGCCCACTCCTCGGGGCCTTTGCATTTCCTGTTCCCTTGGCCTGGAAC +GCTCCCTCCCCGAGTCCCTGATCACTGGTGCAGCATCTGTGCCTGCGATCCCTCGCTGGT +GGCCACTCCCTGCCACCCCGTGGAGACACCCAGCTCTCCAGCCCCTTCCCTGTCTCTCCA +GCCGCACTCTGCAAGTGCAGGGGTCTGTCTCTTCTTCTCTGGCTGCGGCCCAGAGCACAG +TGCCTGGCACGACAGCAGATGCCCAGTGTTTGGGGGCAGGAGACCCTGGCCACTCTGTAC +AGCACAGGGATCTGCATCCAGACAGACCACAAAGGAGAAAACTGGACTGGGGTGGCAGCG +GCAGAGGACAGGCCAGGGCAAGGCCCACTTCAGACCCTTTGGGCAGCGTGGAGGAGGAAG +AACAAAGGCCAGGGCAGGGCCAGACGCGTGAAATGTCACAGTAGCAAGTTTACGGTGATG +GAAGTGCCCGGTTAAATAATAAACCACAATCAAGAAAGCAAAGTGAAGGAGCAGTTTCCC +ACCGCCCTCCCCAACAGCCTGCTCAGGCAGAAACACGTGTTCCAGACTTACTATCTTGGG +ATCATTAATGGCTGCAGGATGCCCAAACTCCGTGATCATTTTCCAAGTCACGTGATTAAG +GATGCGCACCTGAGGAAGGAAACCATGCACAGGTGAGGCAGGGCCCGGCCCGCTGGGCGG +TCGGACTTCCTGAGTGCCCTGCACTGGTTCCCACCTTTCCATCATAGCTCCCAACTGCCA +GGAACTGACTGCTGGGGCTCCAGGCCACAGACTTGATGCCCAGGGACCACTCGTAAGCGC +TGTACGTGGACAACAACCGGCCATCCAATGAGTACAGCAGAATCTTGTACTGCAGATGAG +ACATTTCAGTTAATAATGAATACACCCCCGTCGCCAGGAACACACCACAGACGCGGGTGC +TGCAGAGTGACATTGGTGCAGATAGCACAAAGCTGGCAGGACTGTCCGCGTGGCCGTGGA +AAAGCTGGAACTGCCAGCTAGTACTGAGATAGTCACGGAGAGGCAGTGAGAGCATGAGGA +AAAAGGGGAAATTGGGAGGTCAACCTAATGGCTCGCTGATAAAAGTTCAACTCGGCCGGG +CACTGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCCGAAGCTGGCAGATCACTTG +AACACAGAAGTTCAAGAGCAGTCTGGGCAACACGGTGAAACCCCATCTCTACAAAGAATA +CAAAAATTAGCCGGGCGTGGTGGTGCATGCTTGTGGTCCCAGCTACTTGGGAGGCTGAGG +TAGGAGGATCACTTGAGTCCAGGAGGTCGAGGCTGCAGTGGGCCGTGATCACACCACTGC +ACTCCAGCCTGGGTGACAGAGCAAGACCCTGTCTTTTAAAACAAAGCTCAACTTGTTATC +TGAAATAAGATAAAGCAAACTATATTGCAGCATTCAGAAAGCATGAAATTCCGGGAAAAG +CTCTCGAAAGCAAACATGTCACCTGGTCATCTTCATACCTCCAAGCAGGTGTCCCACACT +GCCAGCACACAGCCGTTTGGGGCCCACTCAATCCCTGTGAGATCCTGGGTGTCCGTATCA +AAATGCTTCCAAAGGAAGGGGGGGAAACATTAAATTTGGAAAATATTTTCGTAAATAAAT +AATTGCATTTATGACTGATGTTCTTAACGCACTTAATTTCCTTATATAGAAATTGACAAA +ATCTCAACAGCTCTATCCTGGAAATGCATGAAATCCCTGTAGAGCTGCTGCTGGGGCTGC +ACCGCCACAGATGCCAGCGTCAGTGCCTGGCCAGCCCCCAAGGGCGGCTTGGTCTCCCCG +CGCCTGCACTCGTGTGCACACTCTCCCCCTCACCTTTCCTTGCCTGGCCAGCCCCCGAGG +GCGGCTTGGTCTCCCCGCGCCTGCACTCGTGTGCACACTCTCCCCCTCACCTTTCCTTGC +CTGGCCAGCCCCCGAAGGTGGCTTGGTCTCCCCGCACCTGCACTCATGTGCACACTCTCC +CCCTCACCTTTCCTTGCCTGGCCAGGCTCACTCCTTTAGACCCAGCTCAGACAAGTCCCT +TCCAGAGCACTGCCTGGATCCCGGGTTCTGCACTCTGACAGCATTCCAGAGGTTGCTCTA +CCTTAATGATGGATTGTGCTGGAATCGTGTTCATATGTCTGCTGTGGGGGCAGTGCCCTC +TGTGCCTGGGCACCTGGCAGAGCGCCCTGCCTAATGCAGGCCCTCAGTCAAGGTGAACTT +CCACGTCCCCCCAACTCCCGACGTGGCACACACATGCGCAAACACCATCACACAGGACAA +GGAAAAGGGCTCAAATGTGACAGCATATTCACTTTTAAAACACCTGGGCACGCGTCCTTT +TCACCAAGTCTCCTGAACACACAACCGGGTGCCACTGGAAGTGATTCGCAGCGCACCTGC +CCTTTGTTAATACAACATCACCTTGCTCCATATCCTACCAAAGATCCCCTGGAATCTGGA +AGGATCTACTTCACTCGATCCCTCCACAGTCAGCAGGACAACTTTATTCCAGTCTGGGGG +ACGCCTTACCCGCAGGAGCTGCCAATCACTGCAGACGAAGATGCTCACGTAATCTTTGCA +GTCGCGCCGTTCTGCCAGCGCCATGTAGCGGCCGTCCCTGGTGAAGGTGATTC +>ENSE00003789737 Reversed: +CGTTCCTTGTCGCCAGGAAGTAGCTGTCAGGACTAAATGCCAGCATTCCTATGCCGATTT +TCGGGTTTGCTCTGTCGGTAACAGGTTTCAGTGTCTGTAAGGAGACTGGGACAGAGGCGA +TCTCAT +>ENSE00001852362 Reversed: +GGGGCTGTGGAACAAGGACGCCCCTGGGCTCCTGGGGAGCGCCTCCTGTGTGCCAGGCTG +CACCTGTCCTGACCCCCATCCTGAGCACACACCGAGCCCCGGGGTGGGCCCGTCGGCACT +TGGGGCACCGCTTCCTCTACCTGCAACCTTCAGATGCCCTCATGCCCCTGTGGGATGGGT +GCTTTTACTATGCCCATTTCAGCGATGAGGAAACAGACACATAGGAAATGCCCAGAGTCA +AGAGGCTGCATCAGAACCGGGCCTCAAGCCGGAGACAGCGCTCGGGAGCACCGCCGGGTT +CCAGACCCACTCTGAGCGCCACCCACGGAAAAGTGTTTCTTTGAAAAACATCATTCTCGG +AGCTCCGGAAAAACATCCCCTCGGAGCTCCCGCTGTCAGATCCGGGTCTCCAGGGCTCAT +ATTCAGTAACAGAAGCCGCACCTTCACGGCCCACTGCGCAATTCAGACCCTAGTCAACCT +CCAGCCAACAGGCTGAGGGGCACACTGGCTGGAAGCATGGAAGGGAAAAAAAGTTTTTTT +TTTTAAACATAAGGAACATCCGAAGTTTATCTGGACAACGAGGAATCTTGCATTAAAAAA +GGAAAACAAATGACATCACATGTGCTACTTACATTTACTCTCTGAGCTCGGGAGAGGGCC +GGCCCCGGCCCGGGGCGGCGGGAAGGAGAGGCAGCCCAGTCCCAGCTGTGGGCTCTTCTC +GGCCTCCTTATACACCAC +>ENSE00001924010 Reversed: +AAACATAAGGAACATCCGAAGTTTATCTGGACAACGAGGAATCTTGCATTAAAAAAGGAA +AACAAATGACATCACATGTGCTACTTACATTTACTCTCTGAGCTCGGGAGAGGGCCGGCC +CCGGCCCGGGGCGGCGGGAAGGAGAGGCAGCCCAGTCCCAGCTGTGGGCTCTTCTCGGCC +TCCTTATACACCAC +>ENSE00001659258 Reversed: +ATTTACTCTCTGAGCTCGGGAGAGGGCCGGCCCCGGCCCGGGGCGGCGGGAAGGAGAGGC +AGCCCAGTCCCAGCTGTGGGCTCTTCTCGGCCTCCTTATACACCAC +>ENSE00001813324 Reversed: +CAAGAAAGCAAAGTGAAGGAGCAGTTTCCCACCGCCCTCCCCAACAGCCTGCTCAGGCAG +AAACACGTGTTCCAGACTTACTATCTTGGGATCATTAATGGCTGCAGGATGCCCAAACTC +CGTGATCATTTTCCAAGTCACGTGATTAAGGATGCGCAC +>ENSE00003685083 Reversed: +TATCTTGGGATCATTAATGGCTGCAGGATGCCCAAACTCCGTGATCATTTTCCAAGTCAC +GTGATTAAGGATGCGCAC +>ENSE00003653006 Reversed: +TATCTTGGGATCATTAATGGCTGCAGGATGCCCAAACTCCGTGATCATTTTCCAAGTCAC +GTGATTAAGGATGCGCAC +>ENSE00001866903 Reversed: +TGGCTGCAGGATGCCCAAACTCCGTGATCATTTTCCAAGTCACGTGATTAAGGATGCGCA +C +>ENSE00003492457 Reversed: +CTTTCCATCATAGCTCCCAACTGCCAGGAACTGACTGCTGGGGCTCCAGGCCACAGACTT +GATGCCCAGGGACCACTCGTAAGCGCTGTACGTGGACAACAACCGGCCATCCAATGAGTA +CAGCAGAATCTTGTA +>ENSE00001896684 Reversed: +CTTTCCATCATAGCTCCCAACTGCCAGGAACTGACTGCTGGGGCTCCAGGCCACAGACTT +GATGCCCAGGGACCACTCGTAAGCGCTGTACGTGGACAACAACCGGCCATCCAATGAGTA +CAGCAGAATCTTGTACTGCAGATGAGACATTTCAGTTAATAATGAATACACCCCCGTCGC +CAGGAACACACCACAGACGCGGGTGCTGCAGAGTGACATTGGTGCAGATAGCACAAAGCT +GGCAGGACTGTCCGCGTGGCCGTGGAAAAGCTGG +>ENSE00003669982 Reversed: +CTTTCCATCATAGCTCCCAACTGCCAGGAACTGACTGCTGGGGCTCCAGGCCACAGACTT +GATGCCCAGGGACCACTCGTAAGCGCTGTACGTGGACAACAACCGGCCATCCAATGAGTA +CAGCAGAATCTTGTA +>ENSE00001839399 Reversed: +CTTTCCATCATAGCTCCCAACTGCCAGGAACTGACTGCTGGGGCTCCAGGCCACAGACTT +GATGCCCAGGGACCACTCGTAAGCGCTGTACGTGGACAACAACCGGCCATCCAATGAGTA +CAGCAGAATCTTGTACTGCAGATGAGACATTTCAGTTAATAATGAATACACCCCCGTCGC +CAGGAACACACCACAGACGCGGGTGCTGCAGAGTGACATTGGTGCAGATAGCACAAAGCT +GGCAGGACTGTCCGCGTGGCCGTGGAAAAGCTGGAACTGCCAGCTAGTACT +>ENSE00003387437 Reversed: +AATGAGTACAGCAGAATCTTGTA +>ENSE00003480267 Reversed: +CTCCAAGCAGGTGTCCCACACTGCCAGCACACAGCCGTTTGGGGCCCACTCAATCCCTGT +GAGATCCTGGGTGTCCGTATCAAAATG +>ENSE00003485438 Reversed: +CTCCAAGCAGGTGTCCCACACTGCCAGCACACAGCCGTTTGGGGCCCACTCAATCCCTGT +GAGATCCTGGGTGTCCGTATCAAAATG +>ENSE00001857368 Reversed: +CCGCAGGAGCTGCCAATCACTGCAGACGAAGATGCTCACGTAATCTTTGCAGTCGCGCCG +TTC +>ENSE00000734306 Reversed: +CCGCAGGAGCTGCCAATCACTGCAGACGAAGATGCTCACGTAATCTTTGCAGTCGCGCCG +TTCTGCCAGCGCCATGTAGCGGCCGTCCCTGGTGAAGGTGATTC +>ENSE00000734303 Reversed: +CCTGCAGACAAGCTTTCGGGTATTTGATGTAAGACACGGATTTTGTGCACAAGGACCAGA +CGGTTATCCGCAG +>ENSE00001854631 Reversed: +CCTGCAGACAAGCTTTCGGGTATTTGATGTAAGACACGGATTTTGTGCACAAGGACCAGA +CGGTTATCCGCAGCTGTTGGGGGAAAGGGGAAAGAGAAAGGAAACACTTCTTTAGCATCA +TCAGAGACCGTCTCAATCCTCAACCCGCCCACGCGTCCCCAAGCACAGGCCTGACTGCTG +GAGTGGATCTATCAGGACCTGGGGGATGCCTGCCCTCCTACCGGAATATTCAAATGCGTA +TTTTACTGTGGTTACGGTAAATTTGGTGTTCTTGGTTTTCTGTTGTTGTTGTTTTATACC +AAAATTGAGTGACACAAAGTTAAATCCAAGTGCTTTTTCATTAGCTTTTTCAAAGTGACC +ATAGGTTGCATGTTATAATAACCCTGAGTTACTCAGAGAAAAATCTTGATCTAGAAACCA +CCACGGGTTCAGTCTCCTTTATGGGAAGACAGAGGATCTGGAGATTGGATGCAGCCACTC +CGGGACTCACCAGGGGGCTGTGAGCCTGCATCTGCAGCCCTGAGGCAGGAGCAGCCACTC +AACACCCAAGAAGGTGTCCGTCTGCCTCCTGCGTGTGCTCGCTGGCCTGGCTGCATCTGC +AGAGGGTTCTAGAACATGCGCTGCTGGACTGTCCACTTTTCCACCCCTTTCCCTGACTCA +GGGAGCTGAGAGCTGACTAGGCTGGCACAGTGAGGCCAAAAGATGATTTTCTAACCAGGC +CGACGAGGGCGTGCCTGCTGAGGGAGAGGCACCGCAGTGGGTGGTCCAGCCCTCCCCGTG +GCAGCGCCGCGGGACTTCCAGGGCTGCTGTGTCCCTCCACCTGCATTTCCCACTGAGACC +CCGTGGAGCCTACCAGGGAATCATCTTGCTTCCCAC +>ENSE00000734299 Reversed: +ATGGAATTCCGTGGTGTTGAGAATGTGGCGCCCGTCCGGGCTCCAGCACGAGGCCACCAG +CCCGGCTGAGCCCTCGTCTATTTTGCAGTGCCATTCGGGCTGCTCTAAAGACCAGAC +>ENSE00001931622 Reversed: +TTTAAATGTTCTTAAACTTTAGAGAACGTTATAATTTCAAAAGAAAACTGGCTTTGAGCT +GCACGGACTTTTTTTTCAAACTAGAAAGGCACAGAACAAAACCCCTCCTTCCCAGGGGCC +CTCAGAAGGTGTCCAGATTCTAAGCGACACGGCAGCACACACCTGCACCAGCCCTCGCTT +GTACATGGCGCACAGGATGAAGAGCGAGTCTGCCGACCACTCGATGTGCTGGATCTGGTC +TAGGCACGTGTACAGCTGAAGGATCTGAAGGGTGTTCACATCCCGGACCACTAACCGGTA +CTGGACACAGGAAGC +>ENSE00003566716 Reversed: +CTGCACCAGCCCTCGCTTGTACATGGCGCACAGGATGAAGAGCGAGTCTGCCGACCACTC +GATGTGCTGGATCTGGTCTAGGCACGTGTACAGCTGAAGGATCTGAAGGGTGTTCACATC +CCGGACCACTAACCGGTACTGGACACAGGAAGC +>ENSE00003677298 Reversed: +CTGCACCAGCCCTCGCTTGTACATGGCGCACAGGATGAAGAGCGAGTCTGCCGACCACTC +GATGTGCTGGATCTGGTCTAGGCACGTGTACAGCTGAAGGATCTGAAGGGTGTTCACATC +CCGGACCACTAACCGGTACTGGACACAGGAAGC +>ENSE00001870155 Reversed: +CAGGTACTTGCCGTCCGGGGAGAACTTGCAGAGTAAGCTGGAGAGCTTGAATACCTCGGA +GAAGTTCATGGCCGCCGCCTGCCGCGGGCGCCACCCTGCGCCCGAAAACCCGCGGGACCC +CTGGGCGC +>ENSE00001477063 Reversed: +CAGGTACTTGCCGTCCGGGGAGAACTTGCAGAGTAAGCTGGAGAGCTTGAATACCTCGGA +GAAGTTCATGGCCGCCGCCTGCCGCGGGCGCCACCCTGCGCCCGAAAACCCGCGGGACCC +CTGGGCGCGCAGC +>ENSE00001680820 Reversed: +CAGGTACTTGCCGTCCGGGGAGAACTTGCAGAGTAAGCTGGAGAGCTTGAATACCTCGGA +GAAGTTCATGGCCGCCGCCTGCCGCGGGCGCCACCC +>ENSE00001748742 Reversed: +CAGGTACTTGCCGTCCGGGGAGAACTTGCAGAGTAAGCTGGAGAGCTTGAATACCTCGGA +GAAGTTCATGGCCGCCGCCTGCCGCGGGCGCCACCCTGCGCCCGAAAACCCGCGGGACCC +CTGGGCGCGCAGCAGGCTGCAAC +>ENSE00001836154 Reversed: +CAGGTACTTGCCGTCCGGGGAGAACTTGCAGAGTAAGCTGGAGAGCTTGAATACCTCGGA +GAAGTTCATGGCCGCCGCCTGCCGCGGGCGCCACCCTGCGCCCGAAAACCCGCGGGACCC +CTGGGCGCGCA +>ENSE00001858739 Reversed: +CTGGGCTCGCAGCTCCGAAGCTGGGAGGTGAGGGGAGAGCGATCGGGGA +>ENSE00001475277 Reversed: +TTTTTTTTTTTTTTTTTTTTTTGAGACGGAGTCTCGCTCTGTCGCCCAGCCTGGAGTGCA +GTGGCGTGATCTCGGCTCACTGCAAGCTCCACCTCCCAGGTTCATGCCATTCTCCTGCCT +CAGCCTCCCGAGTAGCTGGGACCACAGGTGCCCGCCCCCACGCCCGGCTAATTTTTTGTA +TTTATAGTAGAGATGGGGTTTCACCGTGTTAGCCAAGATGGTCTCGATCTCCTGACCTCG +TGATCTGCCCGCCTCGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACCGCGCCCG +GCCCATCTTAACCATATTTAAGCATCATGCACATTCACATTGCGGTGTAGCCATCAGCAG +CATCCATCTCCAGAGCTCTTTTCCTCTTGCAAAACTGAATCTCTGTACCCATGAAGCACC +AACTCCCCATTCTTCCCACCCCCCAGCCCCTGCCAACCACCATTCTTAGATGTGATATCT +TTGTTAGAGCAGATTAACTTGCTCTCAGGTGTATGGTCTGCGGCCATTGACTCAAGCACA +GGGAATGAGAACTTCTGGAAGTGGGCCTGGACATCTGAATTGCACAGGCTTCCCAGATAG +GTACGAAGGAACAAGAAACAAAACAAACATTACCGCAAATGAAACACTGTGTAAATATGT +GGATTACATCCTGTAAGTACGAAGAGAATGGAAGGCATTTATCTTGTTATTGTCACTGGG +GCAGATCCGGAGTCAGCTCTGGGCGGAGATGGATTTACCCTGGAGCTGCTGAAGCTTAAG +CTGGGGGCTGCTCAGGAGCCTGGATGTAGAGTAGGAAGCAGTTCTGAGCATGGAGGGGAA +GCCAGGTGTGCCAGCCAGAAGCATC +>ENSE00001475269 Reversed: +CACAGGCTTCCCAGATAGGTACGAAGGAACAAGAAACAAAACAAACATTACCGCAAATGA +AACACTGTGTAAATATGTGGATTACATCCTGTAAGTACGAAGAGAATGGAAGGCATTTAT +CTTGTTATTGTCACTGGGGCAGATCCGGAGTCAGCTCTGGGCGGAGATGGATTTACCCTG +GAGCTGCTGAAGCTTAAGCTGGGGGCTGCTCAGGAGCCTGGATGTAGAGTAGGAAGCAGT +TCTGAGCATGGAGGGGAAGCCAGGTGTGCCAGCCAGAAGCATC +>ENSE00001890428 Reversed: +CCGCAAATGAAACACTGTGTAAATATGTGGATTACATCCTGTAAGTACGAAGAGAATGGA +AGGCATTTATCTTGTTATTGTCACTGGGGCAGATCCGGAGTCAGCTCTGGGCGGAGATGG +ATTTACCCTGGAGCTGCTGAAGCTTAAGCTGGGGGCTGCTCAGGAGCCTGGATGTAGAGT +AGGAAGCAGTTCTGAGCATGGAGGGGAAGCCAGGTGTGCCAGCCAGAAGCATC +>ENSE00001475263 Reversed: +TTTTATTGCAGTTCACTTTATTGCACGTCAAGATATTGCCTTTTTTTTTTTTTAAACAAA +TTGAAGGTTCGGGGTAACTCCAGAGTCAAGCAAGTCTATTGGCAACATTTTCCCACGAGC +ATGTGCCCACTTTGTATCTGTGTGTCACACTTTCGCAATTCTTGCAATATTTCAAACTTC +TTCCTTATTATATCTGTTGTGAAGCTGGTTCTCCCAGACGTTCCCTGCAGGCTGTTTATG +CAGCGCCCATCCGAGATGAACCCACAGGACACTCAGGATCCCAGACTGCAGGAGTCGTCT +GGGATCACAGGCGGGGCAGAGCAATTTGTCAATGTTTATGAGGAGTCCTCCTTGGCAGCC +CAGTCTTTATCCTCACTCACGTGGAAATGAGATTCGACCTCTCCTAATCACCTGGTGCCC +GAGGAGCAGGTAGGCGCCTGTCCCAAGCCTGAGTTTCCTGGGAAATCTACATTTCAGCAC +AGATGGGTTCCCAGCAGCTTAGTGCTCTGGCTGTCCTTAGGTCACTGAATCATTTCACCC +GCTAGTTTTTTGTTTGTTTGTTTTTGAGATGGAGTCTTGCTCTGTCACCCAGGCTGGAGT +GCAGTGGCGCGATCTCGGCTCACTGCAACCTCCACCTCCTGGGTTCAACTGATTATCCCT +CCTCAGCCTCCCAAGTAGCTGGGGTTACAGGCACCCGCCGTCATGCCCAGCTAATTTCCA +TATTTTTGTAGAGACGGGGTTTCACCATGTTGGTCAGGCTGGTCTTGAACTCCTGACCTC +AGGTGATCCGCCCACCTTGGTCTCCCGAAGTGCTGGCATTACAGACGTGAGCCACTGCGC +CCGGCCTTGCCCACTGGTTTTATGAGAAAGAGACATGGGAGCCTTTTCCCCAGCTGGGGC +AATCATCAGACAGTCACATGGAGTCACAGAACCATCTTGCAACAGCATCCCAAGACCTGG +CCATTGGGCAGGATGTGGGACTTGTGAAAGGTCATAAATGACCCTTTGAATCAGTCTCCC +TCTGCACAGGAAAAGCCCACCGCCCTGCGTTCACCTTTGCCCATCAGATAGGGCTTGGGG +GGCACCTGAGGAGGAGGTGCCTGCCACTGCCTGTGGAGGAGGATGTTGGCGTTCCTATTT +CACAAGCCCGGCTTGGAGAGCCAGCGGAGACCTTCTGCGCAGCTAGCTCTTGCACACACC +CCTGCGGAGAAACTCTGCCTTCTTGCCTGGGGCCCAGAACCTTACCCACCCAGGCTTGCC +CCCTCCCTTCCAGGGCCCACTGACCTCCTGACTCAGGCTCCCCCGAGTGCCTGACCCTGT +GAGTCACTGGCCCATCTACAATCCTTCTCCCCGTGACTGCTTGAGTTGTAGCTTGATTGG +AGCCAGGTCAATGCAAGTCACAGAACTGCGAACTGAGATGGACTCTCAGAAGCAAGAGGT +GGCAAGCATGGCGGAGAGGAAGCGAGGGTCCTCCTGGCTGGTTAGATCTTACAGAGTTTA +AGCTGTACTGAGAGTTTTTATGAGGACAAGGGGCCAGTCCTGTGCCTGCCTGATGTGGAG +TCCTAGGCGGGCTTGGGCCGCAGGTTACCTGCTCCCGGAGGCTCACAAAGGCAGTGCCAA +CAGGCGCTCATTCTCAGCAATGGGTGAAAGTAAGAGGAACCTGCCCTCCCTCCTCTCCAC +ACCTCCCCAGTATTTGTCCTCATGGAGTAAATATCCAACAGTGATCCCAGGGCATGGGAG +TGGGAGTTAAGGCAAATGCCAGACTGTCCAAGGCTCATTACAGGGTAGTCCTCTCATCCT +CTGCTCACTAGTCCACTATATTCAGTGAGCACCCACTGTGCACCCTGTGCCTTGGGGACG +TGGAGGCACGCTCAGCCCCAGCCTCGCCCTCCGGGAGCTTACAGTCTAACCCTCTGGGCA +CAGGGAGGTGGGAAGATGGCACGGCCTTGCTGGGAGCCTCACCCTGTTGGCTGAACAATG +ATTTTTTCAATAATGCCTACAGCTTCCTTCATATCCTGCCACCCAAACCAGTGCCAAGGT +CATCATGGGCTTGTGTGGCACAGTCAGATTTAGTGACCATCCCCACTCCCACATTGGTTC +TGTCTTCTTGCCCCCGGTGCTCTGGTCCCTAGCACAGGCTGCTGATTTGGGGACTCGGGG +GAGAATCCTCCACCTTCTGCAAATGCTTAGCCATGAAATGACGGGTGTTTGCCTGACTAT +GATTTCATGAATCCCCCATGAAATGATGGGTGTTTGCCTGATTATGGGCCAACAGTGCCC +CCCACTCCTCGTGGGCACTCCTGGGATCAGCAGCCCCTTCCTAGCCTTCACAGGGACTCT +AGGCCTCCATGGAAAAGAAAGAAATAAAAAATTTTTTTTGAGACAGAGTCTTGCTGTGTC +ACCCAGGCTGGAGAGCAATGGCTCAATCTTGGCTCACTGCAACTTCAGCCTCCGAGGTTC +AAGTGATTCTCTTGCCTCAGCCTCCCGAGTAGCTGGCACATGCCACCACACCCGGCTAAT +TTTTGTATTTTTAGTAGAGACGGGGTTTCACCATATTGGCTAAGCTGGTCTCGAACTCCT +GACCTCAGGTGATCCACCCGCCTTGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCA +CCGCGCCCGCCCAGAAAGAAAAATCTTAACAAGTTGCTTCCAGTAACCAGTCTCAATGAG +TAGCAGGGAGTAGTTTGCAAGAAAAAAAAACAAGTGAAGATGTTTCCCATTCTTTAACCT +GCTCCATCCCTCAAATTCCTGCTGCTCCATGGCAGGGGCCCTGCTCACCCCACATTGGCA +CAGACTCTGCTGGAGTCAGATCCTCCAAAGCCACAAGCTTCCTTGAGGCCACGGGGCCGC +CTCATTCTTGTTCTGCCCCTTCCTCACACTGAAAGACTGCATAGCCTGGGGTGCAATGCC +CAGGTGTGAAATTGATGCTCGGGAAAACAAATCCTTCCCAAAGTCACTTAAGGAATCCCC +CAGCCCCACCGCACAGACCCCTGGATGTATACTGCCCCTATAATTCTGCTCTAGGCAGAA +AAGCCTAGGAGTGGAGGTGACAGCTCCCAGCATATGCACCCTTTTGCTCTGCTCTGCTGC +CCTGTAGAGCCCTGGAAGTGACCAGAGCCCTTAGGCTACTGCTGCTGCATGCCCAGAGGG +TCCCAAGCAGAGCTGGGCAGGAGGTAGGCCCAGGCAGGGCTGGGAGAGCAGTGACCAGGC +AGGGTGCACGGCTGCACTTTGCCCAGGTCCTGGCTCTGGCTCTGGTCTGGTGCCAGTGCT +GGGGTGGGTGTGTCGGCTGCCCACGCAGCTGCGGGGTCCAGTTCCAGAACTATCTCCACC +AGCTGGGATGGGGGGCTTCTTCTTCACCCTGCTGCCTCTTGTCCTTTCTTCTCCAGCCAA +GTTGGGGGTGAAGCAGGGACGCTCCTTTTATTCCCTGAGCCGAGCCCCAGCCCCAGGGCT +TTCAGTCTGCCACGCCAGTCACAAACAGCCGGCTTCCGGCCTGGGTGTGGGTACTGGGCT +GGCCCCTAATGATGGGAACAGCAGCCGCCACCAAGAGCTTCAACCTGTCCAGTGCCCCAA +GGTCCCAAGCAGTCGGCAGGGTCTGTGGATCGGCCGAGGGGCTACCACGGCCGCCAGAGG +CCAGGGCCGCAGGGAGGCGAGGGCGGCGAGGGCACCGGAGCGGATGCGGGCTCTGGGGCA +GACGCGGGCGCTGGGGCGGGGGCAGACGGGCCACTGGAATCCCCAGCGCGCCCGCCGTCC +AGGGTGGCGCTGGCCGCTCTCCGCCACAGGTGCTCCAGCAGGCGCGCGCTCACGGCGGGC +TCCAGGACACGGCAGGCGGGCAGCACGCGGGCCAGGCGCGCCACACAGGCGCTGTAGCCC +TCGCGGTAGCTGTCGCAAGGCA +>ENSE00001948071 Reversed: +CTCCTGACTCAGGCTCCCCCGAGTGCCTGACCCTGTGAGTCACTGGCCCATCTACAATCC +TTCTCCCCGTGACTGCTTGAGTTGTAGCTTGATTGGAGCCAGGTCAATGCAAGTCA +>ENSE00001854189 Reversed: +CCAAGCAGAGCTGGGCAGGAGGTAGGCCCAGGCAGGGCTGGGAGAGCAGTGACCAGGCAG +GGTGCACGGCTGCACTTTGCCCAGGTCCTGGCTCTGGCTCTGGTCTGGTGCCAGTGCTGG +GGTGGGTGTGTCGGCTGCCCACGCAGCTGCGGGGTCCAGTTCCAGAACTATCTCCACCAG +CTGGGATGGGGGGCTTCTTCTTCACCCTGCTGCCTCTTGTCCTTTCTTCTCCAGCCAAGT +TGGGGGTGAAGCAGGGACGCTCCTTTTATTCCCTGAGCCGAGCCCCAGCCCCAGGGCTTT +CAGTCTGCCACGCCAGTCACAAACAGCCGGCTTCCGGCCTGGGTGTGGGTACTGGGCTGG +CCCCTAATGATGGGAACAGCAGCCGCCACCAAGAGCTTCAACCTGTCCAGTGCCCCAAGG +TCCCAAGCAGTCGGCAGGGTCTGTGGATCGGCCGAGGGGCTACCACGGCCGCCAGAGGCC +AGGGCCGCAGGGAGGCGAGGGCGGCGAGGGCACCGGAGCGGATGCGGGCTCTGGGGCAGA +CGCGGGCGCTGGGGCGGGGGCAGACGGGCCACTGGAATCCCCAGCGCGCCCGCCGTCCAG +GGTGGCGCTGGCCGCTCTCCGCCACAGGTGCTCCAGCAGGCGCGCGCTCACGGCGGGCTC +CAGGACACGGCAGGCGGGCAGCACGCGGGCCAGGCGCGCCACACAGGCGCTGTAGCCCTC +GCGGTAGCTGTCGCAAGGCA +>ENSE00001914446 Reversed: +AGGGTCTGTGGATCGGCCGAGGGGCTACCACGGCCGCCAGAGGCCAGGGCCGCAGGGAGG +CGAGGGCGGCGAGGGCACCGGAGCGGATGCGGGCTCTGGGGCAGACGCGGGCGCTGGGGC +GGGGGCAGACGGGCCACTGGAATCCCCAGCGCGCCCGCCGTCCAGGGTGGCGCTGGCCGC +TCTCCGCCACAGGTGCTCCAGCAGGCGCGCGCTCACGGCGGGCTCCAGGACACGGCAGGC +GGGCAGCACGCGGGCCAGGCGCGCCACACAGGCGCTGTAGCCCTCGCGGTAGCTGTCGCA +AGGCACTGCGGGCGGAGAGCCGCGTGAGGCGCGGGGTAGGGTGCCGGGTGCGGGGTGCAG +AGCGCGCGGCAGGGCAGGGAGGGCTCACTCACGGGGCGCTGCCGTGGGCCATGAGGACGC +AGGCAGCTCCTGCAGGAAGCGCACGGTCATTTCCAGGACGTCTGCCTTCTCTAGCTTCGA +GCAGTTGGAGTT +>ENSE00000734533 Reversed: +GGGGCGCTGCCGTGGGCCATGAGGACGCAGGCAGCTCCTGCAGGAAGCGCACGGTCATTT +CCAGGACGTCTGCCTTCTCTAGCTTCGAGCAGTTGGAGTT +>ENSE00002817476 Reversed: +CTCCCGGCCCAGCAGCGGCAGGATGAGCCCCTTAAGCTGGCTCAGGCTCTGGTTGATGCG +CGCGCGCCGGCGCTTCTCCAGCAGCGGCTTCAGGCT +>ENSE00001916716 Reversed: +CTTGCGCAGCTCCGCCGCGTCCCCTGCCCGGCGAGGCAGCCCCATGCTCCGCGGGGAAGC +GGTGGCAGCTGCGAGCCCCACGCAAAGGGAAACCGAGGTCCGAAATGAGGTCCCGGGCGC +GGCCCGGGCTGG +>ENSE00001475267 Reversed: +CTTGCGCAGCTCCGCCGCGTCCCCTGCCCGGCGAGGCAGCCCCATGCTCCGCGGGGAAGC +GGTGGCAGCTGCGAGCCCCACGCAAAGGGAAACCGAGGTCCGAAATGAGGTCCCGGGCGC +GGCCCGGGCTGGTGCCAGACGAGT +>ENSE00001475271 Reversed: +CTTGCGCAGCTCCGCCGCGTCCCCTGCCCGGCGAGGCAGCCCCATGCTCCGCGGGGAAGC +GGTGGCAGCTGCGAGCCCCACGCAAAGGGAAACCGAGGTCCGAAATGAGGTCCCGGGCGC +GGCCCGGG +>ENSE00001835288 Reversed: +CTTGCGCAGCTCCGCCGCGTCCCCTGCCCGGCGAGGCAGCCCCATGCTCCGCGGGGAAGC +GGTGGCAGCTGCGAGCCCCACGCAAAGGGAAACCGAGGTCCGAAATGAGGTCCCGGGCGC +GGCCCGGGCTGGTGCCAGACGA +>ENSE00001475281 Reversed: +CTTGCGCAGCTCCGCCGCGTCCCCTGCCCGGCGAGGCAGCCCCATGCTCCGCGGGGAAGC +GGTGGCAG +>ENSE00001150483 Reversed: +CTCTGGAATTGCGTCGCCGGCGCCTGGAACCGCAGTTAGCGGGCACTGGGCAGATGAATG +AATTTGTCTGTGCCTGGACGGCTCTCCAATTCGAACCCAGTTTTGCTGCCCTCTGGGGTC +TCAACTGTTACGTGAGGCAAATTAGGAGAGAAGCCCCTGGGCACCTTGCCCCAGTCGCAC +GAGTGTCCCCGCG +>ENSE00003790229 Reversed: +TTACATTTTTAATAGACTTTTATTTTGGAATAATTGTAGATTTACAGAAAAGCTGCAAAG +AATAGTACAGAGAGTTCCCTCAAATTCTTCGCCCAGTTTCCTCTAACATTTGCATCTTAC +ACAGCCATGGCACATTTGTCAAAACTAAGAAATTAACACTGGTATTACTTTTAACTAAAG +GCTTTTTTGGATTTTACCAGTTTTTTCACTCATGCCTTGTTTTGTTCCAAAATCCAACCC +AGGATATCACACTGCATTTAATCAAATGTAAATACGTATGCTTTAACTTTTTTATTTTAA +AATAATCATAGATTTACAGGAAATTGCAACAACAACAAAAAAAGTACAGAGATTCTGTGT +ACCCTTCCCCCAGTTTCGTTCAGTGGTAACTCCTTGTATAACTACACAATATCAAAACCA +TGAAATAGATATTGGCACAATCCATAGACAGTATTAAATATACATGCATATATATATATT +TTTAAGTGAAAAATATTTTTAAACCTCGCTTTGCCTCACAGCCAAGAAGATCAAATACTT +TCTCCAAAAACATAGAATTTGTATCTAACTCCACTCGCTCCAAACTCAAGTCCAACCATG +AAATTATTGATCCCTCTCTCTAACCCTCCAACTACAGGCAAGAAGCTGCCCATACATTCC +CCAAAGCAGGAGTGCACTCTGCCACAGGCCTAGATGCCGTCAACCTCCTGGACCTTGAAC +TCCCTAAATTAATGGCCTCTGTGTGAGTATGTGTAAGCAGCCCCTCTCTGTCCCAGTCCA +TCCTAAAATCACTCCCTTGGAGCCACCACTGCCCCTCTCATCTTCTAGAATTTCTAGAAA +GATAAAGAGCTAGATAAGCATCTAGGTACCTTTCTTCTGCTGTTAGCTCTAAAGACAAGT +GAATATATCCTAGCTAGGATGTACTCTAAGGAATGCAGAAGTAGGCCGAGTGCAGTGGCT +CATTCCTGTAATCCCAGTGCTTTGGGAGGCCGAGGTGGGCGGATCACCTGAGGTCAGGAG +TTTGAGTCCAGCCTGGTCAACATGGCAAAGCCCCGTCTCTACTAAAAATACAAAAATTAG +CTGGGCGTGGTGGCGGGTGCCTGTAATCCCAGCTACTCGGGAGGCTGAGGCAGGAGAATC +ACTTGAACCCCCAAGGCAGAGGTTGCAGTGAGCTGAGATGGTACCACTGCCCATTTCAAA +AAAAAAAAAAAAAGAATGCAGAAGTAAATTAAATGACCACAAAGAGTTTTTTTTAATTTG +AGACAGGGTCTGGCTCTGTCACCTAGGCTGGAATACAGTGGCGCAATCTCAGCTCACTTC +AATCTGTGCCTCCTGGGCTCAAGCCATCCCCTGACCTCAGCCTCCTGAGTAGCTGGGACT +ACAGTCCTGCCACTATGCCTGGCTAATTTTTGTATTTTTTGTAGAGATGTTGCCCAGGCT +GGTCTGAAACTCCTGAGCTCAAGGGATCCATCCACCTGGGCCTCCCCAAGTGCTGGGATT +ACAGGCATGCGCCACCGTGCCCAACCCAGACATCACTTTTATCTGAAGCAACAACTATCT +GCTCTTTCTGTTTCCTTACTAATTATCCAGGAACTTTTACAGGTGAACTCTGAGGAGGAC +AATTTTTATTGTTTTTATGTCAGCATAACTAAAAGTAAAGCTGGATAGGAAGAGGTTACT +TGAAAATGATTTCACCTGAACTCAAATGAATAAGCTGGCTACTGCATAAAGCAACAGAGG +GGTCCCTTTAATTTAAAAGCTCAGGACTCTGAATCAATTGCTGGTTGGGAGAAGGTAGAG +ACATTCTTTACTTCTGCCTAGAACTGGGGAAAATGGCGTAGACTTCTGCTCTGAAGCAGT +CCTCAGTGCTGCTTCGGTCAGAACTCCCGAGAGGCATCTGAGTGCTGGCCTGTCACTGCG +GCTGGCATTCCAGGCATTTCATTGGCCCCACTTCAGCCCACGCCTGGCTCCACGGGGCTG +GGCAGCTGAGGGGAGTTTGTGGCAGAGTGGGCATGGGGCACGGCCCGTGCAATGTGCGTT +ACAAAGGGGCTCTCTCTGAAGCAAGTCCTCTGCACTCCAGTCTATTTGAGGAAGAAAAGG +ACAATTCCCATAGGGAGGGGGTTTGCTGAAGCAACCAGCTGCCTGGTTTCCTCTCCAGCA +TTGAGAGGGAGGGAGGGCTGGCTTAACTGGGGGACGGCCTTCTCATCTGGACTGTGTCAA +GGCCAAGGTTAGGCTCCAAATTCCAGAAAACCTCTCTGCAGGGTCTTCTTTCAGAGTGGT +GAGAATGGAAGCAGGCTCCCTTCCCCTCCAGCACTAGGAAGCCCCGCAATTGGTGAGGTG +CAAAGAAAGATGGGCCCAGGCAGGGAGGCGGGAGCAGGGGAGGTGCCCAGGGCAGTGGCT +GGAAGGGCAACGGGAGAAGCAGCAGAGGCTGGGGGTGGGGGTCGCAGCAGGTGCTGTCCC +TGGCCTGTGTGAAAGGTACTAGAAGGCCCCATCCTTGGTGCCACATGGACCCCAGAGGCT +TGTCTTAGTCCATGGGGTCCGAGGTGTAAGACACTTACGTTTGGCGTCACCTCTTAGGCT +TGGATGAATTTCAGAAAGTGCTAGACTGGAGAACAGTGGAAAAAATCAGTGGAACAAGAT +CTGGAGCACTCACTGCTCAATGTCAATGTTAGAGAGCACAACGACACCAATGGGAGGAGG +GTGAGGACCAGAGGCTGATTGCATGAGCTCTGTTGGAGTGCAGGACCCACTAACGGGTTA +TCTCAGGGTTCCTGGAGGCCACGGCTGTGCCTTGTGGTCCAAGACCTGGGGAAGCCACCA +CTGTGTCTTCCCTCTCCATCCTCCGGTGACTTTGGTCCAATTCCTGTTGCCATGGCAATC +AGCCCAGCTGGCCTCACAGTTCACTGGCCTCAAAGTTGGCATCTGTAGGTGAAGCCAGTG +GGACCCAGAGAACTTAATTCTTCTCAACTGAGCTGGCTTGGAGGAACTTTTCTCATCAGC +CACTGGAGCAGAGAACGTCACCAGCGTCTCACTGACGTCAACATCCTGGGCCTGGCTCTA +GCTGAAAAGGAAAATTCTCCCCAAGGCAGACACATCTCCCGAAGCCCACACAGGCACTTT +CTATGATTGCACTGGAAATCTGTCTCCTGGGGACAGGGAGCGCGTACGCTCACAGTCAAG +TCACAATGTTGAGCAGTCTCCAGGACTCCACGTTCATCTCTAAGAACAGGAGCCGGTGGT +TGGGCGCAGATTCTTGAGCCAGATTGCTCGCGTTCAAAACCTGGTCCCTTTTTATTAATT +GCATGCTTAGTTACATTTTCTGTTTGTACTTTTGTTTCCTTCTCTGCAAGACGGGGTTAA +TCACAGACACTTGTACATGATGTAATACACTTACAATACTTAGGACAGGCCTTCCTGCAT +AGTAAGTGCTCTGCAAACACTGGCTACTATTCTCCCTACGTGCAAACTTCTCCCAGCCAA +AAGCCGCCCACACCAAGCCCCTGTGCCTTTTTCCTTCCGCACCCACGAGCAGGCTGCTCC +TGGGGCCCTGGAGCTCACTTTCCCAGCCGCCCTCACCACCCACCGTGGCGCAGAAGAGCT +TCCGAAGTCCTGGCGTCTCCCACTGGTCTGGGCATCTCTCGCTTCATCTTCCCTCTTGGG +CCCCACAACGTGCAGCACTTCTAGGGCAGTATACTTGCTGATTGCTTCCTTACTATTGCT +CACAACAACCAGCTAAGACACTGCCAAAGAAACACTCACAGCTGGCCGGTCCACGGCATC +CGGAGGGGACTCGGGGGACAGGCCTGTCCTGCCTCTCCCCAGCAC +>ENSE00001500136 Reversed: +GGGCCCCACAACGTGCAGCACTTCTAGGGCAGTATACTTGCTGATTGCTTCCTTACTATT +GCTCACAACAACCAGCTAAGACACTGCCAAAGAAACACTCACAGCTGGCC +>ENSE00003787977 Reversed: +CTGGGTGCATGCTGGGACGGGGCGAGCAGGTAGTGCAGGCTTCCAGGCCTCTCCTGCCCC +GGAGCTTGGCTGCAGGACTCCCGCAAAATCTCCAAATGCCCCCGATCTGCGTGGTCACCG +AGAAGCAGCCCGGCTCGGAACAAGCCCAGGCAAGCCCAGGCAGAGCCCGCCGCCGGGTCC +TCCTTCCTGCTCGTGCCACCAGGCCCCGGGGCCGCGACGCGTCTCTCCAGCCCGGGATCC +GGGGAGCTGGGCTGTCCCCAGACCGACGGGACAGCGGCATCTCCTCCACCTGAAAAGGAA +AGAGGACCAGGTGGGGGCCAGGCAGGGCGCATGAAGGCGGCGCCAGCACCGCGCGATCCG +AATCACGTCGGTGCGGGGGAGGGGTC +>ENSE00001658885 Reversed: +CTGGGTGCATGCTGGGACGGGGCGAGCAGGTAGTGCAGGCTTCCAGGCCTCTCCTGCCCC +GGAGCTTGGCTGCAGGACTCCCGCAAAATCTCCAAATGCCCCCGATCTGCGTGGTCACCG +AGAAGCAGCCCGGCTCGGAACAAGCCCAGGCAAGCCCAGGCAGAGCCCGCCGCCGGGTCC +TCCTTCCTGCTCGTGCCACCAGGCCCCGGGGCCGCGACGCGTCTCTCCAGCCCGGGATCC +GGGGAGCTGGGCTGTCCCCAGACCGACGGGACAGCGGCATCTCCTCCAC +>ENSE00001670416 Reversed: +AGTTTGCAGGACTCCGAACTGGGCCCGCGAGATCTCCACCTGCGCAAAACGAAAGGGCGG +ATTCTCCTTGGACTCACGAGGCAACCGCTCCCCGGGGTGAGAACGGGGGACTCATTCCTC diff --git a/pygtftk/data/simple/simple.fa.fai b/pygtftk/data/simple/simple.fa.fai deleted file mode 100644 index bc727746..00000000 --- a/pygtftk/data/simple/simple.fa.fai +++ /dev/null @@ -1 +0,0 @@ -chr1 300 6 300 301 diff --git a/pygtftk/data/simple/simple_peaks.bed6 b/pygtftk/data/simple/simple_peaks.bed6 index b7938e33..523b4bec 100644 --- a/pygtftk/data/simple/simple_peaks.bed6 +++ b/pygtftk/data/simple/simple_peaks.bed6 @@ -1,6 +1,6 @@ -chr1 11 14 peak_1 0 + -chr1 17 20 peak_2 0 + -chr1 22 25 peak_3 0 + -chr1 37 40 peak_4 0 + -chr1 68 70 peak_5 0 + -chr1 42 45 peak_6 0 + +chr1 11 14 peak_1 . + +chr1 17 20 peak_2 . + +chr1 22 25 peak_3 . + +chr1 37 40 peak_4 . + +chr1 68 70 peak_5 . + +chr1 42 45 peak_6 . + diff --git a/pygtftk/data/simple_06/simple_06.gtf b/pygtftk/data/simple_06/simple_06.gtf new file mode 100644 index 00000000..d3aa5a72 --- /dev/null +++ b/pygtftk/data/simple_06/simple_06.gtf @@ -0,0 +1,96 @@ +chr1 gtftk gene 125 140 . + . gene_id "G0001"; +chr1 gtftk transcript 125 138 . + . gene_id "G0001"; transcript_id "G0001T002"; +chr1 gtftk exon 125 138 . + . gene_id "G0001"; transcript_id "G0001T002"; exon_id "G0001T002E001"; +chr1 gtftk CDS 125 130 . + . gene_id "G0001"; transcript_id "G0001T002"; ccds_id "CDS_G0001T002"; +chr1 gtftk transcript 125 140 . + . gene_id "G0001"; transcript_id "G0001T001"; +chr1 gtftk exon 125 140 . + . gene_id "G0001"; transcript_id "G0001T001"; exon_id "G0001T001E001"; +chr1 gtftk CDS 130 132 . + . gene_id "G0001"; transcript_id "G0001T001"; ccds_id "CDS_G0001T001"; +chr1 gtftk gene 180 189 . + . gene_id "G0002"; +chr1 gtftk transcript 180 189 . + . gene_id "G0002"; transcript_id "G0002T001"; +chr1 gtftk exon 180 189 . + . gene_id "G0002"; transcript_id "G0002T001"; exon_id "G0002T001E001"; +chr1 gtftk CDS 180 182 . + . gene_id "G0002"; transcript_id "G0002T001"; ccds_id "CDS_G0002T001"; +chr1 gtftk transcript 180 189 . + . gene_id "G0002"; transcript_id "G0002T002"; +chr1 gtftk exon 181 189 . + . gene_id "G0002"; transcript_id "G0002T002"; exon_id "G0002T002E002"; +chr1 gtftk CDS 180 182 . + . gene_id "G0002"; transcript_id "G0002T002"; ccds_id "CDS_G0002T002"; +chr1 gtftk gene 50 70 . - . gene_id "G0003"; +chr1 gtftk transcript 50 61 . - . gene_id "G0003"; transcript_id "G0003T001"; +chr1 gtftk exon 50 54 . - . gene_id "G0003"; transcript_id "G0003T001"; exon_id "G0003T001E001"; +chr1 gtftk exon 57 61 . - . gene_id "G0003"; transcript_id "G0003T001"; exon_id "G0003T001E002"; +chr1 gtftk CDS 50 52 . - . gene_id "G0003"; transcript_id "G0003T001"; ccds_id "CDS_G0003T001"; +chr1 gtftk transcript 54 58 . - . gene_id "G0003"; transcript_id "G0003T002"; +chr1 gtftk exon 54 58 . - . gene_id "G0003"; transcript_id "G0003T002"; exon_id "G0003T002E001"; +chr1 gtftk CDS 54 55 . - . gene_id "G0003"; transcript_id "G0003T002"; ccds_id "CDS_G0003T002"; +chr1 gtftk transcript 54 55 . - . gene_id "G0003"; transcript_id "G0003T003"; +chr1 gtftk exon 54 54 . - . gene_id "G0003"; transcript_id "G0003T003"; exon_id "G0003T003E001"; +chr1 gtftk CDS 54 55 . - . gene_id "G0003"; transcript_id "G0003T003"; ccds_id "CDS_G0003T003"; +chr1 gtftk transcript 54 70 . - . gene_id "G0003"; transcript_id "G0003T004"; +chr1 gtftk exon 54 70 . - . gene_id "G0003"; transcript_id "G0003T004"; exon_id "G0003T004E001"; +chr1 gtftk CDS 54 55 . - . gene_id "G0003"; transcript_id "G0003T004"; ccds_id "CDS_G0003T004"; +chr1 gtftk gene 56 76 . + . gene_id "G0004"; +chr1 gtftk transcript 65 76 . + . gene_id "G0004"; transcript_id "G0004T001"; +chr1 gtftk exon 65 68 . + . gene_id "G0004"; transcript_id "G0004T001"; exon_id "G0004T001E001"; +chr1 gtftk CDS 65 67 . + . gene_id "G0004"; transcript_id "G0004T001"; ccds_id "CDS_G0004T001"; +chr1 gtftk exon 71 71 . + . gene_id "G0004"; transcript_id "G0004T001"; exon_id "G0004T001E002"; +chr1 gtftk exon 74 76 . + . gene_id "G0004"; transcript_id "G0004T001"; exon_id "G0004T001E003"; +chr1 gtftk transcript 66 76 . + . gene_id "G0004"; transcript_id "G0004T002"; +chr1 gtftk exon 66 68 . + . gene_id "G0004"; transcript_id "G0004T002"; exon_id "G0004T002E001"; +chr1 gtftk exon 71 71 . + . gene_id "G0004"; transcript_id "G0004T002"; exon_id "G0004T002E002"; +chr1 gtftk exon 74 76 . + . gene_id "G0004"; transcript_id "G0004T002"; exon_id "G0004T002E003"; +chr1 gtftk CDS 66 68 . + . gene_id "G0004"; transcript_id "G0004T002"; ccds_id "CDS_G0004T002"; +chr1 gtftk CDS 71 71 . + . gene_id "G0004"; transcript_id "G0004T002"; ccds_id "CDS_G0004T002"; +chr1 gtftk CDS 74 75 . + . gene_id "G0004"; transcript_id "G0004T002"; ccds_id "CDS_G0004T002"; +chr1 gtftk transcript 68 76 . + . gene_id "G0004"; transcript_id "G0004T003"; +chr1 gtftk exon 68 68 . + . gene_id "G0004"; transcript_id "G0004T003"; exon_id "G0004T003E001"; +chr1 gtftk CDS 68 67 . + . gene_id "G0004"; transcript_id "G0004T003"; ccds_id "CDS_G0004T003"; +chr1 gtftk exon 71 71 . + . gene_id "G0004"; transcript_id "G0004T003"; exon_id "G0004T003E002"; +chr1 gtftk exon 74 76 . + . gene_id "G0004"; transcript_id "G0004T003"; exon_id "G0004T003E003"; +chr1 gtftk transcript 56 76 . + . gene_id "G0004"; transcript_id "G0004T004"; +chr1 gtftk exon 56 68 . + . gene_id "G0004"; transcript_id "G0004T004"; exon_id "G0004T004E001"; +chr1 gtftk CDS 56 67 . + . gene_id "G0004"; transcript_id "G0004T004"; ccds_id "CDS_G0004T004"; +chr1 gtftk exon 71 71 . + . gene_id "G0004"; transcript_id "G0004T004"; exon_id "G0004T004E002"; +chr1 gtftk exon 74 76 . + . gene_id "G0004"; transcript_id "G0004T004"; exon_id "G0004T004E003"; +chr1 gtftk gene 33 47 . - . gene_id "G0005"; +chr1 gtftk transcript 33 47 . - . gene_id "G0005"; transcript_id "G0005T001"; +chr1 gtftk exon 33 35 . - . gene_id "G0005"; transcript_id "G0005T001"; exon_id "G0005T001E001"; +chr1 gtftk exon 42 47 . - . gene_id "G0005"; transcript_id "G0005T001"; exon_id "G0005T001E002"; +chr1 gtftk CDS 43 45 . - . gene_id "G0005"; transcript_id "G0005T001"; ccds_id "CDS_G0005T001"; +chr1 gtftk gene 22 35 . - . gene_id "G0006"; +chr1 gtftk transcript 22 35 . - . gene_id "G0006"; transcript_id "G0006T001"; +chr1 gtftk exon 22 25 . - . gene_id "G0006"; transcript_id "G0006T001"; exon_id "G0006T001E001"; +chr1 gtftk exon 28 30 . - . gene_id "G0006"; transcript_id "G0006T001"; exon_id "G0006T001E002"; +chr1 gtftk exon 33 35 . - . gene_id "G0006"; transcript_id "G0006T001"; exon_id "G0006T001E003"; +chr1 gtftk CDS 22 25 . - . gene_id "G0006"; transcript_id "G0006T001"; ccds_id "CDS_G0006T001"; +chr1 gtftk CDS 28 30 . - . gene_id "G0006"; transcript_id "G0006T001"; ccds_id "CDS_G0006T001"; +chr1 gtftk CDS 33 34 . - . gene_id "G0006"; transcript_id "G0006T001"; ccds_id "CDS_G0006T001"; +chr1 gtftk transcript 28 35 . - . gene_id "G0006"; transcript_id "G0006T002"; +chr1 gtftk exon 28 30 . - . gene_id "G0006"; transcript_id "G0006T002"; exon_id "G0006T002E001"; +chr1 gtftk exon 33 35 . - . gene_id "G0006"; transcript_id "G0006T002"; exon_id "G0006T002E002"; +chr1 gtftk CDS 29 30 . - . gene_id "G0006"; transcript_id "G0006T002"; ccds_id "CDS_G0006T002"; +chr1 gtftk CDS 33 33 . - . gene_id "G0006"; transcript_id "G0006T002"; ccds_id "CDS_G0006T002"; +chr1 gtftk gene 107 116 . + . gene_id "G0007"; +chr1 gtftk transcript 107 116 . + . gene_id "G0007"; transcript_id "G0007T001"; +chr1 gtftk exon 107 116 . + . gene_id "G0007"; transcript_id "G0007T001"; exon_id "G0007T001E001"; +chr1 gtftk CDS 112 114 . + . gene_id "G0007"; transcript_id "G0007T001"; ccds_id "CDS_G0007T001"; +chr1 gtftk transcript 107 116 . + . gene_id "G0007"; transcript_id "G0007T002"; +chr1 gtftk exon 107 116 . + . gene_id "G0007"; transcript_id "G0007T002"; exon_id "G0007T002E001"; +chr1 gtftk CDS 110 115 . + . gene_id "G0007"; transcript_id "G0007T002"; ccds_id "CDS_G0007T002"; +chr1 gtftk gene 210 233 . - . gene_id "G0008"; +chr1 gtftk transcript 210 222 . - . gene_id "G0008"; transcript_id "G0008T001"; +chr1 gtftk exon 210 214 . - . gene_id "G0008"; transcript_id "G0008T001"; exon_id "G0008T001E001"; +chr1 gtftk exon 220 222 . - . gene_id "G0008"; transcript_id "G0008T001"; exon_id "G0008T001E002"; +chr1 gtftk CDS 211 213 . - . gene_id "G0008"; transcript_id "G0008T001"; ccds_id "CDS_G0008T001"; +chr1 gtftk transcript 222 233 . + . gene_id "G0008"; transcript_id "G0008T002"; +chr1 gtftk exon 222 226 . + . gene_id "G0008"; transcript_id "G0008T002"; exon_id "G0008T002E001"; +chr1 gtftk exon 228 233 . + . gene_id "G0008"; transcript_id "G0008T002"; exon_id "G0008T002E002"; +chr1 gtftk CDS 222 223 . + . gene_id "G0008"; transcript_id "G0008T002"; ccds_id "CDS_G0008T002"; +chr1 gtftk gene 3 14 . - . gene_id "G0009"; +chr1 gtftk transcript 3 14 . - . gene_id "G0009"; transcript_id "G0009T002"; +chr1 gtftk exon 3 14 . - . gene_id "G0009"; transcript_id "G0009T002"; exon_id "G0009T002E001"; +chr1 gtftk CDS 5 10 . - . gene_id "G0009"; transcript_id "G0009T002"; ccds_id "CDS_G0009T002"; +chr1 gtftk transcript 3 14 . + . gene_id "G0009"; transcript_id "G0009T001"; +chr1 gtftk exon 3 14 . + . gene_id "G0009"; transcript_id "G0009T001"; exon_id "G0009T001E001"; +chr1 gtftk CDS 3 8 . + . gene_id "G0009"; transcript_id "G0009T001"; ccds_id "CDS_G0009T001"; +chr1 gtftk gene 176 186 . + . gene_id "G0010"; +chr1 gtftk transcript 176 186 . + . gene_id "G0010"; transcript_id "G0010T001"; +chr1 gtftk exon 176 186 . + . gene_id "G0010"; transcript_id "G0010T001"; exon_id "G0010T001E001"; +chr1 gtftk CDS 184 186 . + . gene_id "G0010"; transcript_id "G0010T001"; ccds_id "CDS_G0010T001"; diff --git a/pygtftk/fasta_interface.py b/pygtftk/fasta_interface.py index 81cd8621..80c3a11b 100644 --- a/pygtftk/fasta_interface.py +++ b/pygtftk/fasta_interface.py @@ -8,7 +8,6 @@ from builtins import object from builtins import range from builtins import str -from collections import OrderedDict from Bio.Alphabet import IUPAC from Bio.Seq import Seq @@ -16,29 +15,18 @@ from cffi import FFI from pygtftk.Line import FastaSequence -from pygtftk.utils import GTFtkError -from pygtftk.utils import PY3 ffi = FFI() + # --------------------------------------------------------------- -# Python2/3 compatibility +# Function def # --------------------------------------------------------------- -try: - basestring -except NameError: - basestring = str - -if PY3: - from io import IOBase - - file = IOBase +def native_str(x): + return bytes(x.encode()) -if PY3: - def native_str(x): - return bytes(x.encode()) # --------------------------------------------------------------- # The FASTA class @@ -64,11 +52,9 @@ def __init__(self, fn, ptr, intron, rev_comp): >>> # The __init__ example is provided as doctest >>> # Please use get_sequences method from the GTF object. - >>> from future.utils import native_str >>> from pygtftk.fasta_interface import FASTA >>> from pygtftk.gtf_interface import GTF - >>> from pygtftk.utils import PY3 - >>> if PY3: native_str=lambda x:bytes(x.encode()) + >>> native_str=lambda x:bytes(x.encode()) >>> from pygtftk.utils import get_example_file >>> a_file = get_example_file("simple", "gtf")[0] >>> a_gtf = GTF(a_file) @@ -171,8 +157,11 @@ def transcript_as_bioseq_records(self): yield record + """ + This should be rewritten carefully. + def iter_features(self, feat="exon", no_feat_name=False): - """Iterate over features. + Iterate over features. :param feat: The feature type (exon, CDS). :param no_feat_name: Don't write the feature type in the header. @@ -200,7 +189,7 @@ def iter_features(self, feat="exon", no_feat_name=False): >>> assert [rec.sequence for rec in a_list if rec.transcript_id == 'G0008T001'] == ['agcgc', 'atg'] >>> assert [rec.sequence for rec in a_list if rec.transcript_id == 'G0004T001'] == ['atct', 'g', 'gcg'] - """ + if not self.intron: GTFtkError("Can't iter_features() if self.intron is False.") @@ -238,7 +227,7 @@ def iter_features(self, feat="exon", no_feat_name=False): yield fs def enumerate(self, type="any", add_feature=False): - """Iterate transcript wise and return tx_id and a list of exons""" + Iterate transcript wise and return tx_id and a list of exons for i in range(self._data.nb): tx = self._data.sequence[i] tx_seq = tx.sequence @@ -258,7 +247,7 @@ def enumerate(self, type="any", add_feature=False): yield tx.header, seq_list def as_dict(self, feat="exon"): - """Iterate feature wise + Iterate feature wise :param feat: The feature type (exon, CDS). @@ -284,7 +273,7 @@ def as_dict(self, feat="exon"): >>> assert a_dict[('G0004', 'G0004T002', 'chr1', 74, 75, '+', 'CDS')] == 'gc' >>> assert a_dict[('G0006', 'G0006T001', 'chr1', 22, 25, '-', 'CDS')] == 'acat' >>> assert a_dict[('G0006', 'G0006T001', 'chr1', 28, 30, '-', 'CDS')] == 'att' - """ + d_out = OrderedDict() @@ -330,6 +319,7 @@ def as_dict(self, feat="exon"): b.strand.decode(), name)] = seq[s:e + 1] return d_out + """ def __getitem__(self, x=None): if 0 <= x < self._data.nb: diff --git a/pygtftk/gtf_interface.py b/pygtftk/gtf_interface.py index 1679869d..e7a14575 100644 --- a/pygtftk/gtf_interface.py +++ b/pygtftk/gtf_interface.py @@ -15,6 +15,7 @@ import gc import glob +import io import os import re import sys @@ -27,7 +28,6 @@ from collections import defaultdict from cffi import FFI -from future.utils import native_str from pybedtools.bedtool import BedTool from pyparsing import CaselessLiteral from pyparsing import Combine @@ -47,7 +47,6 @@ from pygtftk.fasta_interface import FASTA from pygtftk.tab_interface import TAB from pygtftk.utils import GTFtkError -from pygtftk.utils import PY3 from pygtftk.utils import check_file_or_dir_exists from pygtftk.utils import chomp from pygtftk.utils import chrom_info_to_bed_file @@ -55,24 +54,15 @@ from pygtftk.utils import make_tmp_file from pygtftk.utils import message + # --------------------------------------------------------------- -# Python2/3 compatibility +# Function definition # --------------------------------------------------------------- -try: - basestring -except NameError: - basestring = str - -if PY3: - from io import IOBase - - file = IOBase +def native_str(x): + return bytes(x.encode()) -if PY3: - def native_str(x): - return bytes(x.encode()) # --------------------------------------------------------------- # find module path @@ -435,7 +425,7 @@ def __init__( if isinstance(input_obj, list): input_obj = input_obj[0] - if isinstance(input_obj, file): + if isinstance(input_obj, io.IOBase): if input_obj.name != '': self.fn = input_obj.name @@ -443,7 +433,7 @@ def __init__( self.fn = "-" self._data = 0 - elif isinstance(input_obj, basestring): + elif isinstance(input_obj, str): if input_obj == '-': self.fn = "-" @@ -495,7 +485,7 @@ def __init__( else: self._data = new_data - self._message("GTF created ", type="DEBUG_MEM") + self.message("GTF created ", type="DEBUG_MEM") self._ptr_addr += [id(self._data)] # --------------------------------------------------------------- @@ -575,7 +565,7 @@ def merge_attr(self, feat="*", keys="gene_id,transcript_id", return self._clone(new_data) - def _message(self, msg="", type='DEBUG'): + def message(self, msg="", type='DEBUG'): """A processing message whose verbosity is adapted based on pygtftk.utils.VERBOSITY. >>> import pygtftk.utils @@ -585,9 +575,9 @@ def _message(self, msg="", type='DEBUG'): >>> a_gtf = GTF(a_file) >>> pygtftk.utils.VERBOSITY = 0 >>> pygtftk.utils.VERBOSITY = 2 - >>> a_gtf._message('bla') + >>> a_gtf.message('bla') >>> pygtftk.utils.VERBOSITY = 3 - >>> a_gtf._message('bla') + >>> a_gtf.message('bla') >>> pygtftk.utils.VERBOSITY = 0 """ @@ -598,7 +588,7 @@ def _message(self, msg="", type='DEBUG'): if pygtftk.utils.VERBOSITY >= 3: msg = msg + \ - "(#l={a}, p={c}, f={b}, i={d}, n={e})." + " (#l={a}, p={c}, f={b}, i={d}, n={e})." msg = msg.format(a=self._data.size, b=self.fn, c=addr, @@ -630,14 +620,14 @@ def __del__(self): if self._data != 0: if gc.isenabled(): self._dll.free_gtf_data(self._data) - self._message("GTF deleted ", type="DEBUG_MEM") + self.message("GTF deleted ", type="DEBUG_MEM") self._data = 0 def head(self, nb=6, returned=False): """ Print the nb first lines of the GTF object. - :param n: The number of line to display. + :param nb: The number of line to display. :param returned: If True, don't print but returns the message. """ @@ -677,7 +667,7 @@ def tail(self, nb=6): """ Print the nb last lines of the GTF object. - :param n: The number of line to display. + :param nb: The number of line to display. """ nb_rec = len(self) @@ -802,7 +792,7 @@ def __getitem__(self, x=None): """ - self._message("Subsetting GTF instance") + self.message("Subsetting GTF instance") if isinstance(x, tuple): if not len(x): @@ -959,7 +949,7 @@ def extract_data(self, raise GTFtkError(msg) if not isinstance(keys, list): - if isinstance(keys, basestring): + if isinstance(keys, str): keys = keys.split(",") else: raise GTFtkError("Please provide a key as str or list.") @@ -1203,8 +1193,6 @@ def extract_data_iter_list(self, keys=None, zero_based=False, nr=False): else: nr = 0 - key_list = keys.split(",") - message("Calling extract_data_iter.", type="DEBUG") if not isinstance(keys, list): @@ -1444,10 +1432,10 @@ def select_by_key(self, key=None, else: - if not isinstance(key, basestring): + if not isinstance(key, str): raise GTFtkError("Key should be a string") - if not isinstance(value, basestring): + if not isinstance(value, str): raise GTFtkError("Value should be a unicode string") new_data = self._dll.select_by_key(self._data, @@ -1601,18 +1589,21 @@ def select_by_loc(self, chr_str, start_str, end_str): if isinstance(start_str, list): start_str = [str(x) for x in start_str] start_str = ",".join(start_str) + elif isinstance(start_str, int): start_str = str(start_str) if isinstance(end_str, list): end_str = [str(x) for x in end_str] end_str = ",".join(end_str) + elif isinstance(end_str, int): end_str = str(end_str) chr_list = chr_str.split(",") start_list = start_str.split(",") start_list = [int(x) for x in start_list] + end_list = end_str.split(",") end_list = [int(x) for x in end_list] @@ -1626,6 +1617,7 @@ def select_by_loc(self, chr_str, start_str, end_str): msg = "Calling select_by_loc ({n} locations)." msg = msg.format(n=nb_loc) message(msg, type="DEBUG") + # GTF_DATA *gtf_data, int nb_loc, char **chr, int *begin_gl, int # *end_gl new_data = self._dll.select_by_genomic_location(self._data, @@ -1657,16 +1649,13 @@ def select_by_max_exon_nb(self): info = self.extract_data("gene_id,transcript_id", as_list_of_list=True, - nr=True, - no_na=True, hide_undef=True) + nr=True, no_na=True, hide_undef=True) gene_to_tx_max_exon = OrderedDict() for i in info: gene_id, tx_id = i - gene_id = gene_id - tx_id = tx_id if gene_id in gene_to_tx_max_exon: if nb_exons[tx_id] > nb_exons[gene_to_tx_max_exon[gene_id]]: @@ -1712,7 +1701,7 @@ def select_by_number_of_exons(self, min=0, max=None): def select_by_numeric_value(self, bool_exp=None, - na_omit=[".", "?"]): + na_omit=(".", "?")): """Test a numeric value. Select lines using a boolean operation on attributes. The boolean expression must contain attributes enclosed with braces. Example: "cDNA_length > 200 and tx_genomic_length > 2000". @@ -1720,7 +1709,7 @@ def select_by_numeric_value(self, start, end, score or frame. :param bool_exp: A simple boolean operation. And/or operation are not supported at the moment. - :param na_omit: Any line for which one of the tested value is in this list wont be evaluated (e.g. [".", "?"]). + :param na_omit: Any line for which one of the tested value is in this list wont be evaluated (e.g. (".", "?")). :Example: @@ -1729,7 +1718,7 @@ def select_by_numeric_value(self, >>> from pygtftk.gtf_interface import GTF >>> a_file = get_example_file()[0] >>> a_gtf = GTF(a_file) - >>> b_gtf = a_gtf.add_attr_from_list(feat="transcript", key="transcript_id", key_value=["G0001T001","G0002T001","G0003T001","G0004T001"], new_key="test", new_key_value=["10","11","20","40"]) + >>> b_gtf = a_gtf.add_attr_from_list(feat="transcript", key="transcript_id", key_value=("G0001T001","G0002T001","G0003T001","G0004T001"), new_key="test", new_key_value=("10","11","20","40")) >>> c_list = b_gtf.select_by_key("feature","transcript").select_by_numeric_value("test > 2").extract_data("test", as_list=True) >>> assert c_list == ['10', '11', '20', '40'] >>> a_file = get_example_file(datasetname="mini_real", ext="gtf.gz")[0] @@ -1744,12 +1733,17 @@ def select_by_numeric_value(self, >>> assert len(a_gtf.select_by_numeric_value("phase > 0 and phase < 2", na_omit=".").extract_data('phase', as_list=True, nr=True)) == 1 """ - if na_omit is not None: - if not isinstance(na_omit, list): - na_omit = na_omit.split(",") + if isinstance(na_omit, str): + na_omit = tuple(na_omit.split(",")) + if isinstance(na_omit, list): + na_omit = tuple(na_omit) + elif na_omit is None: + na_omit = () - def _find_keys(pr, the_key='key', res=[], visited=0): + def _find_keys(pr, the_key='key', res=None, visited=0): """Should be called like that: _find_keys(pr, res=[]).""" + if res is None: + res = [] if isinstance(pr, ParseResults): if visited == 0: if pr.haskeys(): @@ -1822,29 +1816,17 @@ def _embed(s, l, t): result = [] pos = 0 - if na_omit is None: - for i in tab: - + for i in tab: + if not any([True if x in na_omit else False for x in i]): try: [float(x) for x in i] if eval(parsed_exp_str): result += [pos] except: - msg = "Found non numeric values in: '%s'. Use -n/a_omit." % ",".join(i) + msg = "Found non numeric values in: '%s'." % ",".join( + i) GTFtkError(msg) - pos += 1 - else: - for i in tab: - if not any([True if x in na_omit else False for x in i]): - try: - [float(x) for x in i] - if eval(parsed_exp_str): - result += [pos] - except: - msg = "Found non numeric values in: '%s'." % ",".join( - i) - GTFtkError(msg) - pos += 1 + pos += 1 # Call C function if len(result) < 1: @@ -1999,7 +1981,7 @@ def add_attr_from_file(self, if inputfile is None: raise GTFtkError("Need an input/join file.") - if isinstance(inputfile, basestring): + if isinstance(inputfile, str): inputfile = open(inputfile) message("Reading file to join.", type="DEBUG") @@ -2053,8 +2035,8 @@ def add_attr_from_matrix_file(self, inputfile=None): """Add key/value pairs to the GTF file. Expect a matrix with row names as target keys column names as novel key and each cell as value. - :param feat: The comma separated list of target feature. If None, all the features. - :param key: The name of the key used for joining (i.e the key corresponding to value provided in the file). + :param feat: The comma separated list of target features. If None, all the features. + :param key: The name of the key to use for joining (i.e the key corresponding to value provided in the file). :param inputfile: A two column (e.g transcript_id and new value) file. :Example: @@ -2078,7 +2060,7 @@ def add_attr_from_matrix_file(self, if inputfile is None: raise GTFtkError("Need an input/join file.") - if isinstance(inputfile, file): + if isinstance(inputfile, io.IOBase): inputfile = inputfile.name id_to_val = defaultdict(lambda: defaultdict(list)) @@ -2137,13 +2119,13 @@ def add_attr_from_matrix_file(self, def add_attr_from_list(self, feat=None, key="transcript_id", - key_value=[], + key_value=(), new_key="new_key", - new_key_value=[]): + new_key_value=()): """Add key/value pairs to the GTF object. - :param feat: The comma separated list of target feature. If None, all the features. - :param key: The name of the key used for joining (e.g 'transcript_id'). + :param feat: The comma separated list of target features. If None, all the features. + :param key: The name of the key to use for joining (e.g 'transcript_id'). :param key_value: The values for the key (e.g ['tx_1', 'tx_2',...,'tx_n']) :param new_key: A name for the novel key. :param new_key_value: A name for the novel key (e.g ['val_tx_1', 'val_tx_2',...,'val_tx_n']). @@ -2155,19 +2137,18 @@ def add_attr_from_list(self, >>> from pygtftk.utils import TAB >>> a_file = get_example_file()[0] >>> a_gtf = GTF(a_file) - >>> b_gtf = a_gtf.add_attr_from_list(feat="gene", key="gene_id", key_value=["G0001", "G0002"], new_key="coding_pot", new_key_value=["0.5", "0.8"]) + >>> b_gtf = a_gtf.add_attr_from_list(feat="gene", key="gene_id", key_value=("G0001", "G0002"), new_key="coding_pot", new_key_value=("0.5", "0.8")) >>> assert b_gtf.extract_data(keys="coding_pot", as_list=True, no_na=True, hide_undef=True) == ['0.5', '0.8'] - >>> b_gtf = a_gtf.add_attr_from_list(feat="gene", key="gene_id", key_value=["G0002", "G0001"], new_key="coding_pot", new_key_value=["0.8", "0.5"]) + >>> b_gtf = a_gtf.add_attr_from_list(feat="gene", key="gene_id", key_value=("G0002", "G0001"), new_key="coding_pot", new_key_value=("0.8", "0.5")) >>> assert b_gtf.extract_data(keys="coding_pot", as_list=True, no_na=True, hide_undef=True) == ['0.5', '0.8'] - >>> key_value = a_gtf.extract_data("transcript_id", no_na=True, as_list=True, nr=True) - >>> b=a_gtf.add_attr_from_list(None, key="transcript_id", key_value=key_value, new_key="bla", new_key_value=[str(x) for x in range(len(key_value))]) + >>> key_value = tuple(a_gtf.extract_data("transcript_id", no_na=True, as_list=True, nr=True)) + >>> b=a_gtf.add_attr_from_list(None, key="transcript_id", key_value=key_value, new_key="bla", new_key_value=tuple([str(x) for x in range(len(key_value))])) """ message("Calling add_attr_from_list", type="DEBUG") - if not isinstance(key_value, list) or not isinstance( - new_key_value, list): - raise GTFtkError("key_value and new_key_value should be lists.") + if not isinstance(key_value, tuple) or not isinstance(new_key_value, tuple): + raise GTFtkError("key_value and new_key_value should be tuple.") if feat is None: feat = ",".join(self.get_feature_list(nr=True)) @@ -2406,7 +2387,7 @@ def write(self, output, add_chr=0, gc_off=False): message("Garbage collector has been disabled.", type="DEBUG") gc.disable() - self._message("Writing a GTF ") + self.message("Writing a GTF ") if pygtftk.utils.ADD_CHR == 1: add_chr = 1 @@ -2414,7 +2395,7 @@ def write(self, output, add_chr=0, gc_off=False): if isinstance(output, list): output = output[0] - if isinstance(output, basestring): + if isinstance(output, str): if output == "-": output_str = "-" else: @@ -2425,7 +2406,7 @@ def write(self, output, add_chr=0, gc_off=False): raise GTFtkError("Unable to open file %s" % output) output_str = output.name - elif isinstance(output, file): + elif isinstance(output, io.IOBase): if output.name != '': output.close() output_str = output.name @@ -2449,7 +2430,7 @@ def write(self, output, add_chr=0, gc_off=False): if output_str != "-": output.close() - self._message("GTF written ") + self.message("GTF written ") def get_sequences(self, genome=None, intron=False, rev_comp=True): """ @@ -2517,13 +2498,13 @@ def get_sequences(self, genome=None, intron=False, rev_comp=True): return None def to_bed(self, - name=["gene_id"], + name=("gene_id"), sep="|", add_feature_type=False, - more_name=[]): + more_name=None): """Returns a Bedtool object (Bed6 format). - :param name: The keys that should be used to computed the 'name' column. + :param name: The keys that should be used to computed the 'name' column (a tuple). :param more_name: Additional text to add to the name (a list). :param sep: The separator used for the name (e.g 'gene_id|transcript_id". :param add_feature_type: Add the feature type to the name. @@ -2538,13 +2519,22 @@ def to_bed(self, >>> assert a_bo.field_count() == 6 >>> assert len(a_bo) == 15 >>> for i in a_bo: pass - >>> a_bo = a_gtf.select_by_key("feature", "transcript").to_bed(name=['gene_id', 'transcript_id']) + >>> a_bo = a_gtf.select_by_key("feature", "transcript").to_bed(name=('gene_id', 'transcript_id')) >>> for i in a_bo: pass - >>> a_bo = a_gtf.select_by_key("feature", "transcript").to_bed(name=['gene_id', 'transcript_id'], sep="--") + >>> a_bo = a_gtf.select_by_key("feature", "transcript").to_bed(name=('gene_id', 'transcript_id'), sep="--") >>> for i in a_bo: pass """ + name = list(name) + + if more_name is None: + more_name = [] + elif isinstance(more_name, str): + more_name = list(more_name) + elif isinstance(more_name, tuple): + more_name = list(more_name) + message("Calling 'to_bed' method.", type="DEBUG") tx_bed = make_tmp_file("to_bed", ".bed") @@ -2578,10 +2568,10 @@ def to_bed(self, def get_5p_end(self, feat_type="transcript", - name=["transcript_id"], + name=("transcript_id"), sep="|", as_dict=False, - more_name=[], + more_name=(), one_based=False, feature_name=None, explicit=False): @@ -2591,7 +2581,7 @@ def get_5p_end(self, :param feat_type: The feature type. :param name: The key that should be used to computed the 'name' column. :param sep: The separator used for the name (e.g 'gene_id|transcript_id". - :param more_name: Additional text to add to the name (a list). + :param more_name: Additional text to add to the name (a tuple). :param as_dict: return the result as a dictionnary. :param one_based: if as_dict is requested, return coordinates in on-based format. :param feature_name: A feature name to be added to the 4th column. @@ -2614,6 +2604,19 @@ def get_5p_end(self, >>> assert i.name == 'transcript_id=G0001T002|gene_id=G0001' """ + if isinstance(name, tuple): + name = list(name) + elif isinstance(name, str): + name = [name] + + if isinstance(more_name, tuple): + more_name = list(more_name) + elif isinstance(more_name, str): + more_name = more_name.split(',') + + if feature_name is None: + feature_name = [] + message("Calling 'get_5p_end'.", type="DEBUG") tx_bed = make_tmp_file("TSS", ".bed") @@ -2624,12 +2627,8 @@ def get_5p_end(self, name_out = [] - if feature_name is None: - value_name = name_list + more_name - key_name = name + ["more_name"] - else: - value_name = name_list + more_name + [feature_name] - key_name = name + ["more_name"] + ["feature_name"] + value_name = name_list + more_name + feature_name + key_name = name + ['more_name'] + ['feature_name'] if explicit: for k, v in zip(key_name, value_name): @@ -2660,10 +2659,10 @@ def get_5p_end(self, return bed_obj def get_tss(self, - name=["transcript_id"], + name=("transcript_id"), sep="|", as_dict=False, - more_name=[], + more_name=(), one_based=False, feature_name=None, explicit=False): @@ -2671,7 +2670,7 @@ def get_tss(self, (zero-based coordinate). :param name: The key that should be used to computed the 'name' column. - :param more_name: Additional text to add to the name (a list). + :param more_name: Additional text to add to the name (a tuple). :param sep: The separator used for the name (e.g 'gene_id|transcript_id". :param as_dict: return the result as a dictionnary. :param one_based: if as_dict is requested, return coordinates in on-based format. @@ -2689,6 +2688,12 @@ def get_tss(self, """ + if isinstance(more_name, tuple): + more_name = list(more_name) + + if isinstance(name, tuple): + name = list(name) + return (self.get_5p_end(feat_type="transcript", name=name, more_name=more_name, @@ -2700,10 +2705,10 @@ def get_tss(self, def get_3p_end(self, feat_type="transcript", - name=["transcript_id"], + name=("transcript_id"), sep="|", as_dict=False, - more_name=[], + more_name=(), feature_name=None, explicit=False): """Returns a Bedtool object containing the 3' coordinates of selected @@ -2731,8 +2736,25 @@ def get_3p_end(self, >>> for i in a_bed: break >>> assert i.name == 'gene_id=G0001|exon_id=G0001T002E001' """ + message("Calling 'get_3p_end'.", type="DEBUG") + if isinstance(name, tuple): + name = list(name) + elif isinstance(name, str): + name = [name] + + if isinstance(more_name, tuple): + more_name = list(more_name) + elif isinstance(more_name, str): + more_name = more_name.split(',') + + if feature_name is None: + feature_name = [] + + if isinstance(name, tuple): + name = list(name) + tx_bed = make_tmp_file("TTS", ".bed") for i in self.select_by_key("feature", feat_type): @@ -2740,12 +2762,8 @@ def get_3p_end(self, upon_none='set_na') name_out = [] - if feature_name is None: - value_name = name_list + more_name - key_name = name + ["more_name"] - else: - value_name = name_list + more_name + [feature_name] - key_name = name + ["more_name"] + ["feature_name"] + value_name = name_list + more_name + feature_name + key_name = name + more_name + feature_name if explicit: for k, v in zip(key_name, value_name): @@ -2772,10 +2790,10 @@ def get_3p_end(self, return bed_obj def get_tts(self, - name=["transcript_id"], + name=("transcript_id"), sep="|", as_dict=False, - more_name=[], + more_name=(), feature_name=None, explicit=False ): @@ -2799,6 +2817,13 @@ def get_tts(self, >>> assert len(a_bed) == 15 """ + + if isinstance(more_name, tuple): + more_name = list(more_name) + + if isinstance(name, tuple): + name = list(name) + return (self.get_3p_end(feat_type="transcript", name=name, sep=sep, @@ -2915,7 +2940,7 @@ def get_intergenic(self, message("Calling 'get_intergenic'.", type="DEBUG") - if not isinstance(chrom_file, file): + if not isinstance(chrom_file, io.IOBase): raise GTFtkError('chrom_file should be a file object.') if not os.path.exists(chrom_file.name): @@ -2956,7 +2981,7 @@ def get_intergenic(self, def get_introns(self, by_transcript=False, - name=['transcript_id', 'gene_id'], + name=('transcript_id', 'gene_id'), sep='|', intron_nb_in_name=False, feat_name=False, @@ -2981,6 +3006,9 @@ def get_introns(self, """ + if isinstance(name, tuple): + name = list(name) + message("Calling 'get_intron'.", type="DEBUG") if not by_transcript: @@ -3076,7 +3104,7 @@ def get_introns(self, return introns_bo def get_midpoints(self, - name=["transcript_id", "gene_id"], + name=("transcript_id", "gene_id"), sep="|"): """Returns a bedtools object containing the midpoints of features. @@ -3094,6 +3122,9 @@ def get_midpoints(self, """ + if isinstance(name, tuple): + name = list(name) + message("Calling 'get_midpoints'.", type="DEBUG") midpoints_bed = make_tmp_file("Midpoints", ".bed") @@ -3229,7 +3260,6 @@ def get_feature_list(self, nr=False): >>> assert len(a_feat) == 4 >>> a_feat = a_gtf.get_feature_list(nr=False) >>> assert len(a_feat) == 70 - """ message("Calling 'get_feature_list'.", type="DEBUG") @@ -3350,7 +3380,7 @@ def add_attr_column(self, input_file=None, new_key="new_key"): >>> assert [int(x) for x in a_list] == list(range(70)) """ - if isinstance(input_file, basestring): + if isinstance(input_file, str): input_file = open(input_file) if input_file.closed: @@ -3393,7 +3423,7 @@ def add_attr_to_pos(self, input_file=None, new_key="new_key"): >>> assert a_list[3] == 'CCC' """ - if isinstance(input_file, basestring): + if isinstance(input_file, str): input_file = open(input_file) if input_file.closed: @@ -3421,7 +3451,6 @@ def add_attr_to_pos(self, input_file=None, new_key="new_key"): if __name__ == "__main__": from pygtftk.utils import get_example_file - from pygtftk.gtf_interface import GTF a = get_example_file() gtf = GTF(a[0]) diff --git a/pygtftk/plugins/add_exon_nb.py b/pygtftk/plugins/add_exon_nb.py index 530e13fd..27450d38 100644 --- a/pygtftk/plugins/add_exon_nb.py +++ b/pygtftk/plugins/add_exon_nb.py @@ -5,7 +5,7 @@ import os import sys -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -27,15 +27,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser_grp.add_argument('-k', '--exon-numbering-key', help="The name of the key containing the exon numbering.", @@ -47,18 +45,15 @@ def make_parser(): def add_exon_nb(inputfile=None, outputfile=None, - exon_numbering_key=None, - tmp_dir=None, - logger_file=None, - verbosity=0): + exon_numbering_key=None): """Add the exon number to each exon (based on 5' to 3' orientation).""" message("Calling nb_exons.", type="DEBUG") - gtf = GTF(inputfile.name, - check_ensembl_format=False - ).add_exon_number(exon_numbering_key - ).write(outputfile, gc_off=True) + GTF(inputfile.name, + check_ensembl_format=False + ).add_exon_number(exon_numbering_key + ).write(outputfile, gc_off=True) close_properly(inputfile, outputfile) diff --git a/pygtftk/plugins/add_prefix.py b/pygtftk/plugins/add_prefix.py index 5091b451..f83ba216 100644 --- a/pygtftk/plugins/add_prefix.py +++ b/pygtftk/plugins/add_prefix.py @@ -69,10 +69,7 @@ def add_prefix(inputfile=None, key="transcript_id", text=None, target_feature="*", - suffix=False, - tmp_dir=None, - logger_file=None, - verbosity=None): + suffix=False): """ Add a prefix to target values. """ diff --git a/pygtftk/plugins/apropos.py b/pygtftk/plugins/apropos.py index e5d3e492..0d6291b7 100644 --- a/pygtftk/plugins/apropos.py +++ b/pygtftk/plugins/apropos.py @@ -34,10 +34,7 @@ def make_parser(): def apropos(keyword="", - notes=False, - tmp_dir=None, - logger_file=None, - verbosity=0): + notes=False): """ Search in all command description files those related to a user-defined keyword. """ diff --git a/pygtftk/plugins/bed_to_gtf.py b/pygtftk/plugins/bed_to_gtf.py index c133014a..dfbb34c9 100644 --- a/pygtftk/plugins/bed_to_gtf.py +++ b/pygtftk/plugins/bed_to_gtf.py @@ -6,12 +6,12 @@ import argparse import os import sys - from builtins import str + from pybedtools import BedTool import pygtftk.utils -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.utils import chomp from pygtftk.utils import close_properly @@ -37,17 +37,13 @@ def make_parser(): "behave as if it was a GTF.", default=sys.stdin, metavar="BED", - type=FileWithExtension('r', - valid_extensions=('\.[Bb][Ee][Dd]$', - '\.[Bb][Ee][Dd]3$', - '\.[Bb][Ee][Dd]6$'))) + type=arg_formatter.bed_rw('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser_grp.add_argument('-t', '--ft-type', help="The type of features you are trying to " @@ -68,10 +64,7 @@ def bed_to_gtf( inputfile=None, outputfile=None, ft_type="transcript", - source="Unknown", - tmp_dir=None, - logger_file=None, - verbosity=0): + source="Unknown"): """ Convert a bed file to a gtf. This will make the poor bed feel as if it was a nice gtf (but with lots of empty fields...). May be helpful sometimes... diff --git a/pygtftk/plugins/closest_genes.py b/pygtftk/plugins/closest_genes.py index 73c69a29..86d863c4 100644 --- a/pygtftk/plugins/closest_genes.py +++ b/pygtftk/plugins/closest_genes.py @@ -8,7 +8,7 @@ from _collections import defaultdict from builtins import zip -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -36,20 +36,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF/TXT", - type=FileWithExtension('w', - valid_extensions=('\.[Gg][Tt][Ff]$', - '\.[Tt][Xx][Tt]', - '\.[Cc][Ss][Vv]', - '\.[Tt][Aa][Bb]', - '\.[Tt][Ss][Vv]', - '\.[Cc][Oo][Vv]'))) + type=arg_formatter.gtf_or_txt_rw('w')) parser_grp.add_argument('-r', '--from-region-type', help="What is region to consider for each gene.", @@ -115,10 +108,7 @@ def closest_genes( diff_strandedness=False, text_format=False, identifier="gene_id", - collapse=False, - tmp_dir=None, - logger_file=None, - verbosity=0): + collapse=False): """ Find the n closest genes for each gene. """ @@ -196,10 +186,6 @@ def closest_genes( else: message("Unknown type.", type="ERROR") - strands = gn_gtf.extract_data(identifier + ",strand", - as_dict_of_values=True, - hide_undef=True) - # ---------------------------------------------------------------------- # Search closest genes # ---------------------------------------------------------------------- diff --git a/pygtftk/plugins/col_from_tab.py b/pygtftk/plugins/col_from_tab.py index cff4ba76..b2c399ca 100644 --- a/pygtftk/plugins/col_from_tab.py +++ b/pygtftk/plugins/col_from_tab.py @@ -7,7 +7,7 @@ import sys from builtins import range -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.utils import chomp from pygtftk.utils import message from pygtftk.utils import write_properly @@ -27,22 +27,14 @@ def make_parser(): parser_grp.add_argument('-i', '--inputfile', help="The tabulated file. Default to STDIN", default=sys.stdin, - metavar="GTF", - type=FileWithExtension('r', - valid_extensions=('\.[Tt][Xx][Tt]', - '\.[Cc][Ss][Vv]', - '\.[Tt][Aa][Bb]', - '\.[Tt][Ss][Vv]'))) + metavar="TXT", + type=arg_formatter.txt_rw('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="TXT", - type=FileWithExtension('w', - valid_extensions=('\.[Tt][Xx][Tt]', - '\.[Cc][Ss][Vv]', - '\.[Tt][Aa][Bb]', - '\.[Tt][Ss][Vv]'))) + type=arg_formatter.txt_rw('w')) parser_grp.add_argument('-c', '--columns', help="The list (csv) of column names.", @@ -78,10 +70,7 @@ def col_from_tab(inputfile=None, invert_match=False, no_header=False, unique=False, - separator=None, - tmp_dir=None, - logger_file=None, - verbosity=None): + separator=None): """Select columns from a tabulated file based on their names.""" line_set = dict() diff --git a/pygtftk/plugins/control_list.py b/pygtftk/plugins/control_list.py index aaa4d636..81177a89 100755 --- a/pygtftk/plugins/control_list.py +++ b/pygtftk/plugins/control_list.py @@ -21,9 +21,9 @@ theme, element_blank, theme_bw, scale_fill_manual, geom_violin) from plotnine import ggplot +from plotnine.exceptions import PlotnineError -from pygtftk.arg_formatter import FileWithExtension -from pygtftk.arg_formatter import int_greater_than_null +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.utils import chomp from pygtftk.utils import is_hex_color @@ -55,25 +55,16 @@ def make_parser(): metavar='TXT', help='A two columns tab-file. See notes.', default=None, - type=FileWithExtension('r', - valid_extensions=('\.[Tt][Xx][Tt]', - '\.[Cc][Ss][Vv]', - '\.[Tt][Aa][Bb]', - '\.[Tt][Ss][Vv]')), + type=arg_formatter.txt_rw('r'), required=True) - parser_grp.add_argument('--referenceGeneFile', '-r', + parser_grp.add_argument('--reference-gene-file', '-r', metavar='TXT', help='The file containing the reference gene list (1 column,' ' transcript ids).' ' No header.', default=None, - type=FileWithExtension('r', - valid_extensions=('\.[Tt][Xx][Tt]', - '\.[Cc][Ss][Vv]', - '\.[Tt][Aa][Bb]', - '\.[Tt][Ss][Vv]', - '\.[Ii][Dd][Ss]')), + type=arg_formatter.txt_rw('r'), required=True) parser_grp.add_argument('--out-dir', '-o', @@ -96,13 +87,19 @@ def make_parser(): parser_grp.add_argument('-pw', '--page-width', help='Output pdf file width (e.g. 7 inches).', - type=int_greater_than_null, + type=arg_formatter.ranged_num(lowest=0, + highest=None, + linc=False, + val_type='float'), default=None, required=False) parser_grp.add_argument('-ph', '--page-height', help='Output file height (e.g. 5 inches).', - type=int_greater_than_null, + type=arg_formatter.ranged_num(lowest=0, + highest=None, + linc=False, + val_type='float'), default=None, required=False) @@ -114,7 +111,10 @@ def make_parser(): parser_grp.add_argument('-dpi', '--dpi', help='Dpi to use.', - type=int_greater_than_null, + type=arg_formatter.ranged_num(lowest=0, + highest=None, + linc=False, + val_type='int'), default=300, required=False) @@ -150,7 +150,7 @@ def make_parser(): def control_list(in_file=None, out_dir=None, - referenceGeneFile=None, + reference_gene_file=None, log2=False, page_width=None, page_height=None, @@ -161,10 +161,7 @@ def control_list(in_file=None, dpi=300, rug=False, jitter=False, - skip_first=False, - tmp_dir=None, - logger_file=None, - verbosity=None): + skip_first=False): # ------------------------------------------------------------------------- # # Check in_file content @@ -251,7 +248,11 @@ def control_list(in_file=None, # # ------------------------------------------------------------------------- - reference_genes = pd.read_csv(referenceGeneFile.name, sep="\t", header=None) + try: + reference_genes = pd.read_csv(reference_gene_file.name, sep="\t", header=None) + except pd.errors.EmptyDataError: + message("No genes in --reference-gene-file.", type="ERROR") + reference_genes.rename(columns={reference_genes.columns.values[0]: 'gene'}, inplace=True) # ------------------------------------------------------------------------- @@ -413,7 +414,12 @@ def fxn(): fxn() message("Saving diagram to file : " + img_file.name) message("Be patient. This may be long for large datasets.") - p.save(filename=img_file.name, width=page_width, height=page_height, dpi=dpi, limitsize=False) + + try: + p.save(filename=img_file.name, width=page_width, height=page_height, dpi=dpi, limitsize=False) + except PlotnineError as err: + message("Plotnine message: " + err.message) + message("Plotnine encountered an error.", type="ERROR") # ------------------------------------------------------------------------- # diff --git a/pygtftk/plugins/convergent.py b/pygtftk/plugins/convergent.py index b8d50029..a56b4428 100644 --- a/pygtftk/plugins/convergent.py +++ b/pygtftk/plugins/convergent.py @@ -6,8 +6,8 @@ import sys from builtins import str -from pygtftk.arg_formatter import FileWithExtension -from pygtftk.arg_formatter import checkChromFile +from pygtftk import arg_formatter +from pygtftk.arg_formatter import CheckChromFile from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -38,15 +38,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('r')) parser_grp.add_argument('-c', '--chrom-info', help="Tabulated two-columns file. Chromosomes" @@ -54,7 +52,7 @@ def make_parser(): " column 2 ", default=None, metavar="CHROMINFO", - action=checkChromFile, + action=CheckChromFile, required=True) parser_grp.add_argument('-u', '--upstream', @@ -81,10 +79,7 @@ def convergent( outputfile=None, upstream=1500, downstream=1500, - chrom_info=None, - tmp_dir=None, - logger_file=None, - verbosity=0): + chrom_info=None): """ Find transcript with convergent tts. """ diff --git a/pygtftk/plugins/convert.py b/pygtftk/plugins/convert.py index 819f669a..b9ab6437 100644 --- a/pygtftk/plugins/convert.py +++ b/pygtftk/plugins/convert.py @@ -6,7 +6,7 @@ import sys from builtins import str -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -27,17 +27,13 @@ def make_parser(): default=sys.stdin, metavar="GTF", required=False, - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="BED/BED3/BED6", - type=FileWithExtension('w', - valid_extensions=('\.[Bb][Ee][Dd]$', - '\.[Bb][Ee][Dd]3$', - '\.[Bb][Ee][Dd]6$'))) + type=arg_formatter.bed_rw('w')) parser_grp.add_argument('-n', '--names', help="The key(s) that should be used as name.", @@ -71,10 +67,7 @@ def convert(inputfile=None, format="bed", names="gene_id,transcript_id", separator="|", - more_names='', - tmp_dir=None, - logger_file=None, - verbosity=0): + more_names=''): """ Convert a GTF to various format. """ diff --git a/pygtftk/plugins/convert_ensembl.py b/pygtftk/plugins/convert_ensembl.py index 94d88abe..35794d6d 100644 --- a/pygtftk/plugins/convert_ensembl.py +++ b/pygtftk/plugins/convert_ensembl.py @@ -5,7 +5,7 @@ import os import sys -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -39,15 +39,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser_grp.add_argument('-n', '--no-check-gene-chr', help="By default the command raise an error if several chromosomes are associated with the same gene_id. Disable this behaviour (but you should better think about what it means...).", @@ -56,21 +54,17 @@ def make_parser(): return parser -def convert_ensembl( - inputfile=None, - outputfile=None, - tmp_dir=None, - logger_file=None, - no_check_gene_chr=False, - verbosity=0): +def convert_ensembl(inputfile=None, + outputfile=None, + no_check_gene_chr=False): """ Convert the GTF file to ensembl format. """ - gtf = GTF(inputfile, - check_ensembl_format=False - ).convert_to_ensembl(check_gene_chr=not no_check_gene_chr, - ).write(outputfile, gc_off=True) + GTF(inputfile, + check_ensembl_format=False + ).convert_to_ensembl(check_gene_chr=not no_check_gene_chr, + ).write(outputfile, gc_off=True) close_properly(outputfile, inputfile) @@ -80,7 +74,7 @@ def main(): myparser = make_parser() args = myparser.parse_args() args = dict(args.__dict__) - count(**args) + convert_ensembl(**args) if __name__ == '__main__': diff --git a/pygtftk/plugins/count.py b/pygtftk/plugins/count.py index a12409e9..d525155f 100644 --- a/pygtftk/plugins/count.py +++ b/pygtftk/plugins/count.py @@ -7,7 +7,7 @@ from builtins import str from collections import OrderedDict -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -29,19 +29,13 @@ def make_parser(): default=sys.stdin, metavar="GTF", required=False, - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="TXT", - type=FileWithExtension('w', - valid_extensions=('\.[Tt][Xx][Tt]', - '\.[Cc][Ss][Vv]', - '\.[Tt][Aa][Bb]', - '\.[Tt][Ss][Vv]', - '\.[Cc][Oo][Vv]'))) + type=arg_formatter.txt_rw('w')) parser_grp.add_argument('-d', '--header', help="A comma-separated list of string to use as header.", @@ -64,10 +58,7 @@ def count( inputfile=None, outputfile=None, header=None, - additional_text=None, - tmp_dir=None, - logger_file=None, - verbosity=0): + additional_text=None): """ Count the number of features in the gtf file. """ diff --git a/pygtftk/plugins/count_key_values.py b/pygtftk/plugins/count_key_values.py index cac1e29a..837121f4 100644 --- a/pygtftk/plugins/count_key_values.py +++ b/pygtftk/plugins/count_key_values.py @@ -8,7 +8,7 @@ from builtins import zip from collections import defaultdict -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -36,19 +36,13 @@ def make_parser(): default=sys.stdin, metavar="GTF", required=False, - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="TXT", - type=FileWithExtension('w', - valid_extensions=('\.[Tt][Xx][Tt]', - '\.[Cc][Ss][Vv]', - '\.[Tt][Aa][Bb]', - '\.[Tt][Ss][Vv]', - '\.[Cc][Oo][Vv]'))) + type=arg_formatter.txt_rw('w')) parser_grp.add_argument('-k', '--keys', default="*", @@ -76,10 +70,7 @@ def count_key_values( outputfile=None, keys="gene_id,transcript_id", uniq=True, - tmp_dir=None, - additional_text=None, - logger_file=None, - verbosity=0): + additional_text=None): """ Count the number values for a set of keys. """ diff --git a/pygtftk/plugins/coverage.py b/pygtftk/plugins/coverage.py index 32508ac1..1b6cd114 100644 --- a/pygtftk/plugins/coverage.py +++ b/pygtftk/plugins/coverage.py @@ -10,8 +10,9 @@ import pandas as pd from pybedtools import BedTool -from pygtftk.arg_formatter import FileWithExtension -from pygtftk.arg_formatter import checkChromFile +import pygtftk +from pygtftk import arg_formatter +from pygtftk.arg_formatter import CheckChromFile from pygtftk.bwig.bw_coverage import bw_cov_mp from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF @@ -48,8 +49,7 @@ def make_parser(): parser_grp.add_argument( 'bw_list', help='A list of Bigwig file (last argument).', - type=FileWithExtension('r', valid_extensions=('\.[Bb][Ww]$', - '\.[Bb][Ii][Gg][Ww][Ii][Gg]$')), + type=arg_formatter.bw_rw('r'), nargs='+') parser_grp.add_argument('-i', '--inputfile', @@ -57,126 +57,104 @@ def make_parser(): default=sys.stdin, metavar="GTF/BED", required=False, - type=FileWithExtension('r', - valid_extensions=('\.[Gg][Tt][Ff](\.[Gg][Zz])?$', - '\.[Bb][Ee][Dd]$', - '\.[Bb][Ee][Dd]3$', - '\.[Bb][Ee][Dd]6$'))) + type=arg_formatter.gtf_or_bed_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="TXT", - type=FileWithExtension('w', - valid_extensions=('\.[Tt][Xx][Tt]', - '\.[Cc][Ss][Vv]', - '\.[Tt][Aa][Bb]', - '\.[Tt][Ss][Vv]', - '\.[Cc][Oo][Vv]'))) - parser_grp.add_argument( - '-c', '--chrom-info', - help="Tabulated two-columns file. Chromosomes" - " as column 1 and sizes as" - " column 2 ", - default=None, - metavar="CHROMINFO", - action=checkChromFile, - required=True) - - parser_grp.add_argument( - '-u', '--upstream', - help="Extend the regions in 5' by a given value (int).", - default=0, - metavar="UPSTREAM", - type=int, - required=False) - - parser_grp.add_argument( - '-d', '--downstream', - help="Extend the regions in 3' by a given value (int).", - default=0, - metavar="DOWNSTREAM", - type=int, - required=False) - - parser_grp.add_argument( - '-w', '--nb-window', - type=int, - default=1, - help='Split the region into w bins (see -n).', - required=False) - - parser_grp.add_argument( - '-k', '--nb-proc', - type=int, - default=1, - help='Use this many threads to compute coverage.', - required=False) - - parser_grp.add_argument( - '-f', '--ft-type', - type=str, - default="promoter", - help="Region in which coverage is to be computed (promoter, intron, intergenic, tts or any feature defined in the column 3 of the GTF).", - required=False) - - parser_grp.add_argument( - '-l', '--labels', - help='Bigwig labels.', - default=None, - type=str, - required=False) - - parser_grp.add_argument( - '-m', '--name-column', - type=str, - default="transcript_id", - help="Use this ids to compute the name (4th column in " - "bed output).", - required=False) - - parser_grp.add_argument( - '-p', - '--pseudo-count', - type=int, - default=1, - help='A pseudo-count to add in case count is equal to 0.') - - parser_grp.add_argument( - '-n', '--n-highest', - type=int, - default=None, - help='For each bigwig, use the n windows with higher values to compute coverage.', - required=False) - - parser_grp.add_argument( - '-x', - '--matrix-out', - action="store_true", - help='Matrix output format. Bigwigs as column names features as rows.', - required=False) - - parser_grp.add_argument( - '-zn', '--zero-to-na', - help='Use NA not zero when region is undefined in bigwig or below window size.', - action='store_true', - required=False) - - parser_grp.add_argument( - '-a', - '--key-name', - type=str, - default="cov", - help="If gtf format is requested, the name of the key.", - required=False) - - parser_grp.add_argument( - '-s', '--stat', - type=str, - choices=['mean', 'sum'], - default='mean', - help='The statistics to be computed for each region.', - required=False) + type=arg_formatter.txt_rw('w')) + + parser_grp.add_argument('-c', '--chrom-info', + help="Tabulated two-columns file. Chromosomes" + " as column 1 and sizes as" + " column 2 ", + default=None, + metavar="CHROMINFO", + action=CheckChromFile, + required=True) + + parser_grp.add_argument('-u', '--upstream', + help="Extend the regions in 5' by a given value (int).", + default=0, + metavar="UPSTREAM", + type=int, + required=False) + + parser_grp.add_argument('-d', '--downstream', + help="Extend the regions in 3' by a given value (int).", + default=0, + metavar="DOWNSTREAM", + type=int, + required=False) + + parser_grp.add_argument('-w', '--nb-window', + type=int, + default=1, + help='Split the region into w bins (see -n).', + required=False) + + parser_grp.add_argument('-k', '--nb-proc', + type=int, + default=1, + help='Use this many threads to compute coverage.', + required=False) + + parser_grp.add_argument('-f', '--ft-type', + type=str, + default="promoter", + help="Region in which coverage is to be computed (promoter, intron, intergenic, tts or any feature defined in the column 3 of the GTF).", + required=False) + + parser_grp.add_argument('-l', '--labels', + help='Bigwig labels.', + default=None, + type=str, + required=False) + + parser_grp.add_argument('-m', '--name-column', + type=str, + default="transcript_id", + help="Use this ids to compute the name (4th column in " + "bed output).", + required=False) + + parser_grp.add_argument('-p', + '--pseudo-count', + type=int, + default=1, + help='A pseudo-count to add in case count is equal to 0.') + + parser_grp.add_argument('-n', '--n-highest', + type=int, + default=None, + help='For each bigwig, use the n windows with higher values to compute coverage.', + required=False) + + parser_grp.add_argument('-x', + '--matrix-out', + action="store_true", + help='Matrix output format. Bigwigs as column names features as rows.', + required=False) + + parser_grp.add_argument('-zn', '--zero-to-na', + help='Use NA not zero when region is undefined in bigwig or below window size.', + action='store_true', + required=False) + + parser_grp.add_argument('-a', + '--key-name', + type=str, + default="cov", + help="If gtf format is requested, the name of the key.", + required=False) + + parser_grp.add_argument('-s', '--stat', + type=str, + choices=['mean', 'sum'], + default='mean', + help='The statistics to be computed for each region.', + required=False) return parser @@ -202,10 +180,7 @@ def coverage( chrom_info=None, nb_proc=1, matrix_out=False, - tmp_dir=None, - logger_file=None, - stat='mean', - verbosity=True): + stat='mean'): """ Compute transcript coverage with one or several bigWig. """ @@ -283,18 +258,20 @@ def coverage( # # ------------------------------------------------------------------------- + name_column = name_column.split(",") + if is_gtf: message("Getting regions of interest...") - if ft_type == "intergenic": + if ft_type.lower() == "intergenic": region_bo = gtf.get_intergenic(chrom_info, 0, 0).slop(s=True, l=upstream, r=downstream, g=chrom_info.name).sort() - elif ft_type == "intron": + elif ft_type.lower() == "intron": region_bo = gtf.get_introns().slop(s=True, l=upstream, @@ -303,28 +280,29 @@ def coverage( elif ft_type == "intron_by_tx": - region_bo = gtf.get_introns(by_transcript=True + region_bo = gtf.get_introns(by_transcript=True, + name=name_column, ).slop(s=True, l=upstream, r=downstream, g=chrom_info.name).sort() - elif ft_type == "promoter": + elif ft_type.lower() in ["promoter", "tss"]: - region_bo = gtf.get_tss(name=["transcript_id"]).slop(s=True, - l=upstream, - r=downstream, - g=chrom_info.name).sort() + region_bo = gtf.get_tss(name=name_column, ).slop(s=True, + l=upstream, + r=downstream, + g=chrom_info.name).sort() - elif ft_type == "tts": + elif ft_type.lower() in ["tts", "terminator"]: - region_bo = gtf.get_tts(name=["transcript_id"]).slop(s=True, - l=upstream, - r=downstream, - g=chrom_info.name).sort() + region_bo = gtf.get_tts(name=name_column).slop(s=True, + l=upstream, + r=downstream, + g=chrom_info.name).sort() else: - name_column = name_column.split(",") + region_bo = gtf.select_by_key( "feature", ft_type, 0 @@ -361,7 +339,7 @@ def coverage( nb_proc=nb_proc, n_highest=n_highest, stat=stat, - verbose=verbosity) + verbose=pygtftk.utils.VERBOSITY) if matrix_out: result_bed.close() @@ -369,15 +347,9 @@ def coverage( df_first = pd.read_csv(result_bed.name, sep="\t", header=None) df_first = df_first.ix[:, [0, 1, 2, 3, 5, 4]] - """ - bwig = [z.split("|")[0] for z in df_first[3]] - bwig_nr = list(set(bwig)) - """ df_list = [] - """ - for i in range(len(bwig_nr)): - """ + for i in range(len(labels)): # create a sub data frame containing the coverage values of the # current bwig diff --git a/pygtftk/plugins/del_attr.py b/pygtftk/plugins/del_attr.py index 248e1fca..a4b77b2f 100644 --- a/pygtftk/plugins/del_attr.py +++ b/pygtftk/plugins/del_attr.py @@ -6,7 +6,7 @@ import re import sys -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -31,15 +31,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser_grp.add_argument('-k', '--key', help='Comma separated list of attribute names or a ' @@ -68,10 +66,7 @@ def del_attr( outputfile=None, key="transcript_id", reg_exp=False, - invert_match=False, - tmp_dir=None, - logger_file=None, - verbosity=0): + invert_match=False): """ Delete extended attributes in the target gtf file. attr_list can be a comma-separated list of attributes. diff --git a/pygtftk/plugins/discretize_key.py b/pygtftk/plugins/discretize_key.py index 41148bcf..8f60620b 100644 --- a/pygtftk/plugins/discretize_key.py +++ b/pygtftk/plugins/discretize_key.py @@ -12,8 +12,7 @@ import numpy as np import pandas -from pygtftk.arg_formatter import FileWithExtension -from pygtftk.arg_formatter import int_greater_than_null +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -45,15 +44,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser_grp.add_argument('-k', '--src-key', help='The name of the source key', @@ -71,7 +68,10 @@ def make_parser(): help='The number of levels/classes to create.', default=2, metavar="KEY", - type=int_greater_than_null, + type=arg_formatter.ranged_num(lowest=1, + highest=None, + linc=True, + val_type='int'), required=True) parser_grp.add_argument('-l', '--labels', @@ -106,10 +106,7 @@ def discretize_key(inputfile=None, percentiles=False, percentiles_of_uniq=False, log=False, - labels=None, - tmp_dir=None, - logger_file=None, - verbosity=0): + labels=None): """ Create a new key by discretizing a numeric key. """ @@ -218,7 +215,7 @@ def discretize_key(inputfile=None, q = q + [np.percentile(dest_values_tmp, 100)] if len(q) != len(set(q)): - message("No ties are accepted in percentiles :", + message("No ties are accepted in percentiles.", type="WARNING", force=True) message("Breaks: " + str(q), type="WARNING", force=True) @@ -258,7 +255,7 @@ def discretize_key(inputfile=None, with tmp_file as tp_file: for p, v in zip(dest_pos, breaks): - tmp_file.write(str(p) + "\t" + str(v) + '\n') + tp_file.write(str(p) + "\t" + str(v) + '\n') gtf.add_attr_to_pos(tmp_file, new_key=dest_key).write(outputfile, diff --git a/pygtftk/plugins/divergent.py b/pygtftk/plugins/divergent.py index 91796f8f..603bb464 100644 --- a/pygtftk/plugins/divergent.py +++ b/pygtftk/plugins/divergent.py @@ -6,8 +6,8 @@ import sys from builtins import str -from pygtftk.arg_formatter import FileWithExtension -from pygtftk.arg_formatter import checkChromFile +from pygtftk import arg_formatter +from pygtftk.arg_formatter import CheckChromFile from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -40,15 +40,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('r')) parser_grp.add_argument('-c', '--chrom-info', help="Tabulated two-columns file. Chromosomes" @@ -56,7 +54,7 @@ def make_parser(): " column 2", default=None, metavar="CHROMINFO", - action=checkChromFile, + action=CheckChromFile, required=True) parser_grp.add_argument('-u', '--upstream', @@ -81,7 +79,7 @@ def make_parser(): required=False) parser_grp.add_argument('-S', '--no-strandness', - help="Do not consider strandness (only look whether the promoter from a transcript overlap with the promoter from another gene).", + help="Do not consider strandness (only look whether the promoter from a transcript overlaps with the promoter from another gene).", action="store_true", required=False) diff --git a/pygtftk/plugins/exon_size.py b/pygtftk/plugins/exon_size.py index 7f6e8879..a1836fba 100644 --- a/pygtftk/plugins/exon_size.py +++ b/pygtftk/plugins/exon_size.py @@ -7,7 +7,7 @@ from builtins import str from builtins import zip -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -34,15 +34,13 @@ def make_parser(): default=sys.stdin, metavar="GTF", required=False, - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output GTF file.", default=sys.stdout, metavar="TXT", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('r')) parser_grp.add_argument('-a', '--key-name', @@ -57,15 +55,12 @@ def make_parser(): def exon_sizes( inputfile=None, outputfile=None, - key_name=None, - tmp_dir=None, - logger_file=None, - verbosity=0): + key_name=None): """ Add a new key to transcript features containing a comma separated list of exon-size. """ - gtf = GTF(inputfile, check_ensembl_format=False) + gtf = GTF(inputfile) all_tx_ids = gtf.get_tx_ids(nr=True) tx_to_size_list = dict() diff --git a/pygtftk/plugins/feat_size.py b/pygtftk/plugins/feat_size.py index fd0da2d0..9f4eb62c 100644 --- a/pygtftk/plugins/feat_size.py +++ b/pygtftk/plugins/feat_size.py @@ -6,7 +6,7 @@ import sys from builtins import str -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import chomp @@ -35,16 +35,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file (BED).", default=sys.stdout, metavar="GTF/BED", - type=FileWithExtension('w', - valid_extensions=('\.[Gg][Tt][Ff]$', - '\.[Bb][Ee][Dd]$'))) + type=arg_formatter.gtf_or_bed_rwb('w')) parser_grp.add_argument('-t', '--ft-type', help="A target feature (as found in the 3rd " @@ -86,10 +83,7 @@ def feature_size( names="transcript_id", key_name='feature_size', separator="|", - bed=False, - tmp_dir=None, - logger_file=None, - verbosity=0): + bed=False): """ Get the size and limits (start/end) of features enclosed in the GTF. If bed format is requested returns the limits zero-based half open and the size as a score. @@ -107,8 +101,6 @@ def feature_size( names = names.split(",") - tmp_file = make_tmp_file(prefix="feature_size_", suffix=".txt") - if ft_type != 'mature_rna': if bed: diff --git a/pygtftk/plugins/get_5p_3p_coords.py b/pygtftk/plugins/get_5p_3p_coords.py index 6c5c23bb..ff1f004e 100644 --- a/pygtftk/plugins/get_5p_3p_coords.py +++ b/pygtftk/plugins/get_5p_3p_coords.py @@ -5,7 +5,7 @@ import os import sys -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import chomp @@ -30,16 +30,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file (BED).", default=sys.stdout, metavar="BED", - type=FileWithExtension('w', - valid_extensions=('\.[Bb][Ee][Dd]$', - '\.[Bb][Ee][Dd]6$'))) + type=arg_formatter.bed_rw('w')) parser_grp.add_argument('-t', '--ft-type', help="The target feature (as found in the 3rd " @@ -90,10 +87,7 @@ def get_5p_3p_coords(inputfile=None, more_names='', transpose=0, invert=False, - explicit=False, - tmp_dir=None, - logger_file=None, - verbosity=0): + explicit=False): """ Get the 5p or 3p coordinate for each feature (e.g TSS or TTS for a transcript). """ diff --git a/pygtftk/plugins/get_attr_list.py b/pygtftk/plugins/get_attr_list.py index b40c4275..371c6a26 100644 --- a/pygtftk/plugins/get_attr_list.py +++ b/pygtftk/plugins/get_attr_list.py @@ -1,11 +1,10 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os import sys -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -26,18 +25,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="TXT", - type=FileWithExtension('w', - valid_extensions=('\.[Tt][Xx][Tt]', - '\.[Cc][Ss][Vv]', - '\.[Tt][Aa][Bb]', - '\.[Tt][Ss][Vv]'))) + type=arg_formatter.txt_rw('w')) parser_grp.add_argument('-s', '--separator', help="The separator to be used for separating key names.", @@ -51,10 +45,7 @@ def make_parser(): def get_attr_list( inputfile=None, outputfile=None, - separator="\n", - tmp_dir=None, - logger_file=None, - verbosity=0): + separator="\n"): """ Get the list of attributes from a GTF file. """ diff --git a/pygtftk/plugins/get_attr_value_list.py b/pygtftk/plugins/get_attr_value_list.py index f2085e1c..24265aaa 100644 --- a/pygtftk/plugins/get_attr_value_list.py +++ b/pygtftk/plugins/get_attr_value_list.py @@ -1,11 +1,10 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os import sys -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -26,18 +25,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="TXT", - type=FileWithExtension('w', - valid_extensions=('\.[Tt][Xx][Tt]', - '\.[Cc][Ss][Vv]', - '\.[Tt][Aa][Bb]', - '\.[Tt][Ss][Vv]'))) + type=arg_formatter.txt_rw('w')) parser_grp.add_argument('-k', '--key-name', help="Key name.", @@ -63,10 +57,7 @@ def get_attr_value_list( outputfile=None, key_name=None, separator="\n", - count=False, - tmp_dir=None, - logger_file=None, - verbosity=0): + count=False): """ Get the list of values observed for an attributes. """ diff --git a/pygtftk/plugins/get_example.py b/pygtftk/plugins/get_example.py index f6595c2a..bb881a0a 100644 --- a/pygtftk/plugins/get_example.py +++ b/pygtftk/plugins/get_example.py @@ -1,5 +1,4 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import glob @@ -42,6 +41,8 @@ def make_parser(): "simple_03", "simple_04", "simple_05", + "simple_06", + "mini_real_10M", "control_list"], default="simple", required=False) @@ -79,10 +80,7 @@ def get_example(outputfile=None, dataset=None, format="gtf", list=False, - all_dataset=False, - tmp_dir=None, - logger_file=None, - verbosity=0): + all_dataset=False): """ Print example gtf files. """ @@ -148,7 +146,7 @@ def get_example(outputfile=None, message("Copying file : " + os.path.basename(i), force=True) shutil.copy(i, ".") else: - message("Copy canceled, file already exist:" + os.path.basename(i), force=True) + message("Copy canceled, file already exist: " + os.path.basename(i), force=True) else: @@ -162,7 +160,6 @@ def get_example(outputfile=None, target_path = os.path.join(pygtftk.__path__[0], 'data', dataset) message("Copying from :" + target_path) - for i in file_path: if not os.path.exists(os.path.join(os.getcwd(), os.path.basename(i))): message("Copying file : " + os.path.basename(i), force=True) diff --git a/pygtftk/plugins/get_feat_seq.py b/pygtftk/plugins/get_feat_seq.py index 7ad8e4eb..9b01fa5e 100644 --- a/pygtftk/plugins/get_feat_seq.py +++ b/pygtftk/plugins/get_feat_seq.py @@ -1,27 +1,27 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os -import shutil +import re import sys from builtins import str -from builtins import zip -from pygtftk.arg_formatter import FileWithExtension -from pygtftk.arg_formatter import globbedFileList +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly -from pygtftk.utils import message, make_tmp_file +from pygtftk.utils import message __updated__ = "2018-01-20" __doc__ = """ - Get feature sequences in a flexible fasta format from a GTF file. + Get feature sequences (i.e. column 3) in a flexible fasta format from a GTF file. """ __notes__ = """ -- The sequences are returned in 5' to 3' orientation. -- If you want to use wildcards, use quotes :e.g. 'foo/bar*.fa'. + -- See get_tx_seq for mature RNA sequence. + -- If -\-unique is used if a header was already encountered the record won't be print. + Take care to use unambiguous identifiers in the header. """ @@ -35,22 +35,20 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output FASTA file.", default=sys.stdout, metavar="FASTA", - type=FileWithExtension('w', - valid_extensions=('\.[Ff][Aa][Ss][Tt][Aa]$', - '\.[Ff][Aa]$'))) + type=arg_formatter.fasta_rw('w')) parser_grp.add_argument('-g', '--genome', - help="The genome in fasta format. Accept path with wildcards (e.g. *.fa).", + help="The genome in fasta format.", default=None, - action=globbedFileList, - required=True) + metavar="FASTA", + required=True, + type=arg_formatter.fasta_rw('r')) parser_grp.add_argument('-s', '--separator', help="To separate info in header.", @@ -76,8 +74,13 @@ def make_parser(): action="store_true", required=False) - parser_grp.add_argument('-e', '--explicit', - help="Write explicitly the name of the keys in the header.", + parser_grp.add_argument('-r', '--rev-comp-to-header', + help="Indicate in the header whether sequence was rev-complemented.", + action="store_true", + required=False) + + parser_grp.add_argument('-u', '--unique', + help="Don't write redondant IDS.", action="store_true", required=False) @@ -90,61 +93,40 @@ def get_feat_seq(inputfile=None, feature_type="exon", separator="", no_rev_comp=False, - explicit=False, label="", - tmp_dir=None, - logger_file=None, - verbosity=0): + rev_comp_to_header=False, + unique=False): """ Description: Get transcripts sequences in fasta format from a GTF file. """ # ------------------------------------------------------------------------- - # Check args consistancy. - # + # Should sequences be reverse-complemented # ------------------------------------------------------------------------- - if feature_type in ["transcript", "gene"]: - message("Please use get_tx_seq for transcript sequence.", - type="ERROR") + force_strandedness = not no_rev_comp # ------------------------------------------------------------------------- # Check chrom to avoid segfault # https://github.com/dputhier/libgtftk/issues/27 # ------------------------------------------------------------------------- + if genome.name.endswith(".gz"): + message("Genome in gz format is not currently supported.", type="ERROR") + genome_chr_list = [] - message("%d fasta files found." % len(genome)) - - if len(genome) == 1: - message("Checking fasta file chromosome list") - genome = genome[0] - with genome as genome_file: - for i in genome_file: - if i.startswith(">"): - i = i.rstrip("\n") - genome_chr_list += [i[1:]] - else: - message("Merging fasta files") - tmp_genome = make_tmp_file(prefix="genome", suffix=".fa") - with tmp_genome as tg: - for curr_file in genome: - message("Merging %s" % curr_file.name) - with curr_file as cf: - shutil.copyfileobj(cf, tg, 1024 * 1024 * 100) - - message("Checking fasta file chromosome list") - genome = open(tmp_genome.name, "r") - with genome as genome_file: - for i in genome_file: - if i.startswith(">"): - i = i.rstrip("\n") - genome_chr_list += [i[1:]] - - rev_comp = not no_rev_comp - - gtf = GTF(inputfile) + message("Fasta files found: %s" % genome.name) + + message("Checking fasta file chromosome list") + + with genome as geno: + for i in geno: + if i.startswith(">"): + i = i.rstrip("\n") + genome_chr_list += [i[1:]] + + gtf = GTF(inputfile, check_ensembl_format=False) gtf_chr_list = gtf.get_chroms(nr=True) @@ -168,36 +150,47 @@ def get_feat_seq(inputfile=None, # ------------------------------------------------------------------------- message("Retrieving fasta sequences.") - fasta_seq = gtf.get_sequences(genome=genome.name, - intron=True, - rev_comp=rev_comp) - tx_gtf = gtf.select_by_key("feature", "transcript") + feat_seq = gtf.select_by_key("feature", + feature_type + ).to_bed(name=label.split(","), + sep=separator + ).sequence(fi=genome.name, + name=True, + s=force_strandedness) + + id_printed = set() + + to_print = True - label = ",".join([x for x in label.split(',') if x != 'feature']) + for nb_line, line in enumerate(open(feat_seq.seqfn)): + if line.startswith(">"): - if label != '': - tx_info = tx_gtf.extract_data("transcript_id," + - label, - as_dict_of_lists=True) + # This (+/-) may be added by pybedtool + # but can be accessed though --label + line = re.sub("\(\+\)$", "", line) + line = re.sub("\(\-\)$", "", line) + + if rev_comp_to_header: + if force_strandedness: + line = line + separator + "rev_comp" + else: + line = line + separator + "no_rev_comp" + + if unique: + if line in id_printed: + to_print = False + if to_print: + outputfile.write(line) + id_printed.add(line) - else: - tx_info = dict() - for i in fasta_seq.iter_features(feat=feature_type): - if not explicit: - feat_info = [feature_type] + [str(i.start)] + [str(i.end)] - header = separator.join(tx_info[i.transcript_id] + feat_info) else: - feat_info = ["feature_type=" + feature_type] + \ - ["feature_start=" + str(i.start)] + \ - ["feature_end=" + str(i.end)] - header = [str(x[0]) + "=" + x[1] - for x in zip(label.split(","), tx_info[i.transcript_id])] - header = separator.join(header + feat_info) - outputfile.write(">" + header + "\n") - outputfile.write(i.sequence + "\n") + if not to_print: + to_print = True + else: + outputfile.write(line) close_properly(outputfile, inputfile) @@ -220,27 +213,23 @@ def main(): #get_feat_seq: load dataset @test "get_feat_seq_0" { - result=`gtftk get_example -f '*' -d simple` + result=`gtftk get_example -f '*' -d simple; gtftk get_example -f '*' -d mini_real_10M; if [ ! -f chr1_hg38_10M.fa ]; then gunzip -f chr1_hg38_10M.fa.gz; fi ` [ "$result" = "" ] } #get_feat_seq: - @test "get_feat_seq_0.1" { + @test "get_feat_seq_1" { result=`gtftk get_feat_seq -i simple.gtf -g simple.fa -l feature,transcript_id,start -t exon | grep "G0003T001" -A 1| perl -ne 'chomp, print $_,"," if(/^[AaTtCcGg]+$/)'` - [ "$result" = "aatta,gcttg," ] + [ "$result" = "gcttg,aatta," ] } #get_feat_seq: - @test "get_feat_seq_1" { + @test "get_feat_seq_2" { result=`gtftk get_feat_seq -i simple.gtf -g simple.fa -l feature,transcript_id,start -t exon -n | grep "G0003T001" -A 1| perl -ne 'chomp, print $_,"," if(/^[AaTtCcGg]+$/)'` [ "$result" = "caagc,taatt," ] } - #get_feat_seq: - @test "get_feat_seq_2" { - result=`gtftk get_feat_seq -i simple.gtf -g simple.fa -l feature,transcript_id,start -t exon | grep "G0003T001" -A 1| perl -ne 'chomp, print $_,"," if(/^[AaTtCcGg]+$/)'` - [ "$result" = "aatta,gcttg," ] - } + #get_feat_seq: @test "get_feat_seq_3" { @@ -251,7 +240,7 @@ def main(): #get_feat_seq: @test "get_feat_seq_4" { result=`gtftk get_feat_seq -i simple.gtf -g simple.fa -l feature,transcript_id,start -t CDS | grep "G0006T001" -A 1| perl -ne 'chomp, print $_,"," if(/^[AaTtCcGg]+$/)'` - [ "$result" = "ct,att,acat," ] + [ "$result" = "acat,att,ct," ] } #get_feat_seq: @@ -260,19 +249,60 @@ def main(): [ "$result" = "atgt,aat,ag," ] } - #get_feat_seq: - @test "get_feat_seq_6" { - result=`gtftk get_feat_seq -i simple.gtf -g simple.fa -l feature,transcript_id,start -t CDS -n | grep "G0006T001" -A 1| perl -ne 'chomp, print $_,"," if(/^[AaTtCcGg]+$/)'` - [ "$result" = "atgt,aat,ag," ] - } - #get_feat_seq: @test "get_feat_seq_7" { result=`gtftk get_feat_seq -i simple.gtf -g simple.fa -t CDS | grep G0006T001 | perl -npe 's/\\n/,/g'` - [ "$result" = ">G0006T001|G0006|chr1|22|35|CDS|33|34,>G0006T001|G0006|chr1|22|35|CDS|28|30,>G0006T001|G0006|chr1|22|35|CDS|22|25," ] + [ "$result" = ">CDS|G0006T001|G0006|chr1|21|25,>CDS|G0006T001|G0006|chr1|27|30,>CDS|G0006T001|G0006|chr1|32|34," ] + } + + #check with a real dataset (no rev-comp) minus strand + @test "get_feat_seq_8" { + result=`gtftk select_by_key -f ids_minus_exon.txt -k exon_id -i mini_real_10M.gtf.gz | gtftk get_feat_seq -g chr1_hg38_10M.fa -l exon_id -u | perl -ne 'print uc $_' > observed_sequence_minus_exon.fa` + [ -f observed_sequence_minus_exon.fa ] } + + #get_feat_seq: + @test "get_feat_seq_9" { + result=`diff observed_sequence_minus_exon.fa expected_sequence_minus_exon.fa` + [ "$result" = "" ] + } - + #check with a real dataset (no rev-comp) plus strand + @test "get_feat_seq_10" { + result=`gtftk select_by_key -f ids_plus_exon.txt -k exon_id -i mini_real_10M.gtf.gz | gtftk get_feat_seq -g chr1_hg38_10M.fa -l exon_id -u | perl -ne 'print uc $_' > observed_sequence_plus_exon.fa` + [ -f observed_sequence_plus_exon.fa ] + } + + #get_feat_seq: + @test "get_feat_seq_11" { + result=`diff observed_sequence_plus_exon.fa expected_sequence_plus_exon.fa` + [ "$result" = "" ] + } + + #check with a real dataset (no rev-comp) minus strand + @test "get_feat_seq_12" { + result=`gtftk select_by_key -f ids_minus_exon.txt -k exon_id -i mini_real_10M.gtf.gz | gtftk get_feat_seq -g chr1_hg38_10M.fa -l exon_id -u -n | perl -ne 'print uc $_' > observed_sequence_minus_exon_no_rv.fa` + [ -f observed_sequence_minus_exon_no_rv.fa ] + } + + #get_feat_seq: + @test "get_feat_seq_13" { + result=`diff observed_sequence_minus_exon_no_rv.fa expected_sequence_minus_exon_no_rv.fa` + [ "$result" = "" ] + } + + #check with a real dataset (with rev-comp) plus strand + @test "get_feat_seq_14" { + result=`gtftk select_by_key -f ids_plus_exon.txt -k exon_id -i mini_real_10M.gtf.gz | gtftk get_feat_seq -g chr1_hg38_10M.fa -l exon_id -u -n | perl -ne 'print uc $_' > observed_sequence_plus_exon.fa` + [ -f observed_sequence_plus_exon.fa ] + } + + #get_feat_seq: + @test "get_feat_seq_15" { + result=`diff observed_sequence_plus_exon.fa expected_sequence_plus_exon.fa` + [ "$result" = "" ] + } + """ CmdObject(name="get_feat_seq", diff --git a/pygtftk/plugins/get_feature_list.py b/pygtftk/plugins/get_feature_list.py index 365c38ab..0bcefb7b 100644 --- a/pygtftk/plugins/get_feature_list.py +++ b/pygtftk/plugins/get_feature_list.py @@ -1,12 +1,11 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os import sys from builtins import str -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -27,18 +26,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="TXT", - type=FileWithExtension('w', - valid_extensions=('\.[Tt][Xx][Tt]', - '\.[Cc][Ss][Vv]', - '\.[Tt][Aa][Bb]', - '\.[Tt][Ss][Vv]'))) + type=arg_formatter.txt_rw('w')) parser_grp.add_argument('-s', '--separator', help="The separator to be used for separating key names.", @@ -52,10 +46,7 @@ def make_parser(): def get_feature_list( inputfile=None, outputfile=None, - separator="", - tmp_dir=None, - logger_file=None, - verbosity=0): + separator=""): """ Get the list of features enclosed in the GTF. """ @@ -72,7 +63,7 @@ def main(): myparser = make_parser() args = myparser.parse_args() args = dict(args.__dict__) - count(**args) + get_feature_list(**args) if __name__ == '__main__': diff --git a/pygtftk/plugins/get_tx_seq.py b/pygtftk/plugins/get_tx_seq.py index a568ac07..36c172a2 100644 --- a/pygtftk/plugins/get_tx_seq.py +++ b/pygtftk/plugins/get_tx_seq.py @@ -1,5 +1,4 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os @@ -9,7 +8,7 @@ from builtins import str from builtins import zip -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.arg_formatter import globbedFileList from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF @@ -37,16 +36,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output FASTA file.", default=sys.stdout, metavar="FASTA", - type=FileWithExtension('w', - valid_extensions=('\.[Ff][Aa][Ss][Tt][Aa]$', - '\.[Ff][Aa]$'))) + type=arg_formatter.fasta_rw('w')) parser_grp.add_argument('-g', '--genome', help="The genome in fasta format. Accept path with wildcards (e.g. *.fa).", @@ -119,10 +115,7 @@ def get_tx_seq(inputfile=None, label="", sleuth_format=True, explicit=True, - assembly="bla", - tmp_dir=None, - logger_file=None, - verbosity=0): + assembly="bla"): """ Description: Get transcripts sequences in fasta format from a GTF file. """ @@ -135,6 +128,11 @@ def get_tx_seq(inputfile=None, message("%d fasta files found." % len(genome)) + as_gz_ext = [True for x in genome if x.name.endswith(".gz")] + + if any(as_gz_ext): + message("Genome in gz format is not currently supported.", type="ERROR") + if len(genome) == 1: message("Checking fasta file chromosome list") genome = genome[0] @@ -324,7 +322,7 @@ def main(): #sleuth output @test "get_tx_seq_8" { - result=`gtftk get_tx_seq -i simple.gtf -g simple.fa -f| wc -l` + result=`rm -f /tmp/get_example_shuf.gtf; gtftk get_tx_seq -i simple.gtf -g simple.fa -f| wc -l` [ "$result" -eq 30 ] } @@ -364,6 +362,52 @@ def main(): [ "$result" = ">transcript,G0001T002,chr1" ] } + # load mini_real_10M + @test "get_tx_seq_15" { + result=`gtftk get_example -f '*' -d mini_real_10M; if [ ! -f chr1_hg38_10M.fa ]; then gunzip -f chr1_hg38_10M.fa.gz; fi ` + [ "$result" = "" ] + } + + # Check the size of transcript seq compared to ensembl. + @test "get_tx_seq_16" { + result=`gtftk get_tx_seq -i mini_real_10M.gtf.gz -g chr1_hg38_10M.fa -l transcript_id | perl -ne 'if(/^>/){/>(.*)/; $id=$1}else{chomp; print $id,"\\t",length, "\\n"}' > observed_size.txt` + [ -f observed_size.txt ] + } + + # Check the size of transcript seq compared to ensembl. + @test "get_tx_seq_17" { + result=`cat observed_size.txt | md5sum-lite | sed 's/ .*//'` + [ "$result" = "1d145f52046dba514040623f1efe2072" ] + } + + # Check the sequence of tx on plus strand compared to ensembl. + # should be the same as 'cat expected_sequence_plus.fa | md5sum-lite' + @test "get_tx_seq_18" { + result=`gtftk get_tx_seq -i ids_plus.gtf -g chr1_hg38_10M.fa -l transcript_id | perl -ne 'print uc $_'> observed_sequence_plus.fa; cat observed_sequence_plus.fa | md5sum-lite | sed 's/ .*//'` + [ "$result" = "7327e4010944c2def4431bf5ef77a4f1" ] + } + + # Check the sequence of tx on plus strand compared to ensembl (no rev-comp). + # should be the same as 'cat expected_sequence_plus.fa | md5sum-lite' + @test "get_tx_seq_19" { + result=`gtftk get_tx_seq -i ids_plus.gtf -g chr1_hg38_10M.fa -l transcript_id -n | perl -ne 'print uc $_'> observed_sequence_plus.fa; cat observed_sequence_plus.fa | md5sum-lite | sed 's/ .*//'` + [ "$result" = "7327e4010944c2def4431bf5ef77a4f1" ] + } + + # Check the sequence of tx on minus strand compared to ensembl (rev_comp). + # should be the same as 'cat expected_sequence_minus_rv.fa | md5sum-lite' + @test "get_tx_seq_20" { + result=`gtftk get_tx_seq -i ids_minus.gtf -g chr1_hg38_10M.fa -l transcript_id | perl -ne 'print uc $_'> observed_sequence_minus_rv.fa; cat observed_sequence_minus_rv.fa | md5sum-lite | sed 's/ .*//'` + [ "$result" = "6f40e63555a4bb6f849261b0fe9e928c" ] + } + + # Check the sequence of tx on minus strand compared to ensembl (no rev_comp). + # should be the same as 'cat expected_sequence_minus_no_rv.fa | md5sum-lite' + @test "get_tx_seq_21" { + result=`gtftk get_tx_seq -i ids_minus.gtf -g chr1_hg38_10M.fa -l transcript_id -n | perl -ne 'print uc $_'> observed_sequence_minus_no_rv.fa; cat observed_sequence_minus_no_rv.fa | md5sum-lite | sed 's/ .*//'` + [ "$result" = "87c15b230b6057be091566ac29ada7a1" ] + } + """ CmdObject(name="get_tx_seq", diff --git a/pygtftk/plugins/intergenic.py b/pygtftk/plugins/intergenic.py index 04c5cf37..b966c002 100644 --- a/pygtftk/plugins/intergenic.py +++ b/pygtftk/plugins/intergenic.py @@ -1,13 +1,12 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os import sys from builtins import str -from pygtftk.arg_formatter import FileWithExtension -from pygtftk.arg_formatter import checkChromFile +from pygtftk import arg_formatter +from pygtftk.arg_formatter import CheckChromFile from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import chomp @@ -33,15 +32,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file (BED).", default=sys.stdout, metavar="BED", - type=FileWithExtension('w', - valid_extensions='\.[Bb][Ee][Dd]$')) + type=arg_formatter.bed_rw('w')) parser_grp.add_argument('-c', '--chrom-info', help="Tabulated two-columns file. Chromosomes" @@ -49,7 +46,7 @@ def make_parser(): " column 2", default=None, metavar="CHROMINFO", - action=checkChromFile, + action=CheckChromFile, required=True) return parser @@ -58,10 +55,7 @@ def make_parser(): def intergenic( inputfile=None, outputfile=None, - chrom_info=None, - tmp_dir=None, - logger_file=None, - verbosity=0): + chrom_info=None): """ Extract intergenic regions. """ diff --git a/pygtftk/plugins/intron_size.py b/pygtftk/plugins/intron_size.py index 16f0e2ad..66c99985 100644 --- a/pygtftk/plugins/intron_size.py +++ b/pygtftk/plugins/intron_size.py @@ -1,12 +1,11 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os import sys from builtins import str -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -32,19 +31,13 @@ def make_parser(): default=sys.stdin, metavar="GTF", required=False, - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, - metavar="TXT", - type=FileWithExtension('w', - valid_extensions=('\.[Tt][Xx][Tt]', - '\.[Cc][Ss][Vv]', - '\.[Tt][Aa][Bb]', - '\.[Tt][Ss][Vv]', - '\.[Cc][Oo][Vv]'))) + metavar="GTF", + type=arg_formatter.gtf_rw('w')) parser_grp.add_argument('-a', '--key-name', @@ -59,10 +52,7 @@ def make_parser(): def intron_sizes( inputfile=None, outputfile=None, - key_name=None, - tmp_dir=None, - logger_file=None, - verbosity=0): + key_name=None): """ Add a new key to transcript features containing a comma separated list of intron sizes. """ diff --git a/pygtftk/plugins/intronic.py b/pygtftk/plugins/intronic.py index 169b7d3e..40bebe28 100644 --- a/pygtftk/plugins/intronic.py +++ b/pygtftk/plugins/intronic.py @@ -1,12 +1,11 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os import sys from builtins import str -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import chomp @@ -33,15 +32,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file (BED).", default=sys.stdout, metavar="BED", - type=FileWithExtension('w', - valid_extensions='\.[Bb][Ee][Dd]$')) + type=arg_formatter.bed_rw('w')) parser_grp.add_argument('-b', '--by-transcript', help="The intronic regions are returned for each" @@ -78,11 +75,8 @@ def intronic( names='transcript_id', separator="_", intron_nb_in_name=False, - tmp_dir=None, no_feature_name=False, - by_transcript=False, - logger_file=None, - verbosity=0): + by_transcript=False): """ Extract intronic regions. """ diff --git a/pygtftk/plugins/join_attr.py b/pygtftk/plugins/join_attr.py index adf14d04..979b70f8 100644 --- a/pygtftk/plugins/join_attr.py +++ b/pygtftk/plugins/join_attr.py @@ -1,11 +1,10 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os import sys -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -27,15 +26,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser_grp.add_argument('-k', '--key-to-join', help='The name of the key used to join (e.g transcript_id).', @@ -89,10 +86,7 @@ def join_attr( new_key=None, target_feature=None, key_to_join=None, - matrix=None, - tmp_dir=None, - logger_file=None, - verbosity=0): + matrix=None): """ Join attributes from a tabulated file. """ diff --git a/pygtftk/plugins/join_multi_file.py b/pygtftk/plugins/join_multi_file.py index a41a2c95..696a0085 100644 --- a/pygtftk/plugins/join_multi_file.py +++ b/pygtftk/plugins/join_multi_file.py @@ -1,11 +1,9 @@ #!/usr/bin/env python -from __future__ import print_function - import argparse import os import sys -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -27,15 +25,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser_grp.add_argument('-k', '--key-to-join', help='The name of the key used to join (e.g transcript_id).', @@ -50,7 +46,7 @@ def make_parser(): type=str, required=False) - parser_grp.add_argument('matrice_files', + parser_grp.add_argument('matrix_files', help="'A set of " "matrix files with row names as target keys column names as novel " "key and each cell as value.", @@ -65,10 +61,7 @@ def join_multi_file( outputfile=None, target_feature=None, key_to_join=None, - matrice_files=[], - tmp_dir=None, - logger_file=None, - verbosity=0): + matrix_files=()): """ Join attributes from a set of tabulated files. """ @@ -99,7 +92,7 @@ def join_multi_file( # Do it # ----------------------------------------------------------- - for join_file in matrice_files: + for join_file in matrix_files: gtf = gtf.add_attr_from_matrix_file(feat=target_feature, key=key_to_join, inputfile=join_file.name) diff --git a/pygtftk/plugins/merge_attr.py b/pygtftk/plugins/merge_attr.py index f2fd5e56..7e2b8633 100644 --- a/pygtftk/plugins/merge_attr.py +++ b/pygtftk/plugins/merge_attr.py @@ -1,11 +1,10 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os import sys -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -32,15 +31,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser_grp.add_argument('-k', '--src-key', help='Comma separated list of keys to join.', @@ -76,21 +73,18 @@ def merge_attr( src_key="gene_id,transcript_id", separator="|", target_feature="*", - dest_key="gene_tx_ids", - tmp_dir=None, - logger_file=None, - verbosity=None): + dest_key="gene_tx_ids"): """ Merge a set of attributes into a destination attribute. """ - gtf = GTF(inputfile, - check_ensembl_format=False - ).merge_attr(target_feature, - src_key, - dest_key, - separator).write(outputfile, - gc_off=True) + GTF(inputfile, + check_ensembl_format=False + ).merge_attr(target_feature, + src_key, + dest_key, + separator).write(outputfile, + gc_off=True) close_properly(outputfile, inputfile) diff --git a/pygtftk/plugins/midpoints.py b/pygtftk/plugins/midpoints.py index da7d2a02..3ce66752 100644 --- a/pygtftk/plugins/midpoints.py +++ b/pygtftk/plugins/midpoints.py @@ -1,6 +1,4 @@ #!/usr/bin/env python -from __future__ import division -from __future__ import print_function import argparse import os @@ -10,7 +8,7 @@ from future.utils import old_div from pybedtools import BedTool -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import chomp @@ -35,19 +33,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF/BED", - type=FileWithExtension('r', - valid_extensions=('\.[Gg][Tt][Ff](\.[Gg][Zz])?$', - '\.[Bb][Ee][Dd]$', - '\.[Bb][Ee][Dd]3$', - '\.[Bb][Ee][Dd]6$'))) + type=arg_formatter.gtf_or_bed_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file (BED).", default=sys.stdout, metavar="BED", - type=FileWithExtension('w', - valid_extensions=('\.[Bb][Ee][Dd]$', - '\.[Bb][Ee][Dd]6$'))) + type=arg_formatter.bed_rw('w')) parser_grp.add_argument('-t', '--ft-type', help="The target feature (as found in the 3rd " @@ -76,10 +68,7 @@ def midpoints( outputfile=None, ft_type="transcript", names="transcript_id", - separator="|", - tmp_dir=None, - logger_file=None, - verbosity=0): + separator="|"): """ Get the midpoint coordinates for the requested feature. """ diff --git a/pygtftk/plugins/mk_matrix.py b/pygtftk/plugins/mk_matrix.py index 4f962d07..d70f63d3 100644 --- a/pygtftk/plugins/mk_matrix.py +++ b/pygtftk/plugins/mk_matrix.py @@ -4,18 +4,18 @@ import argparse import os +import pyBigWig import sys import zipfile from builtins import range from builtins import str import pandas as pd -import pyBigWig from pybedtools import BedTool -from pygtftk.arg_formatter import FileWithExtension -from pygtftk.arg_formatter import checkChromFile -from pygtftk.arg_formatter import int_greater_than_null, int_ge_to_null +import pygtftk +from pygtftk import arg_formatter +from pygtftk.arg_formatter import CheckChromFile from pygtftk.bwig.bw_coverage import bw_profile_mp from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF @@ -46,16 +46,14 @@ def make_parser(): parser_grp.add_argument('bigwiglist', help='A list of Bigwig files (last argument).', - type=argparse.FileType('r'), + type=arg_formatter.bw_rw('r'), nargs='+') parser_grp.add_argument('-i', '--inputfile', help="A GTF file or bed file. A GTF if .", default=sys.stdin, metavar="GTF/BED", - type=FileWithExtension('r', - valid_extensions=('\.[Gg][Tt][Ff](\.[Gg][Zz])?$', - '\.[Bb][Ee][Dd]$'))) + type=arg_formatter.gtf_or_bed_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file name (.zip extension will be added).", @@ -85,38 +83,43 @@ def make_parser(): parser_grp.add_argument('-p', '--pseudo-count', help='Pseudo-count to add to all values.', default=0, - type=int_ge_to_null, + type=arg_formatter.ranged_num(lowest=0, highest=None, + val_type="float", linc=True), required=False) parser_grp.add_argument('-u', '--upstream', help="Extend the region of interest in 5' by a given value.", default=1000, - type=int_ge_to_null, + type=arg_formatter.ranged_num(lowest=0, highest=None, + val_type="int", linc=True), required=False) parser_grp.add_argument('-d', '--downstream', help="Extend the region of interest in 3' by a given value.", default=1000, - type=int_ge_to_null, + type=arg_formatter.ranged_num(lowest=0, highest=None, + val_type="int", linc=True), required=False) parser_grp.add_argument('-c', '--chrom-info', help='Tabulated file (chr as ' 'column 1, sizes as column 2.)', default=None, - action=checkChromFile, + action=CheckChromFile, required=True) parser_grp.add_argument('-w', '--bin-nb', help='Split the region into w bins.', default=100, - type=int_greater_than_null, + type=arg_formatter.ranged_num(lowest=1, highest=None, + val_type="int", linc=True), required=False) parser_grp.add_argument('-k', '--nb-proc', help='Use this many threads to compute coverage.', default=1, - type=int_greater_than_null, + type=arg_formatter.ranged_num(lowest=1, highest=None, + val_type="int", linc=True), required=False) parser_grp.add_argument('-b', '--bin-around-frac', @@ -156,10 +159,7 @@ def mk_matrix( nb_proc=None, labels=None, no_stranded=False, - tmp_dir=None, - logger_file=None, - zero_to_na=False, - verbosity=False): + zero_to_na=False): """ Description: Create a matrix to be used by 'profile' and 'heatmap' commands. """ @@ -382,7 +382,7 @@ def mk_matrix( labels=labels, outputfile=outputfile.name, zero_to_na=zero_to_na, - verbose=verbosity) + verbose=pygtftk.utils.VERBOSITY) outputfile_list["main"] = tmp_file @@ -435,7 +435,7 @@ def mk_matrix( labels=labels, outputfile=outputfile.name, zero_to_na=zero_to_na, - verbose=verbosity) + verbose=pygtftk.utils.VERBOSITY) outputfile_list["upstream"] = tmp_file @@ -473,7 +473,7 @@ def mk_matrix( labels=labels, outputfile=outputfile.name, zero_to_na=zero_to_na, - verbose=verbosity) + verbose=pygtftk.utils.VERBOSITY) outputfile_list["downstream"] = tmp_file @@ -620,14 +620,14 @@ def main(): #mk_matrix: every file contain 15 transcripts @test "mk_matrix_6" { - result=`rm -Rf simple_mat*; rm -Rf toto; gtftk mk_matrix -i simple.gtf -u 2 -d 2 -t transcript -w 4 simple.bw -o simple_mat -c simple.chromInfo -K toto; wc -l toto/*.bed | grep 15| wc -l` - [ "$result" -eq 6 ] + result=`rm -Rf simple_mat*; rm -Rf mk_matrix_6; gtftk mk_matrix -i simple.gtf -u 2 -d 2 -t transcript -w 4 simple.bw -o simple_mat -c simple.chromInfo -K mk_matrix_6 -k 1; wc -l mk_matrix_6/* | grep 15 | wc -l` + [ "$result" -eq 9 ] } #mk_matrix: test downstream + upstream (transcript) @test "mk_matrix_7" { - result=`rm -Rf simple_mat*; rm -Rf toto; gtftk mk_matrix -i simple.gtf -u 2 -d 2 -t transcript -w 4 simple.bw -o simple_mat -c simple.chromInfo ; unzip -u simple_mat.zip &>/dev/null; cut -f8,9,10,11 simple_mat| tail -14| perl -npe 's/\\t/|/g; s/\\n/,/g' | sed 's/0000000005//g' | sed 's/69999999995/7/g'` + result=`rm -Rf simple_mat*; rm -Rf mk_matrix_7; gtftk mk_matrix -i simple.gtf -u 2 -d 2 -t transcript -w 4 simple.bw -o simple_mat -c simple.chromInfo ; unzip -u simple_mat.zip &>/dev/null; cut -f8,9,10,11 simple_mat| tail -14| perl -npe 's/\\t/|/g; s/\\n/,/g' | sed 's/0000000005//g' | sed 's/69999999995/7/g'` [ "$result" = "3.666667|2.333333|1.666667|1.4,0.0|0.0|0.5|1.75,0.0|0.0|0.0|1.333333,0.0|0.0|0.0|0.0,0.0|0.0|0.0|0.0,2.666667|3.333333|2.0|2.666667,2.0|2.0|3.333333|3.0,2.5|2.0|1.5|2.0,1.0|1.0|1.0|1.0,1.0|1.0|1.0|1.0,1.5|2.0|2.0|1.0,0.0|0.666667|1.0|1.0,0.0|0.666667|1.0|1.0,0.0|0.0|0.0|0.4," ] } diff --git a/pygtftk/plugins/nb_exons.py b/pygtftk/plugins/nb_exons.py index 25d5375b..19500856 100644 --- a/pygtftk/plugins/nb_exons.py +++ b/pygtftk/plugins/nb_exons.py @@ -1,5 +1,4 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os @@ -7,7 +6,7 @@ from builtins import str from collections import defaultdict -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -29,19 +28,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="TXT/GTF", - type=FileWithExtension('w', - valid_extensions=('\.[Gg][Tt][Ff]$', - '\.[Tt][Xx][Tt]', - '\.[Cc][Ss][Vv]', - '\.[Tt][Aa][Bb]', - '\.[Tt][Ss][Vv]'))) + type=arg_formatter.gtf_or_txt_rw('w')) parser_grp.add_argument('-f', '--text-format', help="Return a text format.", @@ -59,11 +52,8 @@ def make_parser(): def nb_exons(inputfile=None, outputfile=None, - tmp_dir=None, key_name=None, - text_format=False, - logger_file=None, - verbosity=0): + text_format=False): """ Count the number of exons in the gtf file. """ diff --git a/pygtftk/plugins/nb_transcripts.py b/pygtftk/plugins/nb_transcripts.py index 97794325..7d6a3315 100644 --- a/pygtftk/plugins/nb_transcripts.py +++ b/pygtftk/plugins/nb_transcripts.py @@ -1,13 +1,11 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os import sys from builtins import str -from collections import OrderedDict -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -29,19 +27,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF/TXT", - type=FileWithExtension('w', - valid_extensions=('(\.[Gg][Tt][Ff])$', - '\.[Tt][Xx][Tt]$', - '\.[Cc][Ss][Vv]$', - '\.[Tt][Aa][Bb]$', - '\.[Tt][Ss][Vv]$'))) + type=arg_formatter.gtf_or_txt_rw('w')) parser_grp.add_argument('-f', '--text-format', help="Return a text format.", @@ -59,17 +51,13 @@ def make_parser(): def nb_transcripts(inputfile=None, outputfile=None, - tmp_dir=None, text_format=False, - key_name="", - logger_file=None, - verbosity=0): + key_name=""): """ Compute the number of transcript per gene. """ gtf = GTF(inputfile) - n_tx = OrderedDict() message("Computing the number of transcript per gene in input GTF file.") diff --git a/pygtftk/plugins/overlapping.py b/pygtftk/plugins/overlapping.py index b2d9a595..d432cef9 100644 --- a/pygtftk/plugins/overlapping.py +++ b/pygtftk/plugins/overlapping.py @@ -1,6 +1,4 @@ #!/usr/bin/env python -from __future__ import division -from __future__ import print_function import argparse import os @@ -8,11 +6,10 @@ from builtins import str from collections import defaultdict -from pygtftk.arg_formatter import FileWithExtension -from pygtftk.arg_formatter import checkChromFile +from pygtftk import arg_formatter +from pygtftk.arg_formatter import CheckChromFile from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF -from pygtftk.utils import chrom_info_as_dict from pygtftk.utils import close_properly from pygtftk.utils import make_tmp_file from pygtftk.utils import message @@ -40,15 +37,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser_grp.add_argument('-c', '--chrom-info', help="Chromosome information. A tabulated two-columns" @@ -56,7 +51,7 @@ def make_parser(): " column 2", default=None, metavar="CHROMINFO", - action=checkChromFile, + action=CheckChromFile, required=True) parser_grp.add_argument('-u', '--upstream', @@ -122,21 +117,12 @@ def overlapping( same_strandedness=False, diff_strandedness=False, annotate_gtf=False, - tmp_dir=None, - logger_file=None, - invert_match=False, - verbosity=0): + invert_match=False): """ Description: Find transcripts whose body/TSS/TTS do or do not overlap with any transcript from another gene. """ - # ---------------------------------------------------------------------- - # Check chrom file - # ---------------------------------------------------------------------- - - chrom_dict = chrom_info_as_dict(chrom_info) - # ---------------------------------------------------------------------- # Prepare key names # ---------------------------------------------------------------------- diff --git a/pygtftk/plugins/profile.py b/pygtftk/plugins/profile.py index 4db89d88..9075a0e3 100644 --- a/pygtftk/plugins/profile.py +++ b/pygtftk/plugins/profile.py @@ -1,10 +1,10 @@ #!/usr/bin/env python -from __future__ import division import argparse import os import re import shutil +import sys import warnings import zipfile from builtins import range @@ -25,12 +25,11 @@ from plotnine import ggplot from plotnine import xlab from plotnine import ylab +from plotnine.exceptions import PlotnineError -from pygtftk.arg_formatter import FileWithExtension -from pygtftk.arg_formatter import float_greater_than_null -from pygtftk.arg_formatter import float_grt_than_null_and_lwr_than_one -from pygtftk.arg_formatter import int_greater_than_null +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject +from pygtftk.utils import ALL_MPL_PALETTES from pygtftk.utils import GTFtkError from pygtftk.utils import chomp from pygtftk.utils import is_hex_color @@ -45,13 +44,16 @@ """ __notes__ = """ - -- The ranging normalization method [1] implies the following transformation: - -- - (x_i - min(x))/(max(x) - min(x)). -- Think about using normalized bigWig files as input to mk_matrix. This will limit the requirement for an additional normalization step (see Deeptools for a set of useful methods implemented in bamCoverage/bamCompare). """ +''' + -- The ranging normalization method [1] implies the following transformation: + -- - (x_i - min(x))/(max(x) - min(x)). +''' + __references__ = """ -- [1] Numerical Ecology - second Edition - P. Legendre, L. Legendre (1998) Elsevier. """ @@ -68,7 +70,7 @@ def make_parser(): help='A zip file containing a matrix as produced by mk_matrix.', default=None, metavar='MATRIX', - type=FileWithExtension('r', '\.[Zz][Ii][Pp]'), + type=arg_formatter.zip_rw('r'), required=True) parser_grp.add_argument('-o', '--out-dir', @@ -123,13 +125,19 @@ def make_parser(): parser_grp.add_argument('-pw', '--page-width', help='Output pdf file width (e.g. 7 inches).', - type=int_greater_than_null, + type=arg_formatter.ranged_num(lowest=0, + highest=None, + val_type="float", + linc=False), default=None, required=False) parser_grp.add_argument('-ph', '--page-height', help='Output file height (e.g. 5 inches).', - type=int_greater_than_null, + type=arg_formatter.ranged_num(lowest=0, + highest=None, + val_type="float", + linc=False), default=None, required=False) @@ -141,7 +149,10 @@ def make_parser(): parser_grp.add_argument('-lw', '--line-width', help='Line width.', - type=float_greater_than_null, + type=arg_formatter.ranged_num(lowest=0, + highest=None, + val_type="float", + linc=False), default=1.25, required=False) @@ -178,12 +189,10 @@ def make_parser(): parser_grp.add_argument('-fc', '--facet-col', help='Number of facet columns.', default=4, - type=int_greater_than_null, - required=False) - - parser_grp.add_argument('-fo', '--force-tx-class', - help='Force even if some transcripts from --transcript-file were not found.', - action="store_true", + type=arg_formatter.ranged_num(lowest=1, + highest=None, + val_type="int", + linc=True), required=False) parser_grp.add_argument('-w', '--show-group-number', @@ -199,7 +208,10 @@ def make_parser(): parser_grp.add_argument('-ul', '--upper-limit', - type=float_grt_than_null_and_lwr_than_one, + type=arg_formatter.ranged_num(lowest=0, + highest=1, + val_type="float", + linc=False), default=0.95, help='Upper limit based on quantile computed from unique values.', required=False) @@ -224,7 +236,10 @@ def make_parser(): parser_grp.add_argument('-dpi', '--dpi', help='Dpi to use.', - type=int_greater_than_null, + type=arg_formatter.ranged_num(lowest=50, + highest=None, + val_type="int", + linc=True), default=300, required=False) @@ -252,6 +267,10 @@ def make_parser(): default="nipy_spectral", required=False) + parser_grp.add_argument('-l', '--list-bwig', + help='List the bigwig files in the matrix file..', + action="store_true") + return parser @@ -260,11 +279,9 @@ def profile(inputfile=None, group_by='bwig', color_order=None, transcript_file=None, - transform=None, normalization_method=None, to_log=False, upper_limit=0.95, - quantiles=False, profile_colors=None, palette='nipy_spectral', page_width=None, @@ -272,10 +289,8 @@ def profile(inputfile=None, page_height=None, page_format='pdf', user_img_file=None, - tmp_dir=None, facet_col=None, border_color="#BBBBBB", - force_tx_class=False, stat="mean", facet_var=None, x_lab="Selected genomic regions", @@ -285,11 +300,9 @@ def profile(inputfile=None, show_group_number=False, line_width=1, theme_plotnine='bw', + list_bwig=False, confidence_interval=False, - dpi=300, - logger_file=None, - verbosity=False - ): + dpi=300): # ------------------------------------------------------------------------- # # Pandas version is sometimes problematic @@ -385,6 +398,10 @@ def profile(inputfile=None, input_file_chrom.add(chrom) input_file_bwig.add(field[0]) + if list_bwig: + message("Bigwig list: " + ",".join(input_file_bwig), force=True) + sys.exit(0) + # ------------------------------------------------------------------------- # # Parse the header @@ -484,11 +501,11 @@ def profile(inputfile=None, # Select the transcript of interest and add classes info to the data.frame # ------------------------------------------------------------------------- - message("Checking how many genes where found in the transcript list.") + message("Checking how many transcript where found in the transcript list.") nb_retained = len([x for x in all_tx if x in tx_ordering]) - msg = "Keeping {a} transcript out of {b}.".format(a=nb_retained, b=len(all_tx)) + msg = "Keeping {a} transcript out of {b} in input transcript list.".format(a=nb_retained, b=len(all_tx)) message(msg) # subsetting @@ -507,23 +524,7 @@ def profile(inputfile=None, # # ------------------------------------------------------------------------- - all_palettes = ['viridis', 'plasma', 'inferno', 'magma', - 'Greys', 'Purples', 'Blues', 'Greens', 'Oranges', 'Reds', - 'YlOrBr', 'YlOrRd', 'OrRd', 'PuRd', 'RdPu', 'BuPu', - 'GnBu', 'PuBu', 'YlGnBu', 'PuBuGn', 'BuGn', 'YlGn', - 'binary', 'gist_yarg', 'gist_gray', 'gray', 'bone', 'pink', - 'spring', 'summer', 'autumn', 'winter', 'cool', 'Wistia', - 'hot', 'afmhot', 'gist_heat', 'copper', - 'PiYG', 'PRGn', 'BrBG', 'PuOr', 'RdGy', 'RdBu', - 'RdYlBu', 'RdYlGn', 'Spectral', 'coolwarm', 'bwr', 'seismic', - 'Pastel1', 'Pastel2', 'Paired', 'Accent', - 'Dark2', 'Set1', 'Set2', 'Set3', - 'tab10', 'tab20', 'tab20b', 'tab20c', - 'flag', 'prism', 'ocean', 'gist_earth', 'terrain', 'gist_stern', - 'gnuplot', 'gnuplot2', 'CMRmap', 'cubehelix', 'brg', 'hsv', - 'gist_rainbow', 'rainbow', 'jet', 'nipy_spectral', 'gist_ncar'] - - if palette not in all_palettes: + if palette not in ALL_MPL_PALETTES: message("Sorry but the palette is unknown.") def get_list_of_colors_mpl(number, pal=palette): @@ -620,7 +621,7 @@ def get_list_of_colors_mpl(number, pal=palette): if curr_item not in input_file_bwig: message("Color order: Found undefined bigwig labels (" + curr_item + ")... Please Check.", type="WARNING") - message("Use one of :" + ",".join(input_file_bwig) + ".", + message("Use one of : " + ",".join(input_file_bwig) + ".", type="ERROR") elif group_by == 'tx_classes': @@ -649,8 +650,8 @@ def get_list_of_colors_mpl(number, pal=palette): if len(color_order) < len(profile_colors): profile_colors = profile_colors[:len(color_order)] - message("Color order :" + str(color_order), type="DEBUG") - message("Profile color :" + str(profile_colors), type="DEBUG") + message("Color order : " + str(color_order), type="DEBUG") + message("Profile color : " + str(profile_colors), type="DEBUG") # ------------------------------------------------------------------------- # @@ -1218,7 +1219,12 @@ def fxn(): fxn() message("Saving diagram to file : " + img_file.name) message("Be patient. This may be long for large datasets.") - p.save(filename=img_file.name, width=page_width, height=page_height, dpi=dpi, limitsize=False) + try: + p.save(filename=img_file.name, width=page_width, height=page_height, dpi=dpi, limitsize=False) + except PlotnineError as err: + message("Plotnine message: " + err.message) + message("Plotnine encountered an error.", type="ERROR") + dm.to_csv(data_file, sep="\t", header=True, index=False) # Delete temporary dir @@ -1229,7 +1235,7 @@ def fxn(): myparser = make_parser() args = myparser.parse_args() args = dict(args.__dict__) - draw_profile(**args) + profile(**args) else: diff --git a/pygtftk/plugins/random_list.py b/pygtftk/plugins/random_list.py index 73803484..15d23c7c 100644 --- a/pygtftk/plugins/random_list.py +++ b/pygtftk/plugins/random_list.py @@ -1,5 +1,5 @@ #!/usr/bin/env python -from __future__ import print_function + import argparse import os @@ -7,12 +7,9 @@ import sys from builtins import str -from pygtftk.arg_formatter import FileWithExtension -from pygtftk.arg_formatter import int_greater_than_null +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF -from pygtftk.utils import PY2 -from pygtftk.utils import PY3 from pygtftk.utils import close_properly from pygtftk.utils import message @@ -33,21 +30,22 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser_grp.add_argument('-n', '--number', help="The number of transcripts or gene to select.", default=1, metavar="NUMBER", - type=int_greater_than_null, + type=arg_formatter.ranged_num(lowest=1, + highest=None, + linc=True, + val_type='int'), required=False) parser_grp.add_argument('-t', '--ft-type', @@ -60,7 +58,10 @@ def make_parser(): help="Seed value for the random number generator.", default=None, metavar="SEED", - type=int_greater_than_null, + type=arg_formatter.ranged_num(lowest=1, + highest=None, + linc=True, + val_type='int'), required=False) return parser @@ -71,10 +72,7 @@ def random_list( outputfile=None, number=None, ft_type=None, - seed_value=None, - tmp_dir=None, - logger_file=None, - verbosity=0): + seed_value=None): """ Select a random list of genes or transcripts. """ @@ -96,13 +94,7 @@ def random_list( number = len(id_list) if seed_value is not None: - - if PY2: - random.seed(seed_value) - elif PY3: - random.seed(seed_value, version=1) - else: - message("Unknow Python version", type="ERROR") + random.seed(seed_value, version=1) id_list = random.sample(id_list, number) diff --git a/pygtftk/plugins/random_tx.py b/pygtftk/plugins/random_tx.py index 7e772571..7302dc21 100644 --- a/pygtftk/plugins/random_tx.py +++ b/pygtftk/plugins/random_tx.py @@ -1,5 +1,4 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os @@ -7,12 +6,9 @@ import sys from builtins import range -from pygtftk.arg_formatter import FileWithExtension -from pygtftk.arg_formatter import int_greater_than_null +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF -from pygtftk.utils import PY2 -from pygtftk.utils import PY3 from pygtftk.utils import close_properly from pygtftk.utils import message @@ -32,28 +28,32 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser_grp.add_argument('-m', '--max-transcript', help="The maximum number of transcripts to select for each gene.", default=1, metavar="MAX", - type=int_greater_than_null, + type=arg_formatter.ranged_num(lowest=1, + highest=None, + linc=True, + val_type='int'), required=False) parser_grp.add_argument('-s', '--seed-value', help="Seed value for the random number generator.", default=None, metavar="SEED", - type=int_greater_than_null, + type=arg_formatter.ranged_num(lowest=1, + highest=None, + linc=True, + val_type='int'), required=False) return parser @@ -63,10 +63,7 @@ def random_tx( inputfile=None, outputfile=None, max_transcript=None, - seed_value=None, - tmp_dir=None, - logger_file=None, - verbosity=0): + seed_value=None): """ Select randomly up to m transcript for each gene. """ @@ -88,12 +85,7 @@ def random_tx( message("Selecting random transcript") if seed_value is not None: - if PY3: - # Unfortunatly 'version 1' - # is not back-compatible... - random.seed(seed_value, version=1) - elif PY2: - random.seed(seed_value) + random.seed(seed_value, version=1) tx_to_delete = [] @@ -108,11 +100,11 @@ def random_tx( message("Printing results") message("Selecting transcript.") - gtf = gtf.select_by_key("transcript_id", - ",".join(tx_to_delete), - invert_match=True - ).write(outputfile, - gc_off=True) + gtf.select_by_key("transcript_id", + ",".join(tx_to_delete), + invert_match=True + ).write(outputfile, + gc_off=True) close_properly(outputfile, inputfile) diff --git a/pygtftk/plugins/retrieve.py b/pygtftk/plugins/retrieve.py index d1076689..60c9ee78 100644 --- a/pygtftk/plugins/retrieve.py +++ b/pygtftk/plugins/retrieve.py @@ -1,5 +1,4 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os @@ -9,7 +8,8 @@ import ftputil from ftputil.error import FTPOSError -from pygtftk.arg_formatter import FileWithExtension +import pygtftk +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import message @@ -36,8 +36,7 @@ def make_parser(): parser_grp.add_argument('-o', '--outputfile', help="Output file (gtf.gz).", metavar="GTF.GZ", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]\.[Gg][Zz]$')) + type=arg_formatter.gtf_rwb('w')) parser_grp.add_argument('-e', '--ensembl-collection', help="Which ensembl collection to interrogate" @@ -85,14 +84,11 @@ def make_parser(): def retrieve(species_name=None, outputfile=None, release='Latest', - tmp_dir=None, to_stdout=False, list_only=False, - logger_file=None, delete=False, hide_species_name=None, - ensembl_collection='vertebrate', - verbosity=0): + ensembl_collection='vertebrate'): """Retrieve a GTF file from ensembl. :Example: @@ -136,7 +132,7 @@ def retrieve(species_name=None, try: ftp = ftputil.FTPHost(host, user, password) - if verbosity: + if pygtftk.utils.VERBOSITY: message("Connected to ensembl FTP website.") except FTPOSError as err: message(str(err)) diff --git a/pygtftk/plugins/rm_dup_tss.py b/pygtftk/plugins/rm_dup_tss.py index faa99ee7..9f468b73 100644 --- a/pygtftk/plugins/rm_dup_tss.py +++ b/pygtftk/plugins/rm_dup_tss.py @@ -11,7 +11,7 @@ from pybedtools import BedTool -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import make_tmp_file @@ -36,24 +36,19 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) return parser def rm_dup_tss(inputfile=None, - outputfile=None, - tmp_dir=None, - logger_file=None, - verbosity=0): + outputfile=None): """If several transcripts of a gene share the same tss, select only one.""" # ---------------------------------------------------------------------- @@ -150,7 +145,7 @@ def main(): #Check no duplicate TSS exists @test "rm_dup_tss_3" { - result=$(gtftk get_example -d simple_05 | gtftk rm_dup_tss | perl -ne 'print if (/(G0001T002)|(G0003T002)|(G0004T002)|(G0006T002)|(G0007T002)|(G0008T002)/)' out_rm.gtf) + result=$(gtftk get_example -d simple_05 | gtftk rm_dup_tss | perl -ne 'print if (/(G0001T002)|(G0003T002)|(G0004T002)|(G0006T002)|(G0007T002)|(G0008T002)/)') [ -z $result ] } @@ -169,7 +164,7 @@ def main(): #Check with rmdup (now 1 tx with the same TSS) @test "rm_dup_tss_6" { - result=$(gtftk get_example -d mini_real | gtftk rm_dup_tss | gtftk select_by_key -t | gtftk get_5p_3p_coords -n gene_name | cut -f2,4 | awk 'BEGIN{n=0};{ if($2=="PCDH15" && $1=="54801290"){n++}}END{print n}') + result=$( gtftk get_example -d mini_real | gtftk rm_dup_tss | gtftk select_by_key -t | gtftk get_5p_3p_coords -n gene_name | cut -f2,4 | awk 'BEGIN{n=0};{ if($2=="PCDH15" && $1=="54801290"){n++}}END{print n}') [ $result -eq 1 ] } diff --git a/pygtftk/plugins/select_by_go.py b/pygtftk/plugins/select_by_go.py index 356f5eb7..f86202e7 100644 --- a/pygtftk/plugins/select_by_go.py +++ b/pygtftk/plugins/select_by_go.py @@ -1,12 +1,11 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os import sys from collections import OrderedDict -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.biomart import Biomart from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF @@ -27,15 +26,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser.add_argument('-g', '--go-id', help='The GO ID (with or without "GO:" prefix).', @@ -92,10 +89,7 @@ def select_by_go(inputfile=None, http_proxy=None, list_datasets=None, species=None, - invert_match=False, - tmp_dir=None, - logger_file=None, - verbosity=0): + invert_match=False): """ Select lines from a GTF file based using a Gene Ontology ID (e.g GO:0050789). """ diff --git a/pygtftk/plugins/select_by_intron_size.py b/pygtftk/plugins/select_by_intron_size.py index 668554b3..06679701 100644 --- a/pygtftk/plugins/select_by_intron_size.py +++ b/pygtftk/plugins/select_by_intron_size.py @@ -1,5 +1,4 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os @@ -8,7 +7,7 @@ from collections import OrderedDict from collections import defaultdict -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -36,15 +35,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser_grp.add_argument('-s', '--intron-size', help="The minimum intron size.", @@ -78,10 +75,7 @@ def select_by_intron_size( merged=False, invert_match=False, delete_monoexonic=False, - add_intron_size=False, - tmp_dir=None, - logger_file=None, - verbosity=0): + add_intron_size=False): """ Select genes which contain an intron of size at least s or whose sum of intron size is at least s """ diff --git a/pygtftk/plugins/select_by_key.py b/pygtftk/plugins/select_by_key.py index e5e12f3a..2cdf537e 100644 --- a/pygtftk/plugins/select_by_key.py +++ b/pygtftk/plugins/select_by_key.py @@ -1,23 +1,24 @@ #!/usr/bin/env python -from __future__ import division -from __future__ import print_function import argparse import os import sys -from pygtftk.arg_formatter import FileWithExtension -from pygtftk.arg_formatter import int_greater_than_null +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly from pygtftk.utils import message __updated__ = "2018-01-31" -__doc__ = """ +__doc__ = ''' Select lines from a GTF file based on attributes and associated values. -""" +''' + +__notes__ = ''' +-- select_by_key only returns lines for which the key is defined (i.e. exists) even with -\-invert-match. +''' def make_parser(): @@ -31,15 +32,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser_grp.add_argument('-k', '--key', help='The key name.', @@ -64,7 +63,10 @@ def make_parser(): help='The column number (one-based) that contains the values in the file. File is tab-delimited.', default=1, metavar="COL", - type=int_greater_than_null, + type=arg_formatter.ranged_num(lowest=1, + highest=None, + linc=True, + val_type='int'), required=False) parser_grp.add_argument('-n', '--invert-match', @@ -126,7 +128,6 @@ def select_by_key(inputfile=None, key=None, value=None, invert_match=False, - tmp_dir=None, file_with_values=None, col=0, select_transcripts=False, @@ -137,9 +138,7 @@ def select_by_key(inputfile=None, bed_format=False, log=False, separator="|", - names="transcript_id", - logger_file=None, - verbosity=0): + names="transcript_id"): """Select lines from a GTF file based on attributes and associated values. """ @@ -168,18 +167,16 @@ def select_by_key(inputfile=None, key = "feature" value = "exon" - elif value is not None and key is None: - message("Please set -k.", - type="ERROR") - - elif value is None and file_with_values is None: - if key is not None: - message("Key and value are mandatory. Alternatively use -e/t/g/f.", + elif file_with_values is None: + if key is None or value is None: + message("Key and value are mandatory. Alternatively use -e/t/g/f or -f with -k.", type="ERROR") elif file_with_values is not None: if key is None: message("Please set -k.", type="ERROR") + if value is not None: + message("The -f and -v arguments are mutually exclusive.", type="ERROR") # ---------------------------------------------------------------------- # Load file with value @@ -309,7 +306,7 @@ def main(): # Select_by_key: Feature selection. --file-with-values -col @test "select_by_key_6" { - result=`gtftk select_by_key -k gene_id -i simple.gtf -f simple.geneList -c 3| wc -l` + result=`rm -f /tmp/test_select_by_key.gtf; gtftk select_by_key -k gene_id -i simple.gtf -f simple.geneList -c 3| wc -l` [ "$result" -eq 18 ] } diff --git a/pygtftk/plugins/select_by_loc.py b/pygtftk/plugins/select_by_loc.py index a220113e..ea7bda00 100644 --- a/pygtftk/plugins/select_by_loc.py +++ b/pygtftk/plugins/select_by_loc.py @@ -1,5 +1,4 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os @@ -10,7 +9,7 @@ from pybedtools.bedtool import BedTool -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -37,15 +36,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser_mut = parser.add_mutually_exclusive_group(required=True) @@ -79,10 +76,7 @@ def select_by_loc(inputfile=None, location=None, ft_type=None, invert_match=False, - tmp_dir=None, - location_file=None, - logger_file=None, - verbosity=0): + location_file=None): """ Select transcripts overlapping a given locations. """ @@ -140,25 +134,25 @@ def select_by_loc(inputfile=None, if not invert_match: - out = gtf.select_by_key(ft_type + '_id', - ",".join(id_list), - invert_match=invert_match).write(outputfile, - gc_off=True) + gtf.select_by_key(ft_type + '_id', + ",".join(id_list), + invert_match=invert_match).write(outputfile, + gc_off=True) else: if ft_type == 'transcript': - out = gtf.select_by_key('transcript_id', - ",".join(id_list), - invert_match=invert_match, - no_na=True - ).write(outputfile, - gc_off=True) + gtf.select_by_key('transcript_id', + ",".join(id_list), + invert_match=invert_match, + no_na=True + ).write(outputfile, + gc_off=True) else: - out = gtf.select_by_key('gene_id', - ",".join(id_list), - invert_match=invert_match - ).write(outputfile, - gc_off=True) + gtf.select_by_key('gene_id', + ",".join(id_list), + invert_match=invert_match + ).write(outputfile, + gc_off=True) close_properly(outputfile, inputfile) diff --git a/pygtftk/plugins/select_by_max_exon_nb.py b/pygtftk/plugins/select_by_max_exon_nb.py index bb6eb806..2a2592da 100644 --- a/pygtftk/plugins/select_by_max_exon_nb.py +++ b/pygtftk/plugins/select_by_max_exon_nb.py @@ -1,18 +1,17 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os import sys -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import message __updated__ = "2018-02-11" __doc__ = """ -For each gene select the transcript with the highest number of exons. +For each gene select the transcript with the highest number of exons. If ties, select the first encountered. """ @@ -24,24 +23,19 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) return parser def select_by_max_exon_nb(inputfile=None, - outputfile=None, - tmp_dir=None, - logger_file=None, - verbosity=0): + outputfile=None): """ Select transcripts based on the number of exons. """ diff --git a/pygtftk/plugins/select_by_nb_exon.py b/pygtftk/plugins/select_by_nb_exon.py index 71941c87..7b148c43 100644 --- a/pygtftk/plugins/select_by_nb_exon.py +++ b/pygtftk/plugins/select_by_nb_exon.py @@ -1,12 +1,11 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os import sys from builtins import str -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -26,15 +25,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser.add_argument('-m', '--min-exon-number', help="Minimum number of exons.", @@ -51,11 +48,7 @@ def make_parser(): def select_by_nb_exon(inputfile=None, outputfile=None, min_exon_number=None, - max_exon_number=None, - tmp_dir=None, - force_gtf=False, - logger_file=None, - verbosity=0): + max_exon_number=None): """ Select transcripts based on the number of exons. """ diff --git a/pygtftk/plugins/select_by_numeric_value.py b/pygtftk/plugins/select_by_numeric_value.py index 8fb14886..1928cd00 100644 --- a/pygtftk/plugins/select_by_numeric_value.py +++ b/pygtftk/plugins/select_by_numeric_value.py @@ -1,11 +1,10 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os import sys -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -29,15 +28,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser.add_argument('-t', '--test', help='The test to be applied.', @@ -57,18 +54,15 @@ def make_parser(): def select_by_numeric_value(inputfile=None, outputfile=None, test=None, - na_omit=None, - tmp_dir=None, - logger_file=None, - verbosity=0): + na_omit=None): """Select lines from a GTF file based on a boolean test on numeric values. """ - gtf = GTF(inputfile, check_ensembl_format=False - ).select_by_numeric_value(test, - na_omit=na_omit, - ).write(outputfile, - gc_off=True) + GTF(inputfile, + check_ensembl_format=False).select_by_numeric_value(test, + na_omit=na_omit, + ).write(outputfile, + gc_off=True) close_properly(outputfile, inputfile) diff --git a/pygtftk/plugins/select_by_regexp.py b/pygtftk/plugins/select_by_regexp.py index 3f21a690..4c6bdc73 100644 --- a/pygtftk/plugins/select_by_regexp.py +++ b/pygtftk/plugins/select_by_regexp.py @@ -1,11 +1,11 @@ #!/usr/bin/env python -from __future__ import print_function + import argparse import os import sys -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -15,6 +15,11 @@ Select lines from a GTF file based on a regexp. """ +__notes__ = """ + -- The default is to try to select feature from conventional human chromosome (chr1..chr22, chrX and chrY) with + -\-key set to chrom and -\-regexp set to "^chr[0-9XY]+$". +""" + def make_parser(): """The program parser.""" @@ -24,28 +29,24 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser.add_argument('-k', '--key', help='The key name', default="chrom", metavar="KEY", - type=str, - required=True) + type=str) parser.add_argument('-r', '--regexp', help='The regular expression.', default="^chr[0-9XY]+$", - type=str, - required=True) + type=str) parser.add_argument('-n', '--invert-match', help='Not/invert match. Selected lines whose requested key ' @@ -59,20 +60,17 @@ def select_by_regexp(inputfile=None, outputfile=None, key=None, regexp=None, - invert_match=False, - tmp_dir=None, - logger_file=None, - verbosity=0): + invert_match=False): """Select lines from a GTF file based on attributes and associated values. """ - gtf = GTF(inputfile, check_ensembl_format=False - ).select_by_regexp(key, - regexp, - invert_match - ).write(outputfile, - gc_off=True) + GTF(inputfile, + check_ensembl_format=False).select_by_regexp(key, + regexp, + invert_match + ).write(outputfile, + gc_off=True) close_properly(outputfile, inputfile) @@ -124,5 +122,6 @@ def main(): fun=os.path.abspath(__file__), group="selection", desc=__doc__, + notes=__notes__, updated=__updated__, test=test) diff --git a/pygtftk/plugins/select_by_tx_size.py b/pygtftk/plugins/select_by_tx_size.py index 344a372b..f14cbd4e 100644 --- a/pygtftk/plugins/select_by_tx_size.py +++ b/pygtftk/plugins/select_by_tx_size.py @@ -1,12 +1,11 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os import sys from builtins import str -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import message @@ -26,15 +25,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser.add_argument('-m', '--min-size', help="Minimum size.", @@ -52,10 +49,7 @@ def make_parser(): def select_by_tx_size(inputfile=None, outputfile=None, min_size=None, - max_size=None, - tmp_dir=None, - logger_file=None, - verbosity=0): + max_size=None): """ Select features by size. """ @@ -65,18 +59,18 @@ def select_by_tx_size(inputfile=None, M=str(max_size)) message(msg) - gtf = GTF(inputfile - ).select_by_transcript_size(min_size, - max_size - ).write(outputfile, - gc_off=True) + GTF(inputfile + ).select_by_transcript_size(min_size, + max_size + ).write(outputfile, + gc_off=True) def main(): myparser = make_parser() args = myparser.parse_args() args = dict(args.__dict__) - select_by_transcript_size(**args) + select_by_tx_size(**args) if __name__ == '__main__': diff --git a/pygtftk/plugins/select_most_5p_tx.py b/pygtftk/plugins/select_most_5p_tx.py index 94a587ab..413d23d6 100644 --- a/pygtftk/plugins/select_most_5p_tx.py +++ b/pygtftk/plugins/select_most_5p_tx.py @@ -1,11 +1,11 @@ #!/usr/bin/env python -from __future__ import print_function + import argparse import os import sys -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import message @@ -30,15 +30,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser.add_argument('-g', '--keep-gene-lines', help="Add gene lines to the output", @@ -48,10 +46,7 @@ def make_parser(): def select_most_5p_tx(inputfile=None, outputfile=None, - keep_gene_lines=False, - tmp_dir=None, - logger_file=None, - verbosity=0): + keep_gene_lines=False): """ Select the most 5' transcript of each gene. """ diff --git a/pygtftk/plugins/seqid_list.py b/pygtftk/plugins/seqid_list.py index 5cf8d7b1..d8826ebe 100644 --- a/pygtftk/plugins/seqid_list.py +++ b/pygtftk/plugins/seqid_list.py @@ -1,12 +1,11 @@ #!/usr/bin/env python -from __future__ import print_function import argparse import os import sys from builtins import str -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -27,18 +26,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="TXT", - type=FileWithExtension('w', - valid_extensions=('\.[Tt][Xx][Tt]', - '\.[Cc][Ss][Vv]', - '\.[Tt][Aa][Bb]', - '\.[Tt][Ss][Vv]'))) + type=arg_formatter.txt_rw('w')) parser_grp.add_argument('-s', '--separator', help="The separator to be used for separating key names.", @@ -52,10 +46,7 @@ def make_parser(): def seqid_list( inputfile=None, outputfile=None, - tmp_dir=None, - separator="", - logger_file=None, - verbosity=0): + separator=""): """ Select the seqid/chromosomes. """ @@ -71,7 +62,7 @@ def main(): myparser = make_parser() args = myparser.parse_args() args = dict(args.__dict__) - count(**args) + seqid_list(**args) if __name__ == '__main__': diff --git a/pygtftk/plugins/shift.py b/pygtftk/plugins/shift.py index d06fd65d..7b426af3 100644 --- a/pygtftk/plugins/shift.py +++ b/pygtftk/plugins/shift.py @@ -1,12 +1,10 @@ #!/usr/bin/env python -from __future__ import print_function - import argparse import os import sys -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.arg_formatter import chromFileAsDict from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF @@ -17,6 +15,7 @@ __doc__ = """ Transpose coordinates in 3' or 5' direction. """ + __notes__ = """ -- By default shift is not strand specific. Meaning that if -\shift-value is set to 10, all coordinates will be moved 10 bases in 5' direction relative to the forward/watson/plus/top strand. -- Use a negative value to shift in 3' direction, a positive value to shift in 5' direction. @@ -36,15 +35,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions='\.[Gg][Tt][Ff]$')) + type=arg_formatter.gtf_rw('w')) parser_grp.add_argument('-s', '--shift-value', help="Shift coordinate by s nucleotides.", @@ -75,12 +72,9 @@ def make_parser(): def shift(inputfile=None, outputfile=None, shift_value=None, - tmp_dir=None, chrom_info=None, stranded=False, - allow_outside=False, - logger_file=None, - verbosity=0): + allow_outside=False): """Shift coordinates in 3' or 5' direction. """ diff --git a/pygtftk/plugins/short_long.py b/pygtftk/plugins/short_long.py index 2cd9445f..67918dc3 100644 --- a/pygtftk/plugins/short_long.py +++ b/pygtftk/plugins/short_long.py @@ -1,16 +1,14 @@ # -*- coding: utf-8 -*- -from __future__ import print_function + """ Select the shortest mature transcript (i.e without introns) for each gene or the longest if the \ -l arguments is used. """ -import os - -__updated__ = "2018-01-25" import argparse +import os import sys -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF @@ -31,15 +29,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions=('\.[Gg][Tt][Ff](\.[Gg][Zz])?$'))) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="GTF", - type=FileWithExtension('w', - valid_extensions=('\.[Gg][Tt][Ff]$'))) + type=arg_formatter.gtf_rw('w')) parser_grp.add_argument('-l', '--longs', help="Take the longest transcript of each gene", @@ -55,10 +51,7 @@ def make_parser(): def short_long(inputfile=None, outputfile=None, longs=None, - keep_gene_lines=False, - tmp_dir=None, - logger_file=None, - verbosity=0): + keep_gene_lines=False): """ Select the shortest transcript for each gene, Or the longuest if the \ -l arguments is used. """ diff --git a/pygtftk/plugins/splicing_site.py b/pygtftk/plugins/splicing_site.py index 01ff23d8..1611af0d 100644 --- a/pygtftk/plugins/splicing_site.py +++ b/pygtftk/plugins/splicing_site.py @@ -1,21 +1,23 @@ #!/usr/bin/env python -from __future__ import print_function + import argparse import os import sys from builtins import str -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly from pygtftk.utils import message __updated__ = "2018-01-20" + __doc__ = """ Compute the locations of donor and acceptor splice sites. """ + __notes__ = """ This will return a single position which corresponds to the most 5' and/or the most 3' intronic region. If the gtf file does not contain exon numbering you can compute it using the add_exon_nb command. @@ -33,16 +35,13 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$') - ) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="BED", - type=FileWithExtension('w', - valid_extensions='\.[bB][eE][dD]$') + type=arg_formatter.bed_rw('w') ) parser_grp.add_argument('-k', '--exon-numbering-key', @@ -68,10 +67,7 @@ def splicing_site(inputfile=None, outputfile=None, exon_numbering_key=False, names="exon_id,transcript_id,gene_id", - separator="\t", - tmp_dir=None, - logger_file=None, - verbosity=0): + separator="\t"): """ Compute the locations of splice donor are acceptor sites. You may extend them in 3' and 5' depending on your needs. """ diff --git a/pygtftk/plugins/tabulate.py b/pygtftk/plugins/tabulate.py index 03386235..04ff40d6 100644 --- a/pygtftk/plugins/tabulate.py +++ b/pygtftk/plugins/tabulate.py @@ -1,13 +1,10 @@ #!/usr/bin/env python -from __future__ import print_function - import argparse -import errno import os import sys -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly @@ -15,9 +12,11 @@ from pygtftk.utils import write_properly __updated__ = "2018-01-20" + __doc__ = """ Convert a GTF to tabulated format. """ + __notes__ = """ -- Warning: by default tabulate will discard any line for which one of the selected key is not defined. Use -x (-\-accept-undef) to print them. -- To refer to default keys use: seqid,source,feature,start,end,frame,gene_id... @@ -37,18 +36,14 @@ def make_parser(): help="Path to the GTF file. Default to STDIN", default=sys.stdin, metavar="GTF", - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="TXT", - type=FileWithExtension('w', - valid_extensions=('\.[Tt][Xx][Tt]', - '\.[Cc][Ss][Vv]', - '\.[Tt][Aa][Bb]', - '\.[Tt][Ss][Vv]'))) + type=arg_formatter.txt_rw('w')) + parser_grp.add_argument('-s', '--separator', help="The output field separator.", default="\t", @@ -114,7 +109,6 @@ def make_parser(): def tabulate(inputfile=None, outputfile=None, key=None, - tmp_dir=None, no_unset=False, unique=False, no_basic=False, @@ -124,9 +118,7 @@ def tabulate(inputfile=None, select_transcript_ids=False, select_exon_ids=False, separator="\t", - logger_file=None, - no_header=False, - verbosity=0): + no_header=False): """Convert a GTF to tabulated format. """ @@ -229,9 +221,14 @@ def tabulate(inputfile=None, if t not in printed: i.write(outputfile, separator) printed[t] = 1 - except IOError as e: - if e.errno == errno.EPIPE: - message("Received a boken pipe signal", type="WARNING") + + except (BrokenPipeError, IOError): + def _void_f(*args, **kwargs): + pass + + message("Received a boken pipe signal", type="WARNING") + sys.stdout.write = _void_f + sys.stdout.flush = _void_f close_properly(outputfile, inputfile) diff --git a/pygtftk/plugins/tss_dist.py b/pygtftk/plugins/tss_dist.py index c0bcdbb9..e0999e69 100644 --- a/pygtftk/plugins/tss_dist.py +++ b/pygtftk/plugins/tss_dist.py @@ -1,21 +1,21 @@ #!/usr/bin/env python -from __future__ import print_function + import argparse -import errno import os import sys from builtins import range from builtins import str from collections import defaultdict -from pygtftk.arg_formatter import FileWithExtension +from pygtftk import arg_formatter from pygtftk.cmd_object import CmdObject from pygtftk.gtf_interface import GTF from pygtftk.utils import close_properly from pygtftk.utils import message __updated__ = "2018-01-20" + __doc__ = """ Computes the distance between TSSs of pairs of gene transcripts. """ @@ -38,29 +38,20 @@ def make_parser(): default=sys.stdin, metavar="GTF", required=False, - type=FileWithExtension('r', - valid_extensions='\.[Gg][Tt][Ff](\.[Gg][Zz])?$')) + type=arg_formatter.gtf_rwb('r')) parser_grp.add_argument('-o', '--outputfile', help="Output file.", default=sys.stdout, metavar="TXT", - type=FileWithExtension('w', - valid_extensions=('\.[Tt][Xx][Tt]', - '\.[Cc][Ss][Vv]', - '\.[Tt][Aa][Bb]', - '\.[Tt][Ss][Vv]', - '\.[Cc][Oo][Vv]'))) + type=arg_formatter.txt_rw('w')) return parser def tss_dist( inputfile=None, - outputfile=None, - tmp_dir=None, - logger_file=None, - verbosity=0): + outputfile=None): """ Computes the distance between TSS of gene transcripts. """ @@ -112,9 +103,15 @@ def tss_dist( str(tss_2), str(tss_1)]) + "\n" outputfile.write(str_out) - except IOError as e: - if e.errno == errno.EPIPE: - message("Received a boken pipe signal", type="WARNING") + + + except (BrokenPipeError, IOError): + def _void_f(*args, **kwargs): + pass + + message("Received a boken pipe signal", type="WARNING") + sys.stdout.write = _void_f + sys.stdout.flush = _void_f close_properly(outputfile, inputfile) @@ -149,6 +146,21 @@ def main(): result=`gtftk get_example -d mini_real | gtftk tss_dist | grep ENSG00000097007 | cut -f4 | perl -npe 's/\\n/,/' ` [ "$result" = "121120,121086,34," ] } + + @test "tss_dist_4" { + result=`gtftk get_example -d simple_03 | gtftk tss_dist | grep G0002T002| cut -f 4 ` + [ "$result" -eq 5 ] + } + + @test "tss_dist_4" { + result=`gtftk get_example -d simple_03 | gtftk tss_dist | grep G0011T001| cut -f 4 ` + [ "$result" -eq 13 ] + } + + @test "tss_dist_5" { + result=`gtftk get_example -d simple_06 | gtftk tss_dist | md5sum-lite | perl -npe 's/\\s.*//'` + [ "$result" = "8ed7258ed14b5cb518332b1f29d31e5e" ] + } """ diff --git a/pygtftk/settings.py b/pygtftk/settings.py index 983c24bc..3453ca61 100644 --- a/pygtftk/settings.py +++ b/pygtftk/settings.py @@ -26,49 +26,3 @@ def get_completion_script(): prg_list = pygtftk.cmd_manager.CmdManager.cmd_obj_list.keys() prg_str = " ".join(sorted(prg_list)) return COMPLETION_SCRIPT.format(p=prg_str) - - -""" -#--------------------------------------------------------------- -# The list of accepted features -#--------------------------------------------------------------- - -GTF_ACCEPTED_FEATURE_LIST = ["gene", "transcript", "exon", "CDS", - "five_prime_utr", "three_prime_utr", - "start_codon", "stop_codon"] - -GTF_ACCEPTED_FEATURE_CS = ['"{}"'.format(x) for x in GTF_ACCEPTED_FEATURE_LIST] -GTF_ACCEPTED_FEATURE_CS = ",".join(GTF_ACCEPTED_FEATURE_CS) - - -#--------------------------------------------------------------- -# File Format definition (~/.gtftk.ffd) -#--------------------------------------------------------------- - -FILE_FORMAT_DEF = ## gtftk file format definition file -## >format_name file_extension number_of_columns -## COLUMN name type values default_value typed_default_value mandatory -## KEY key source destinations - ->GTF gtf 9 -COLUMN seqid S * "." "." true -COLUMN source S * "." "." true -COLUMN feature S {a} "." "." true -COLUMN start I * "." -1 true -COLUMN end I * "." -1 true -COLUMN score F * "." -1.0 false -COLUMN strand C "+","-" "." "." false -COLUMN phase I 0,1,2 "." -1 false -COLUMN attributes A * "." "." false -KEY attributes("gene_id") feature("gene") feature("transcript"),feature("CDS"),feature("exon"),feature("start_codon"),feature("stop_codon"),feature("five_prime_utr"),feature("three_prime_utr") -KEY attributes("transcript_id") feature("transcript") feature("CDS"),feature("exon"),feature("start_codon"),feature("stop_codon"),feature("five_prime_utr"),feature("three_prime_utr") -KEY attributes("ccds_id") feature("CDS") feature("exon"),feature("start_codon"),feature("stop_codon"),feature("five_prime_utr"),feature("three_prime_utr") - ->GFF3 gff3 9 -COLUMN seqid S * "." true -COLUMN source S * "." true -COLUMN type S * "." true -COLUMN start I * "." true -COLUMN end I * "." true -.format(a=GTF_ACCEPTED_FEATURE_CS) -""" diff --git a/pygtftk/src/libgtftk/command/get_sequences.c b/pygtftk/src/libgtftk/command/get_sequences.c index 92476232..fd6bb345 100644 --- a/pygtftk/src/libgtftk/command/get_sequences.c +++ b/pygtftk/src/libgtftk/command/get_sequences.c @@ -84,7 +84,7 @@ void get_chunk(char *ret, FILE *fasta_file, long seqpos, int L, int N, int p, ch fseek(fasta_file, -1, SEEK_CUR); reste_row_file = L; } - } while (reste_row & !eof); + } while (reste_row && !eof); } } diff --git a/pygtftk/src/libgtftk/config.h b/pygtftk/src/libgtftk/config.h new file mode 100644 index 00000000..11d97a72 --- /dev/null +++ b/pygtftk/src/libgtftk/config.h @@ -0,0 +1,98 @@ +/* config.h. Generated from config.h.in by configure. */ +/* config.h.in. Generated from configure.ac by autoheader. */ + +/* Define to 1 if you have the header file. */ +#define HAVE_DLFCN_H 1 + +/* Define to 1 if you have the header file. */ +#define HAVE_INTTYPES_H 1 + +/* Define to 1 if you have the header file. */ +#define HAVE_LIMITS_H 1 + +/* Define to 1 if your system has a GNU libc compatible `malloc' function, and + to 0 otherwise. */ +#define HAVE_MALLOC 1 + +/* Define to 1 if you have the header file. */ +#define HAVE_MEMORY_H 1 + +/* Define to 1 if you have the `mkdir' function. */ +#define HAVE_MKDIR 1 + +/* Define to 1 if your system has a GNU libc compatible `realloc' function, + and to 0 otherwise. */ +#define HAVE_REALLOC 1 + +/* Define to 1 if you have the header file. */ +#define HAVE_STDINT_H 1 + +/* Define to 1 if you have the header file. */ +#define HAVE_STDLIB_H 1 + +/* Define to 1 if you have the `strchr' function. */ +#define HAVE_STRCHR 1 + +/* Define to 1 if you have the `strdup' function. */ +#define HAVE_STRDUP 1 + +/* Define to 1 if you have the header file. */ +#define HAVE_STRINGS_H 1 + +/* Define to 1 if you have the header file. */ +#define HAVE_STRING_H 1 + +/* Define to 1 if you have the `strrchr' function. */ +#define HAVE_STRRCHR 1 + +/* Define to 1 if you have the `strstr' function. */ +#define HAVE_STRSTR 1 + +/* Define to 1 if you have the header file. */ +#define HAVE_SYS_STAT_H 1 + +/* Define to 1 if you have the header file. */ +#define HAVE_SYS_TYPES_H 1 + +/* Define to 1 if you have the header file. */ +#define HAVE_UNISTD_H 1 + +/* Define to the sub-directory in which libtool stores uninstalled libraries. + */ +#define LT_OBJDIR ".libs/" + +/* Name of package */ +#define PACKAGE "libgtftk" + +/* Define to the address where bug reports for this package should be sent. */ +#define PACKAGE_BUGREPORT "fabrice.lopez@inserm.fr" + +/* Define to the full name of this package. */ +#define PACKAGE_NAME "libgtftk" + +/* Define to the full name and version of this package. */ +#define PACKAGE_STRING "libgtftk 0.9.3" + +/* Define to the one symbol short name of this package. */ +#define PACKAGE_TARNAME "libgtftk" + +/* Define to the home page for this package. */ +#define PACKAGE_URL "" + +/* Define to the version of this package. */ +#define PACKAGE_VERSION "0.9.3" + +/* Define to 1 if you have the ANSI C header files. */ +#define STDC_HEADERS 1 + +/* Version number of package */ +#define VERSION "0.9.3" + +/* Define to rpl_malloc if the replacement function should be used. */ +/* #undef malloc */ + +/* Define to rpl_realloc if the replacement function should be used. */ +/* #undef realloc */ + +/* Define to `unsigned int' if does not define. */ +/* #undef size_t */ diff --git a/pygtftk/utils.py b/pygtftk/utils.py index d6b0c049..fe13bb3b 100644 --- a/pygtftk/utils.py +++ b/pygtftk/utils.py @@ -5,12 +5,16 @@ import datetime import glob +import io import os import random import re import string import sys import time +from builtins import range +from builtins import str +from builtins import zip from collections import defaultdict from distutils.spawn import find_executable from subprocess import PIPE @@ -21,18 +25,6 @@ import pygtftk -# ------------------------------------------------------------------------- -# Python Version -# ------------------------------------------------------------------------- - - -PY3 = sys.version_info[0] == 3 -PY2 = sys.version_info[0] == 2 -if PY3: - from builtins import range - from builtins import str - from builtins import zip - # ------------------------------------------------------------------------- # VARIABLES # ------------------------------------------------------------------------- @@ -60,24 +52,6 @@ TAB = '\t' NEWLINE = '\n' -# R libraries -R_LIB = defaultdict(list) - -# --------------------------------------------------------------- -# Python2/3 compatibility -# --------------------------------------------------------------- - - -try: - basestring -except NameError: - basestring = str - -if PY3: - from io import IOBase - - file = IOBase - # --------------------------------------------------------------- # Error class @@ -305,7 +279,7 @@ def add_prefix_to_file(infile, prefix=None): if prefix is None: return infile - if isinstance(infile, file): + if isinstance(infile, io.IOBase): new_file = infile.name else: new_file = infile @@ -313,7 +287,7 @@ def add_prefix_to_file(infile, prefix=None): new_file = os.path.join(os.path.dirname(new_file), prefix + os.path.basename(new_file)) - if isinstance(infile, file): + if isinstance(infile, io.IOBase): return open(new_file, "w") else: return new_file @@ -438,7 +412,6 @@ def check_file_or_dir_exists(file_or_dir=None): """Check if a file/directory or a list of files/directories exist. Raise error if a file is not found. :param file_or_dir: file object or a list of file object. - :param is_list: Is file_or_dir a list ? :Example: @@ -449,18 +422,17 @@ def check_file_or_dir_exists(file_or_dir=None): """ - test_list = [] - # Convert to a list if not isinstance(file_or_dir, list): file_or_dir = [file_or_dir] # Convert to filename - file_or_dir = [x.name if isinstance(x, file) else x for x in file_or_dir] + file_or_dir = [x.name if isinstance(x, io.IOBase) else x for x in file_or_dir] for file_or_dir_cur in file_or_dir: + if not os.path.exists(file_or_dir_cur): - raise GTFtkError("File not found: " + file_or_dir_cur) + message("File not found: " + file_or_dir_cur, type="ERROR") else: message("Found file " + file_or_dir_cur) @@ -573,27 +545,19 @@ def chrom_info_to_bed_file(chrom_file, chr_list=None): >>> from pygtftk.utils import chrom_info_to_bed_file >>> from pygtftk.utils import get_example_file - >>> from pygtftk.utils import PY3 - >>> from pygtftk.utils import PY2 >>> from pybedtools import BedTool >>> a = get_example_file(ext='chromInfo') >>> b = chrom_info_to_bed_file(open(a[0], 'r')) >>> c = BedTool(b.name) >>> d = c.__iter__() >>> i = next(d) - >>> if PY2: assert str(i.chrom) == 'chr2' - >>> if PY2: assert i.start == 0 - >>> if PY2: assert i.end == 600 - >>> if PY3: assert str(i.chrom) == 'chr1' - >>> if PY3: assert i.start == 0 - >>> if PY3: assert i.end == 300 + >>> assert str(i.chrom) == 'chr1' + >>> assert i.start == 0 + >>> assert i.end == 300 >>> i = next(d) - >>> if PY3: assert str(i.chrom) == 'chr2' - >>> if PY3: assert i.start == 0 - >>> if PY3: assert i.end == 600 - >>> if PY2: assert str(i.chrom) == 'chr1' - >>> if PY2: assert i.start == 0 - >>> if PY2: assert i.end == 300 + >>> assert str(i.chrom) == 'chr2' + >>> assert i.start == 0 + >>> assert i.end == 600 """ message("Converting chrom info to bed format") @@ -719,7 +683,7 @@ def silentremove(filename): >>> assert not os.path.exists(a.name) """ - if isinstance(filename, file): + if isinstance(filename, io.IOBase): filename = filename.name try: @@ -741,7 +705,12 @@ def message(msg, nl=True, type="INFO", force=False): """ now = datetime.datetime.now() - ho_min = str(now.hour) + ":" + str(now.minute).zfill(2) + + if pygtftk.utils.VERBOSITY > 2: + ho_min = str(now.hour) + ":" + str(now.minute).zfill(2) + ":" + str(now.second).zfill(2) + else: + ho_min = str(now.hour) + ":" + str(now.minute).zfill(2) + do_it = False if type not in ["INFO", "ERROR", "WARNING", "DEBUG", "DEBUG_MEM"]: @@ -831,22 +800,6 @@ def message(msg, nl=True, type="INFO", force=False): pygtftk.utils.VERBOSITY = VERBOSITY_BACK -# --------------------------------------------------------------- -# Line type -# --------------------------------------------------------------- - -def add_r_lib(cmd=None, libs=None): - """Declare a new set of required R libraries. - - :param libs: Comma separated list of R libraries. - :param cmd: The target command. - - """ - - for lib in libs.split(","): - R_LIB[cmd] += [lib] - - # --------------------------------------------------------------- # Line type # --------------------------------------------------------------- @@ -924,7 +877,7 @@ def to_alphanum(string): are found at the beginning or end of the string, they are deleted. :param string: A character string in which non alphanumeric char have to be replaced. - :param replacement_list: + :Example : @@ -956,7 +909,7 @@ def left_strip_str(string): for pos, line in enumerate(string.split("\n")): if line == "": - if new_line == []: + if not new_line: continue line = " " + re.sub("^\s+", "", line) new_line += [line.lstrip("\n")] @@ -968,11 +921,19 @@ def left_strip_str(string): # Lists and dicts # --------------------------------------------------------------- +def nested_dict(n, type): + """"http://stackoverflow.com/questions/29348345""" + if n == 1: + return defaultdict(type) + else: + return defaultdict(lambda: nested_dict(n - 1, type)) -def flatten_list(x, outlist=[]): + +def flatten_list(x, outlist=None): """Flatten a list of lists. :param x: a list or list of list. + :param outlist: The output list. :Example: @@ -988,6 +949,9 @@ def flatten_list(x, outlist=[]): """ + if outlist is None: + outlist = [] + if not isinstance(x, (list, tuple)): outlist += [x] else: @@ -1004,16 +968,16 @@ def flatten_list_recur(a_list, sep=" "): """ - def _iterFlatten(root): + def _iter_flatten(root): if isinstance(root, (list, tuple)): for element in root: - for e in _iterFlatten(element): + for e in _iter_flatten(element): yield e else: yield root - return sep.join(list(_iterFlatten(a_list))) + return sep.join(list(_iter_flatten(a_list))) def sort_2_lists(list1, list2): @@ -1047,7 +1011,10 @@ def print_table(table): for i, x in enumerate(line)) + " |") -def call_nested_dict_from_list(data, args=[]): +def call_nested_dict_from_list(data, args=None): + if args is None: + args = [] + if args and data: element = args[0] if element: @@ -1174,3 +1141,25 @@ def check_r_packages(r_pkg_list=None, no_error=True): type="ERROR") return False return True + + +# --------------------------------------------------------------- +# COLORS +# --------------------------------------------------------------- + + +ALL_MPL_PALETTES = ['viridis', 'plasma', 'inferno', 'magma', + 'Greys', 'Purples', 'Blues', 'Greens', 'Oranges', 'Reds', + 'YlOrBr', 'YlOrRd', 'OrRd', 'PuRd', 'RdPu', 'BuPu', + 'GnBu', 'PuBu', 'YlGnBu', 'PuBuGn', 'BuGn', 'YlGn', + 'binary', 'gist_yarg', 'gist_gray', 'gray', 'bone', 'pink', + 'spring', 'summer', 'autumn', 'winter', 'cool', 'Wistia', + 'hot', 'afmhot', 'gist_heat', 'copper', + 'PiYG', 'PRGn', 'BrBG', 'PuOr', 'RdGy', 'RdBu', + 'RdYlBu', 'RdYlGn', 'Spectral', 'coolwarm', 'bwr', 'seismic', + 'Pastel1', 'Pastel2', 'Paired', 'Accent', + 'Dark2', 'Set1', 'Set2', 'Set3', + 'tab10', 'tab20', 'tab20b', 'tab20c', + 'flag', 'prism', 'ocean', 'gist_earth', 'terrain', 'gist_stern', + 'gnuplot', 'gnuplot2', 'CMRmap', 'cubehelix', 'brg', 'hsv', + 'gist_rainbow', 'rainbow', 'jet', 'nipy_spectral', 'gist_ncar'] diff --git a/pygtftk/version.py b/pygtftk/version.py index 662ca3ac..a19242b5 100644 --- a/pygtftk/version.py +++ b/pygtftk/version.py @@ -1,2 +1,2 @@ -__base_version__='0.9.8' -__version__='0.9.8' +__base_version__='0.9.9' +__version__='0.9.9' diff --git a/requirements.txt b/requirements.txt index e6f8580a..ffae6aa0 100644 --- a/requirements.txt +++ b/requirements.txt @@ -1,4 +1,5 @@ scipy >=1.1.0 +numpy >=1.15.3 pybedtools >=0.7.8 pyyaml >=3.12 requests >=2.13.0 diff --git a/setup.cfg b/setup.cfg index eff29e6e..b54fe92a 100644 --- a/setup.cfg +++ b/setup.cfg @@ -1,6 +1,6 @@ [metadata] name = pygtftk -version = 0.9.8 +version = 0.9.9 author = D. Puthier and F. Lopez author-email = denis.puthier@univ-amu.fr diff --git a/setup.py b/setup.py index 04133d88..8d4746d7 100644 --- a/setup.py +++ b/setup.py @@ -34,7 +34,6 @@ # ------------------------------------------------------------------------- -PY3 = sys.version_info[0] == 3 PY2 = sys.version_info[0] == 2 if PY2: @@ -221,7 +220,9 @@ 'pygtftk/data/simple_03', 'pygtftk/data/simple_04', 'pygtftk/data/simple_05', + 'pygtftk/data/simple_06', 'pygtftk/data/mini_real', + 'pygtftk/data/mini_real_10M', 'pygtftk/data/mini_real_noov_rnd_tx', 'pygtftk/data/control_list', 'pygtftk/src/', @@ -233,7 +234,9 @@ 'pygtftk/data/simple_03': ['*.*'], 'pygtftk/data/simple_04': ['*.*'], 'pygtftk/data/simple_05': ['*.*'], + 'pygtftk/data/simple_06': ['*.*'], 'pygtftk/data/mini_real': ['*.*'], + 'pygtftk/data/mini_real_10M': ['*.*'], 'pygtftk/data/mini_real_noov_rnd_tx': ['*.*'], 'pygtftk/data/control_list': ['*.*'], 'pygtftk/plugins': ['*.*'], @@ -248,10 +251,9 @@ classifiers=__classifiers__, long_description=long_description, extras_require={ - 'tests': [ + 'dev': [ 'nose', - 'pycodestyle >= 2.1.0'], - 'docs': [ + 'pycodestyle >= 2.1.0', 'sphinx >=1.5.2', 'sphinxcontrib-programoutput >=0.8', 'sphinx_bootstrap_theme >=0.4.9']}, diff --git a/tools/README b/tools/README new file mode 100644 index 00000000..21160737 --- /dev/null +++ b/tools/README @@ -0,0 +1 @@ +These are internal tools that are not supported. \ No newline at end of file diff --git a/tools/fasta/del_dup_ids_fasta.py b/tools/fasta/del_dup_ids_fasta.py new file mode 100644 index 00000000..b4018681 --- /dev/null +++ b/tools/fasta/del_dup_ids_fasta.py @@ -0,0 +1,54 @@ +#!/usr/bin/env python + +import sys +import argparse +from Bio import SeqIO + +__DESC__ = '''If several records share the same ID, print the first encountered, irrespective of the sequence.''' + +def make_parser(): + """The program parser.""" + parser = argparse.ArgumentParser(add_help=True, + description=__DESC__) + + parser_grp = parser.add_argument_group('Arguments') + + parser_grp.add_argument('-i', '--inputfile', + help="Path to the FASTA file. Default to STDIN", + default=sys.stdin, + metavar="FASTA", + type=argparse.FileType('r')) + + parser_grp.add_argument('-o', '--outputfile', + help="Path to the output FASTA file. Default to STDOUT", + default=sys.stdout, + metavar="FASTA", + type=argparse.FileType('w')) + + + return parser + +def get_seq_from_ids(inputfile=None, + outputfile=None): + + + id_printed = set() + + with inputfile as handle: + for rec in SeqIO.parse(handle, "fasta"): + if rec.id not in id_printed: + outputfile.write(">" + rec.id + "\n") + outputfile.write(str(rec.seq) + "\n") + id_printed.add(rec.id) + + +def main(): + """The main function.""" + myparser = make_parser() + args = myparser.parse_args() + args = dict(args.__dict__) + get_seq_from_ids(**args) + + +if __name__ == '__main__': + main() diff --git a/tools/fasta/diff_fasta.py b/tools/fasta/diff_fasta.py new file mode 100644 index 00000000..1887decd --- /dev/null +++ b/tools/fasta/diff_fasta.py @@ -0,0 +1,65 @@ +#!/usr/bin/env python + +import argparse +import sys + +from Bio import SeqIO + +__DESC__ = ''' Compare sequences from two fasta files with records ordered in the same way.''' + + +def make_parser(): + """The program parser.""" + parser = argparse.ArgumentParser(add_help=True, description=__DESC__) + + parser_grp = parser.add_argument_group('Arguments') + + parser_grp.add_argument('-1', '--inputfile-1', + help="Path to the FASTA file.", + default=None, + metavar="FASTA", + type=argparse.FileType('r'), + required=True) + + parser_grp.add_argument('-2', '--inputfile-2', + help="Path to the FASTA file.", + default=None, + metavar="FASTA", + type=argparse.FileType('r'), + required=True) + + parser_grp.add_argument('-o', '--outputfile', + help="Path to the output FASTA file. Default to STDOUT", + default=sys.stdout, + metavar="FASTA", + type=argparse.FileType('w')) + + return parser + + +def get_seq_from_ids(inputfile_1=None, + inputfile_2=None, + outputfile=None): + record_dict_1 = SeqIO.to_dict(SeqIO.parse(inputfile_1.name, "fasta")) + record_dict_2 = SeqIO.to_dict(SeqIO.parse(inputfile_2.name, "fasta")) + + all_key = list(set(list(record_dict_1.keys()) + list(record_dict_2.keys()))) + for i in all_key: + if record_dict_1[i].seq != record_dict_2[i].seq: + outputfile.write("-- " + i + " has not the same sequence in both files...\n") + outputfile.write("->" + record_dict_1[i].seq + "\n") + outputfile.write("->" + record_dict_2[i].seq + "\n") + else: + outputfile.write("-- " + i + " has same sequence\n") + + +def main(): + """The main function.""" + myparser = make_parser() + args = myparser.parse_args() + args = dict(args.__dict__) + get_seq_from_ids(**args) + + +if __name__ == '__main__': + main() diff --git a/tools/fasta/order_fasta.py b/tools/fasta/order_fasta.py new file mode 100644 index 00000000..fda69d76 --- /dev/null +++ b/tools/fasta/order_fasta.py @@ -0,0 +1,62 @@ +#!/usr/bin/env python + +import sys +import argparse +from Bio import SeqIO +from Bio.SeqIO import FastaIO + +__DESC__ = '''Take a FASTA as input and produced a new FASTA file with record +ordered as in --id-file.''' + +def make_parser(): + """The program parser.""" + parser = argparse.ArgumentParser(add_help=True, description=__DESC__) + + parser_grp = parser.add_argument_group('Arguments') + + parser_grp.add_argument('-i', '--inputfile', + help="Path to the FASTA file. Default to STDIN", + default=sys.stdin, + metavar="FASTA", + type=argparse.FileType('r')) + + parser_grp.add_argument('-o', '--outputfile', + help="Path to the output FASTA file. Default to STDOUT", + default=sys.stdout, + metavar="FASTA", + type=argparse.FileType('w')) + + parser_grp.add_argument('-f', '--id-file', + help="The file containing the IDS to be extracted.", + default=None, + metavar="FASTA", + type=argparse.FileType('r'), + required=True) + + return parser + +def get_seq_from_ids(inputfile=None, + outputfile=None, + id_file=None): + + id_list = id_file.readlines() + id_list = [x.replace(">","").rstrip("\n") for x in id_list] + + record_dict = SeqIO.to_dict(SeqIO.parse(inputfile.name, "fasta")) + + fasta_out = FastaIO.FastaWriter(outputfile, wrap=None) + + for i in id_list: + print(">" + record_dict[i].id) + print(record_dict[i].seq) + +def main(): + """The main function.""" + myparser = make_parser() + args = myparser.parse_args() + args = dict(args.__dict__) + get_seq_from_ids(**args) + + +if __name__ == '__main__': + main() diff --git a/tools/fasta/unfold_fasta.py b/tools/fasta/unfold_fasta.py new file mode 100644 index 00000000..29253cac --- /dev/null +++ b/tools/fasta/unfold_fasta.py @@ -0,0 +1,48 @@ +#!/usr/bin/env python + +import argparse +import sys + +from Bio import SeqIO + +__DESC__ = '''Take a FASTA as input and produced a new FASTA file with record +ordered as in --id-file.''' + + +def make_parser(): + """The program parser.""" + parser = argparse.ArgumentParser(add_help=True, description=__DESC__) + + parser_grp = parser.add_argument_group('Arguments') + + parser_grp.add_argument('-i', '--inputfile', + help="Path to the FASTA file. Default to STDIN", + default=sys.stdin, + metavar="FASTA", + type=argparse.FileType('r')) + + parser_grp.add_argument('-o', '--outputfile', + help="Path to the output FASTA file. Default to STDOUT", + default=sys.stdout, + metavar="FASTA", + type=argparse.FileType('w')) + + return parser + + +def unfold(inputfile=None, + outputfile=None): + for rec in SeqIO.parse(inputfile.name, "fasta"): + SeqIO.write(rec, outputfile, "fasta-2line") + + +def main(): + """The main function.""" + myparser = make_parser() + args = myparser.parse_args() + args = dict(args.__dict__) + unfold(**args) + + +if __name__ == '__main__': + main()