Gentoo Archives: gentoo-commits

From: Martin Mokrejs <mmokrejs@×××××××××××××××.cz>
To: gentoo-commits@l.g.o
Subject: [gentoo-commits] proj/sci:master commit in: sci-biology/transdecoder/files/, sci-biology/transdecoder/
Date: Thu, 30 Apr 2015 22:51:21
Message-Id: 1430434236.e667e2f550d570e61afc091a751729fb166d1913.mmokrejs@gentoo
1 commit: e667e2f550d570e61afc091a751729fb166d1913
2 Author: Martin Mokrejš <mmokrejs <AT> fold <DOT> natur <DOT> cuni <DOT> cz>
3 AuthorDate: Thu Apr 30 22:50:36 2015 +0000
4 Commit: Martin Mokrejs <mmokrejs <AT> fold <DOT> natur <DOT> cuni <DOT> cz>
5 CommitDate: Thu Apr 30 22:50:36 2015 +0000
6 URL: https://gitweb.gentoo.org/proj/sci.git/commit/?id=e667e2f5
7
8 sci-biology/TransDecoder: renamed package to keep original letter-casing
9
10 sci-biology/transdecoder/ChangeLog | 54 --------
11 sci-biology/transdecoder/files/TransDecoder.patch | 136 ---------------------
12 .../transdecoder/files/pfam_runner.pl.patch | 20 ---
13 sci-biology/transdecoder/metadata.xml | 9 --
14 sci-biology/transdecoder/transdecoder-2.0.1.ebuild | 69 -----------
15 5 files changed, 288 deletions(-)
16
17 diff --git a/sci-biology/transdecoder/ChangeLog b/sci-biology/transdecoder/ChangeLog
18 deleted file mode 100644
19 index 6fd8f5c..0000000
20 --- a/sci-biology/transdecoder/ChangeLog
21 +++ /dev/null
22 @@ -1,54 +0,0 @@
23 -# ChangeLog for sci-biology/transdecoder
24 -# Copyright 1999-2015 Gentoo Foundation; Distributed under the GPL v2
25 -# $Header: $
26 -
27 - 27 Apr 2015; Martin Mokrejs <mmokrejs@×××××××××××××××.cz>
28 - transdecoder-2.0.1.ebuild:
29 - sci-biology/transdecoder: more ebuild cleanup
30 -
31 - 27 Apr 2015; Martin Mokrejs <mmokrejs@×××××××××××××××.cz>
32 - transdecoder-2.0.1.ebuild:
33 - sci-biology/transdecoder: ebuild cleanup
34 -
35 - 27 Apr 2015; Martin Mokrejs <mmokrejs@×××××××××××××××.cz>
36 - -transdecoder-20140704.ebuild, transdecoder-2.0.1.ebuild:
37 - sci-biology/transdecoder: drop old
38 -
39 - 17 Apr 2015; Martin Mokrejs <mmokrejs@×××××××××××××××.cz>
40 - transdecoder-2.0.1.ebuild, transdecoder-20140704.ebuild:
41 - sci-biology/transdecoder: fixed installation of perl-related files
42 -
43 - 19 Mar 2015; Martin Mokrejs <mmokrejs@×××××××××××××××.cz>
44 - transdecoder-2.0.1.ebuild:
45 - dropped hmmer dependency altogether, added pkg_postinst() with
46 - usage/dependency info
47 -
48 -*transdecoder-2.0.1 (19 Mar 2015)
49 -
50 - 19 Mar 2015; Martin Mokrejs <mmokrejs@×××××××××××××××.cz>
51 - +transdecoder-2.0.1.ebuild, transdecoder-20140704.ebuild:
52 - removing KEYWORDS until the perl files are installed to some other place. At
53 - the moment I get: 'perl-module.eclass: Suspicious environment values found.
54 - PERL5LIB="/usr/lib64/perl5/vendor_perl/5.18.2/TransDecoder"'
55 -
56 - 15 Feb 2015; Martin Mokrejs <mmokrejs@×××××××××××××××.cz>
57 - transdecoder-20140704.ebuild:
58 - drop hmmer-3 dependency, it is an optional dependency only
59 -
60 - 10 Jan 2015; Martin Mokrejs <mmokrejs@×××××××××××××××.cz>
61 - transdecoder-20140704.ebuild:
62 - install *.pm into PERL5LIB/TransDecoder and pass that via env.d
63 -
64 - 09 Jan 2015; Martin Mokrejs <mmokrejs@×××××××××××××××.cz>
65 - +files/TransDecoder.patch, +files/pfam_runner.pl.patch,
66 - transdecoder-20140704.ebuild:
67 - sci-biology/transdecoder: added patches so that we use PATH to loclate
68 - binaries and not in a local subdirectory named 'util', drop sys-
69 - cluster/openmpi requirement, it does not link against it all all, this is a
70 - bunch of perl and shell scripts
71 -
72 -*transdecoder-20140704 (08 Jan 2015)
73 -
74 - 08 Jan 2015; Martin Mokrejs <mmokrejs@×××××××××××××××.cz> +metadata.xml,
75 - +transdecoder-20140704.ebuild:
76 - sci-biology/transdecoder: new package
77
78 diff --git a/sci-biology/transdecoder/files/TransDecoder.patch b/sci-biology/transdecoder/files/TransDecoder.patch
79 deleted file mode 100644
80 index c0cff94..0000000
81 --- a/sci-biology/transdecoder/files/TransDecoder.patch
82 +++ /dev/null
83 @@ -1,136 +0,0 @@
84 ---- /usr/bin/TransDecoder 2015-01-09 11:22:55.000000000 +0100
85 -+++ TransDecoder 2015-01-09 14:31:44.095839522 +0100
86 -@@ -48,7 +48,7 @@
87 - --prepare_pfam Prepare data for PFAM search and then quit (for running PFAM on HPC/computing cluster
88 - with or without MPI )
89 -
90 -- --CPU <int> number of threads to use; (default: 2)
91 -+ --CPU <int> number of threads to use; (default: 1)
92 -
93 - --MPI use MPI w/ execution of hmmscan
94 -
95 -@@ -76,7 +76,7 @@
96 -
97 - =head1 PFAM
98 -
99 --You will need hmmer installed. Use hmmpress to prepare the database for hmmer.
100 -+You will need hmmer installed. Use hmmpress from >=hmmer-3.0 to prepare the database for hmmer.
101 - L<See|https://sourceforge.net/projects/transdecoder/files/Pfam-AB.hmm.bin> for downloading the database.
102 -
103 - =head1 CD-HIT
104 -@@ -105,7 +105,6 @@
105 - use Longest_orf;
106 -
107 - my $UTIL_DIR = "$FindBin::RealBin/util";
108 --$ENV{PATH} = "$UTIL_DIR/bin:$ENV{PATH}";
109 - $ENV{LD_LIBRARY_PATH} .= ":$FindBin::RealBin/util/lib64";
110 -
111 - my ($cd_hit_est_exec) = &check_program('cd-hit-est');
112 -@@ -124,7 +123,7 @@
113 - my $verbose;
114 - my $search_pfam = "";
115 - my ($reuse,$pfam_out);
116 --my $CPU = 2;
117 -+my $CPU = 1;
118 - my $RETAIN_LONG_ORFS = 900;
119 - my $MPI = 0;
120 -
121 -@@ -330,15 +329,15 @@
122 - my $top_cds_file = $train_file && -s $train_file ? $train_file : "$cds_file.top_${top_ORFs_train}_longest";
123 - if (!-s $top_cds_file) {
124 - # get longest entries
125 -- my $cmd = "$UTIL_DIR/get_top_longest_fasta_entries.pl $cds_file $top_ORFs_train > $top_cds_file";
126 -+ my $cmd = "get_top_longest_fasta_entries.pl $cds_file $top_ORFs_train > $top_cds_file";
127 -
128 - unless ($reuse && -s $top_cds_file){
129 - if ($cd_hit_est_exec){
130 - # to speed things up only check for redundancy up to 4x the number of entries we want
131 - my $red_num = $top_ORFs_train * 4 ;
132 -- &process_cmd("$UTIL_DIR/get_top_longest_fasta_entries.pl $cds_file $red_num > $workdir/redundant_top");
133 -+ &process_cmd("get_top_longest_fasta_entries.pl $cds_file $red_num > $workdir/redundant_top");
134 - &process_cmd("$cd_hit_est_exec -r 1 -i $workdir/redundant_top -o $workdir/redundant_top.nr90 -M 0 -T $CPU >/dev/null 2>/dev/null");
135 -- &process_cmd("$UTIL_DIR/get_top_longest_fasta_entries.pl $workdir/redundant_top.nr90 $top_ORFs_train > $top_cds_file");
136 -+ &process_cmd("get_top_longest_fasta_entries.pl $workdir/redundant_top.nr90 $top_ORFs_train > $top_cds_file");
137 - unlink("$workdir/redundant_top");
138 - unlink("$workdir/redundant_top.nr90");
139 - unlink("$workdir/redundant_top.nr90.bak.clstr");
140 -@@ -349,20 +348,20 @@
141 - }
142 - }
143 -
144 --$cmd = "$UTIL_DIR/compute_base_probs.pl $transcripts_file $TOP_STRAND_ONLY > $workdir/base_freqs.dat";
145 -+$cmd = "compute_base_probs.pl $transcripts_file $TOP_STRAND_ONLY > $workdir/base_freqs.dat";
146 - &process_cmd($cmd) unless $reuse && -s "$workdir/base_freqs.dat";
147 -
148 -
149 - # get hexamer scores
150 --#$cmd = "$UTIL_DIR/seq_n_background_to_logliklihood_vals.pl $top_cds_file $transcripts_file.random > hexamer.scores";
151 -+#$cmd = "seq_n_background_to_logliklihood_vals.pl $top_cds_file $transcripts_file.random > hexamer.scores";
152 - #&process_cmd($cmd) unless ($reuse && -s "hexamer.scores");
153 -
154 --$cmd = "$UTIL_DIR/seq_n_baseprobs_to_logliklihood_vals.pl $top_cds_file $workdir/base_freqs.dat > $workdir/hexamer.scores";
155 -+$cmd = "seq_n_baseprobs_to_logliklihood_vals.pl $top_cds_file $workdir/base_freqs.dat > $workdir/hexamer.scores";
156 - &process_cmd($cmd) unless $reuse && -s "$workdir/hexamer.scores";
157 -
158 -
159 - # score all cds entries
160 --$cmd = "$UTIL_DIR/score_CDS_liklihood_all_6_frames.pl $cds_file $workdir/hexamer.scores > $cds_file.scores";
161 -+$cmd = "score_CDS_liklihood_all_6_frames.pl $cds_file $workdir/hexamer.scores > $cds_file.scores";
162 - &process_cmd($cmd) unless ($reuse && -s "$cds_file.scores");
163 -
164 -
165 -@@ -440,18 +439,18 @@
166 - }
167 -
168 - # index the current gff file:
169 --$cmd = "$UTIL_DIR/index_gff3_files_by_isoform.pl $gff3_file";
170 -+$cmd = "index_gff3_files_by_isoform.pl $gff3_file";
171 - &process_cmd($cmd);
172 -
173 - # retrieve the best entries:
174 --$cmd = "$UTIL_DIR/gene_list_to_gff.pl $acc_file $gff3_file.inx > $cds_file.best_candidates.gff3";
175 -+$cmd = "gene_list_to_gff.pl $acc_file $gff3_file.inx > $cds_file.best_candidates.gff3";
176 - &process_cmd($cmd);
177 -
178 - {
179 - my $final_output_prefix = basename($transcripts_file) . ".transdecoder";
180 -
181 - # exclude shadow orfs (smaller orfs in different reading frame that are eclipsed by longer orfs)
182 -- $cmd = "$UTIL_DIR/remove_eclipsed_ORFs.pl $cds_file.best_candidates.gff3 > $final_output_prefix.gff3";
183 -+ $cmd = "remove_eclipsed_ORFs.pl $cds_file.best_candidates.gff3 > $final_output_prefix.gff3";
184 - &process_cmd($cmd);
185 -
186 -
187 -@@ -462,14 +461,14 @@
188 - my $gff3_file = "$final_output_prefix.gff3";
189 - my $bed_file = $gff3_file;
190 - $bed_file =~ s/\.gff3$/\.bed/;
191 -- $cmd = "$UTIL_DIR/gff3_file_to_bed.pl $gff3_file > $bed_file";
192 -+ $cmd = "gff3_file_to_bed.pl $gff3_file > $bed_file";
193 - &process_cmd($cmd);
194 -
195 -
196 - # make a peptide file:
197 - my $best_pep_file = $gff3_file;
198 - $best_pep_file =~ s/\.gff3$/\.pep/;
199 -- $cmd = "$UTIL_DIR/gff3_file_to_proteins.pl $gff3_file $transcripts_file > $best_pep_file";
200 -+ $cmd = "gff3_file_to_proteins.pl $gff3_file $transcripts_file > $best_pep_file";
201 - &process_cmd($cmd);
202 -
203 -
204 -@@ -477,13 +476,13 @@
205 - # make a CDS file:
206 - my $best_cds_file = $best_pep_file;
207 - $best_cds_file =~ s/\.pep$/\.cds/;
208 -- $cmd = "$UTIL_DIR/gff3_file_to_proteins.pl $gff3_file $transcripts_file CDS > $best_cds_file";
209 -+ $cmd = "gff3_file_to_proteins.pl $gff3_file $transcripts_file CDS > $best_cds_file";
210 - &process_cmd($cmd);
211 -
212 - # make a CDS file:
213 - my $best_cdna_file = $best_pep_file;
214 - $best_cdna_file =~ s/\.pep$/\.mRNA/;
215 -- $cmd = "$UTIL_DIR/gff3_file_to_proteins.pl $gff3_file $transcripts_file cDNA > $best_cdna_file";
216 -+ $cmd = "gff3_file_to_proteins.pl $gff3_file $transcripts_file cDNA > $best_cdna_file";
217 - &process_cmd($cmd);
218 -
219 - }
220
221 diff --git a/sci-biology/transdecoder/files/pfam_runner.pl.patch b/sci-biology/transdecoder/files/pfam_runner.pl.patch
222 deleted file mode 100644
223 index 7809b1a..0000000
224 --- a/sci-biology/transdecoder/files/pfam_runner.pl.patch
225 +++ /dev/null
226 @@ -1,20 +0,0 @@
227 ---- /usr/bin/pfam_runner.pl 2015-01-09 11:22:55.000000000 +0100
228 -+++ pfam_runner.pl 2015-01-09 14:25:43.385838579 +0100
229 -@@ -24,7 +24,7 @@
230 - my $workdir;
231 - my $verbose;
232 - my ($reuse,$pfam_out);
233 --my $CPU = 2;
234 -+my $CPU = 1;
235 -
236 - my $usage = <<_EOH_;
237 -
238 -@@ -59,7 +59,7 @@
239 - # -h print this option menu and quit
240 - # -v verbose
241 - #
242 --# --CPU <int> number of threads to use; (default: 2)
243 -+# --CPU <int> number of threads to use; (default: 1)
244 - #
245 - # --MPI use MPI (via ffindex_apply_mpi)
246 - #
247
248 diff --git a/sci-biology/transdecoder/metadata.xml b/sci-biology/transdecoder/metadata.xml
249 deleted file mode 100644
250 index 2bc8930..0000000
251 --- a/sci-biology/transdecoder/metadata.xml
252 +++ /dev/null
253 @@ -1,9 +0,0 @@
254 -<?xml version="1.0" encoding="UTF-8"?>
255 -<!DOCTYPE pkgmetadata SYSTEM "http://www.gentoo.org/dtd/metadata.dtd">
256 -<pkgmetadata>
257 - <herd>sci-biology</herd>
258 - <maintainer>
259 - <email>mmokrejs@×××××××××××××××.cz</email>
260 - <name>Martin Mokrejs</name>
261 - </maintainer>
262 -</pkgmetadata>
263
264 diff --git a/sci-biology/transdecoder/transdecoder-2.0.1.ebuild b/sci-biology/transdecoder/transdecoder-2.0.1.ebuild
265 deleted file mode 100644
266 index e8f5134..0000000
267 --- a/sci-biology/transdecoder/transdecoder-2.0.1.ebuild
268 +++ /dev/null
269 @@ -1,69 +0,0 @@
270 -# Copyright 1999-2015 Gentoo Foundation
271 -# Distributed under the terms of the GNU General Public License v2
272 -# $Header: $
273 -
274 -EAPI=5
275 -
276 -PERL_EXPORT_PHASE_FUNCTIONS=no
277 -inherit perl-module eutils toolchain-funcs
278 -
279 -DESCRIPTION="Extract ORF/CDS regions from FASTA sequences"
280 -HOMEPAGE="http://sourceforge.net/projects/transdecoder/"
281 -SRC_URI="https://github.com/TransDecoder/TransDecoder/archive/"${PV}".tar.gz -> ${P}.tar.gz"
282 -
283 -LICENSE="BSD-BroadInstitute"
284 -SLOT="0"
285 -KEYWORDS="~amd64"
286 -IUSE=""
287 -
288 -DEPEND=""
289 -RDEPEND="${DEPEND}
290 - sci-biology/cd-hit
291 - sci-biology/hmmer
292 - sci-biology/parafly
293 - sci-biology/ffindex"
294 -# cdhit-4.6.1 is a real dependency, at least hmmer is optional (also ncbi-tools++ is now used for ORF searches)
295 -
296 -S="${WORKDIR}"/TransDecoder-2.0.1
297 -
298 -##src_prepare(){
299 -# #mv Makefile Makefile.old
300 -# #epatch "${FILESDIR}"/TransDecoder.patch
301 -# #epatch "${FILESDIR}"/pfam_runner.pl.patch
302 -#}
303 -
304 -# avoid fetching 1.5TB "${S}"/pfam/Pfam-AB.hmm.bin, see
305 -# "Re: [Transdecoder-users] Announcement: Transdecoder release r20140704" thread in archives
306 -#
307 -# you cna get it from http://downloads.sourceforge.net/project/transdecoder/Pfam-AB.hmm.bin
308 -
309 -src_install(){
310 - dobin TransDecoder.Predict TransDecoder.LongOrfs
311 - insinto /usr/share/${PN}/util
312 - dobin util/*.pl
313 - # zap the bundled cdhit binaries copied from transdecoder_plugins/cdhit/ to util/bin
314 - rm -rf util/bin
315 - #
316 - # * sci-biology/trinityrnaseq-20140413:0::science
317 - # * /usr/bin/Fasta_reader.pm
318 - # * /usr/bin/GFF3_utils.pm
319 - # * /usr/bin/Gene_obj.pm
320 - # * /usr/bin/Gene_obj_indexer.pm
321 - # * /usr/bin/Longest_orf.pm
322 - # * /usr/bin/Nuc_translator.pm
323 - # * /usr/bin/TiedHash.pm
324 - #
325 - perl_set_version
326 - insinto ${VENDOR_LIB}/${PN}
327 - dobin PerlLib/*.pm # BUG: install into /usr/bin but wanted to have it readable and executable in ${VENDOR_LIB}/${PN} instead
328 - einfo "Fetch on your own:"
329 - einfo "wget --mirror -nH -nd http://downloads.sourceforge.net/project/transdecoder/Pfam-AB.hmm.bin"
330 - einfo "hmmpress Pfam-AB.hmm.bin"
331 -}
332 -
333 -pkg_postinst(){
334 - einfo "It is recommended to use TransDecoder with hmmer-3 or at least NCBI blast"
335 - einfo "from either sci-biology/ncbi-blast+ (released more often) or"
336 - einfo "from sci-biology/ncbi-toolkit++ (huge bundle with releases and less frequent bugfixes)"
337 - einfo "Author says the minimum requirement is sci-biology/cd-hit"
338 -}