@iracooke, last active September 20, 2015

Creating a protein database from 6-frame and transdecoder sequences

Analyses in Galaxy

  1. Run the TranscriptomePGMakeDatabase workflow. Inputs for this include a Trinity assembly, predicted proteins from Transdecoder, gff3 coordinates corresponding to the Transdecoder predictions, and the cRAP database of contaminants.
  2. Ensure that the known_novel_crap_decoy.fasta output from the above workflow is loaded onto Mascot for searching.
  3. Use the outputs from TranscriptomePGMakeDatabase to run a workflow based on the Transcriptome PG workflow, modified to include a Mascot search against the database for your specific organism.
  4. Download the observed_peptides.gff3 file that you get from running the previous workflow step.

Use bedtools to find novel only peptides

  1. First gather the following files in a directory on your laptop

     | File | Description |
     | ---- | ----------- |
     | observed_peptides.gff3 | Output from the Galaxy workflow above |
     | transdecoder.gff3 | GFF coordinates for Transdecoder predictions (used as an input to the Galaxy workflow above) |
     | known.fasta | Output from the database generation workflow above |
     | novel.fasta | Output from the database generation workflow above |
     | crap.fasta | The cRAP contaminants. Download |
  2. Make sure you install bedtools on your laptop

  3. Extract only CDS entries from the transdecoder file

        awk '$3 == "CDS"' transdecoder.gff3 > transdecoder_cds.gff3
  4. Compare the observed peptides with the Transdecoder CDS entries, keeping only those peptides that are not fully contained within a Transdecoder CDS prediction

        bedtools subtract -s -f 1.0 -a observed_peptides.gff3 -b transdecoder_cds.gff3 > really_novel.gff3
  5. Download this filter_fasta.rb script and put it in the same directory as the files above. Make sure it has execute permissions, i.e.

        chmod u+x filter_fasta.rb
  6. Extract the IDs from really_novel.gff3 and then grab their corresponding entries from the novel.fasta file

        cat really_novel.gff3 | awk -F '=' '{print $2}' | awk -F '.' '{print "lcl|"$1}' | sort -u > really_novel_ids.txt
    
        ./filter_fasta.rb novel.fasta really_novel_ids.txt > really_novel.fasta
  7. Concatenate the novel proteins with known.fasta

        cat really_novel.fasta known.fasta > known_updated.fasta
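The `bedtools subtract -s -f 1.0` call in step 4 discards a peptide only when it lies entirely within a CDS feature on the same strand. A minimal Ruby sketch of that containment test (illustrative only; the intervals and names below are invented, and the real tool parses GFF and handles many cases this sketch ignores):

```ruby
# Sketch of the test performed by `bedtools subtract -s -f 1.0`:
# an A interval (peptide) is dropped only when 100% of it overlaps
# a B interval (CDS) on the same strand.
def fully_contained?(a, b_list)
  b_list.any? do |b|
    a[:strand] == b[:strand] &&       # -s : require same strand
      b[:start] <= a[:start] &&       # -f 1.0 : B must cover all of A
      a[:end] <= b[:end]
  end
end

peptides = [
  { name: "pep1", start: 100, end: 130, strand: "+" }, # inside a CDS -> dropped
  { name: "pep2", start: 400, end: 450, strand: "+" }, # outside -> kept
  { name: "pep3", start: 100, end: 130, strand: "-" }, # wrong strand -> kept
]
cds = [{ start: 50, end: 200, strand: "+" }]

really_novel = peptides.reject { |p| fully_contained?(p, cds) }
puts really_novel.map { |p| p[:name] }.join(",")   # => pep2,pep3
```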

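The awk pipeline in step 6 takes everything after the `=` in each GFF line, truncates it at the first `.`, adds an `lcl|` prefix (so the IDs match the FASTA headers in novel.fasta), and de-duplicates. A Ruby sketch of the same transformation, using hypothetical GFF lines:

```ruby
# Sketch of the ID-extraction pipeline: split each GFF line on '=',
# keep the attribute value up to the first '.', prefix 'lcl|', and
# de-duplicate. The input lines here are hypothetical examples.
lines = [
  "comp1_c0_seq1\t.\tpolypeptide\t10\t40\t.\t+\t.\tID=comp1_c0_seq1.p1",
  "comp1_c0_seq1\t.\tpolypeptide\t60\t90\t.\t+\t.\tID=comp1_c0_seq1.p1",
  "comp2_c0_seq1\t.\tpolypeptide\t5\t35\t.\t-\t.\tID=comp2_c0_seq1.p2",
]

ids = lines.collect { |l| "lcl|" + l.split("=")[1].split(".")[0] }.uniq.sort
puts ids
```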
Name and install the database

For MaxQuant, simply rename the DB. Modify the example below for your species

    cp known_updated.fasta SAustrinumMQ_20151908.fasta

To create a database for normal TPP decoy searching, and for loading on Mascot, you need to install protk, which provides the make_decoy.rb tool.

   cat crap.fasta known_updated.fasta > known_updated_crap.fasta
   make_decoy.rb -A known_updated_crap.fasta -o SAustrinum_20151908.fasta
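make_decoy.rb appends decoy (nonsense) sequences to the target database so that downstream tools can estimate false discovery rates. As an illustration of the general idea only, here is a minimal Ruby sketch of reversed-sequence decoy generation; the `decoy_` header prefix and the reversal strategy are assumptions for this sketch, not necessarily what make_decoy.rb does:

```ruby
# Sketch of reversed-sequence decoy generation: for each target protein,
# append a decoy whose sequence is the target reversed. The "decoy_"
# header prefix is an assumption for illustration.
def add_decoys(entries)
  entries + entries.collect do |header, seq|
    ["decoy_" + header, seq.reverse]
  end
end

targets = [["prot1", "MKLVA"], ["prot2", "GGSTP"]]
db = add_decoys(targets)
db.each { |h, s| puts ">#{h}\n#{s}" }
```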
filter_fasta.rb

    #!/usr/bin/env ruby
    #
    # filter_fasta.rb - print only those entries of a FASTA file whose IDs
    # appear in an ID list (one ID per line).
    #
    # Usage: filter_fasta.rb input.fasta ids.txt > filtered.fasta
    require 'set'
    require 'bio'

    fasta_file = ARGV[0]
    id_filter = ARGV[1]
    output_fh = $stdout

    # Load the ID list into a Set for fast membership tests
    $filter_ids = Set.new(File.readlines(id_filter).collect { |e| e.chomp })

    # An entry passes if the filter list is empty or contains the entry's ID
    def passes_filters(entry)
      return true if $filter_ids.empty?
      $filter_ids.include? entry.entry_id
    end

    file = Bio::FastaFormat.open(fasta_file.chomp)
    file.each do |entry|
      output_fh.write entry if passes_filters(entry)
    end