require 'rubygems'
require 'bio'
 
#############

# Reads in a ClustalW formatted multiple sequence alignment
# from a file named "infile_clustalw.aln" and stores it in 'report'.
report = Bio::ClustalW::Report.new(File.read('infile_clustalw.aln'))

# Accesses the actual alignment.
msa = report.alignment

# Goes through all sequences in 'msa' and prints the
# actual molecular sequence.
msa.each do |entry|
  puts entry.seq
end

##############

DEFAULT_PARSER = Bio::Alignment::MultiFastaFormat
puts DEFAULT_PARSER.to_s

#file = Bio::Alignment.readfiles('bcl2.fasta', Bio::Alignment::MultiFastaFormat)
#file.each do |entry|
#  puts entry.entry_id           # Gets the identifier, e.g. 'sp|O35147|BAD_RAT'.
#  puts entry.definition         # Gets the complete fasta description line.
#  puts entry.seq                # Gets the actual sequence.
  #puts entry.aaseq.composition  # Gets the amino acid composition.
#end
#puts 'OK'
#puts

file = Bio::FastaFormat.open('bcl2.fasta')
file.each do |entry|
   puts entry.entry_id           # Gets the identifier, e.g. 'sp|O35147|BAD_RAT'.
  puts entry.definition         # Gets the complete fasta description line.
  puts entry.seq                # Gets the actual sequence.
  # do something on each fasta sequence entry
end

##############

# Creates a new file named "outfile.fasta" and writes
# multiple sequence alignment 'msa' to it in fasta format.
File.open('outfile.fasta', 'w') do |f|
  f.write(msa.output(:fasta))
end

# Other formats
File.open('outfile.clustal', 'w') do |f|
  f.write(msa.output(:clustal))
end
File.open('outfile.phylip', 'w') do |f|
  f.write(msa.output(:phylip))
end
File.open('outfile.phylipnon', 'w') do |f|
  f.write(msa.output(:phylipnon))
end
File.open('outfile.msf', 'w') do |f|
  f.write(msa.output(:msf))
end
File.open('outfile.molphy', 'w') do |f|
  f.write(msa.output(:molphy))
end


#############

seq1 = Bio::Sequence.auto("gggggg")


puts seq1.output(:fasta)
#seq2 = Bio::Sequence::AA.new("ggggt")
#seq3 = Bio::Sequence::AA.new("ggt")


seqs = ['MFQIPEFEPSEQEDSSSAER',
        'MGTPKQPSLAPAHALGLRKS',
        'PKQPSLAPAHALGLRKS',
        'MCSTSGCDLE'] 


# MAFFT
options = [ '--maxiterate', '1000', '--localpair' ]
mafft = Bio::MAFFT.new('mafft', options )
report = mafft.query_align( seqs)

# Accesses the actual alignment
align = report.alignment

# Prints each sequence to the console.
align.each { |s| puts s.to_s }


puts 'MAFFT OK'
puts

#clustalw
clustalw = Bio::ClustalW.new('/home/zma/SOFTWARE/clustalw-2.1/src/clustalw2' )
report = clustalw.query_align( seqs)
#puts report.alignment.output_fasta.to_s
report.alignment.each { |x| puts x.to_s }
puts 'OK'
puts

#muscle
options = [ '-quiet', '-maxiters', '64' ]
muscle = Bio::Muscle.new('/home/zma/SOFTWARE/muscle3.8.31/src/muscle', options )
report = muscle.query_align( seqs)
#puts report.alignment.output_fasta.to_s
report.alignment.each { |x| puts x.to_s }
puts 'OK'
puts

file = Bio::FastaFormat.open('bcl2.fasta')
file.each do |entry|
  puts entry.entry_id           # Gets the identifier, e.g. 'sp|O35147|BAD_RAT'.
  puts entry.definition         # Gets the complete fasta description line.
  puts entry.seq                # Gets the actual sequence.
  puts entry.aaseq.composition  # Gets the amino acid composition. 
end
puts 'OK'
puts

Bio::FlatFile.auto('bcl2.fasta') do |ff|
  ff.each do |entry|
    puts entry.entry_id           # Gets the identifier, e.g. 'sp|O35147|BAD_RAT'.
    puts entry.definition         # Gets the complete fasta description line.
    puts entry.seq                # Gets the actual sequence.
    puts entry.aaseq.composition  # Gets the amino acid composition.
  end
end
puts 'OK'
puts