<?xml version='1.0'?><rss version="2.0" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:georss="http://www.georss.org/georss" xmlns:atom="http://www.w3.org/2005/Atom" >
<channel>
	<title><![CDATA[BOL: Owner]]></title>
	<link>https://bioinformaticsonline.com/snippets/owner/bulbul?</link>
	<atom:link href="https://bioinformaticsonline.com/snippets/owner/bulbul?" rel="self" type="application/rss+xml" />
	<description><![CDATA[]]></description>
	
	<item>
	<guid isPermaLink="true">https://bioinformaticsonline.com/snippets/view/30354/perl-script-to-remove-the-duplicate-sequences-from-multifasta-file</guid>
	<pubDate>Fri, 23 Dec 2016 08:47:47 -0600</pubDate>
	<link>https://bioinformaticsonline.com/snippets/view/30354/perl-script-to-remove-the-duplicate-sequences-from-multifasta-file</link>
	<title><![CDATA[Perl script to remove the duplicate sequences from multifasta file]]></title>
	<description><![CDATA[<code>use strict;
use Bio::SeqIO;
my %unique;

my $file   = &quot;myseqs.fa&quot;;
my $seqio  = Bio::SeqIO-&gt;new(-file =&gt; $file, -format =&gt; &quot;fasta&quot;);
my $outseq = Bio::SeqIO-&gt;new(-file =&gt; &quot;&gt;$file.uniq&quot;, -format =&gt; &quot;fasta&quot;);

while(my $seqs = $seqio-&gt;next_seq) {
  my $id  = $seqs-&gt;display_id;
  my $seq = $seqs-&gt;seq;
  unless(exists($unique{$seq})) {
    $outseq-&gt;write_seq($seqs);
    $unique{$seq} +=1;
  }
}</code>]]></description>
	<dc:creator>Bulbul</dc:creator>
</item>

</channel>
</rss>