#!/usr/bin/env perl

# find repeats in all of the phage genomes.

# the repeats must be within 2kb of the start and end. 
# Actually: 
#   left_start must be 1,
#   left_end must be Sherwood phage start + 100
#   right_start must be sherwood phage end - 100
#   right_end must be length of sequence

use strict;
use Bio::SeqIO;
use RepeatFinder;

# Help text; printed via die() when no input file (-f) is supplied.
my $usage=<<EOF;
-f 	file
-m 	minimum size
-ls	left start
-le	left end
-rs	right start
-re 	right end
-n	near-to distance
EOF

my ($file, $min, $leftstart, $leftend, $rightstart, $rightend, $near);

# Hand-rolled option parsing: consume @ARGV one token at a time. A recognised
# flag takes the *next* token as its value; unrecognised tokens are silently
# ignored. A flag given as the last token leaves its variable undefined.
while (@ARGV) {
	my $t=shift @ARGV;
	if    ($t eq "-f")  {$file=shift @ARGV}
	elsif ($t eq "-m")  {$min=shift @ARGV}
	elsif ($t eq "-ls") {$leftstart=shift @ARGV}
	elsif ($t eq "-le") {$leftend=shift @ARGV}
	elsif ($t eq "-rs") {$rightstart=shift @ARGV}
	elsif ($t eq "-re") {$rightend=shift @ARGV}
	elsif ($t eq "-n")  {$near=shift @ARGV}
}

# Fall back to a minimum size of 10 when -m is absent (or given as 0 / empty).
$min=10 unless ($min);

die $usage unless $file;

# Input format is left for Bio::SeqIO to determine (no -format is passed);
# output is always GenBank, written next to the input as "<file>.repeats.gbk".
my $seqin=Bio::SeqIO->new(-file=>"$file");
my $seqout=Bio::SeqIO->new(-file=>">$file.repeats.gbk", -format=>'genbank');

# Process every sequence in the input file: build a RepeatFinder for it using
# the minimum size, then apply whichever search-window limits were given on
# the command line.
while (my $seq=$seqin->next_seq) {
  my $rep=RepeatFinder->new(-seq=>$seq, -minimum=>$min);
  # Each setter is only called when a true value was supplied, so an omitted
  # option (or an explicit 0) never reaches the RepeatFinder object.
  if ($leftstart) {$rep->left_start($leftstart)}
  if ($leftend) {$rep->left_end($leftend)}
  if ($rightstart) {$rep->right_start($rightstart)}
  if ($rightend) {$rep->right_end($rightend)}
  # NOTE(review): in the lines visible here $newseq is never used, nothing is
  # written to $seqout, $near (-n) is never passed to RepeatFinder, and the
  # loop's closing brace does not appear - confirm against the complete file.
 my $newseq=$rep->joined_repeats;

