用户工具

站点工具


个性化条目:共有peak

共有peak

脚本

/TJPROJ6/RNA_SH/personal_dir/yangdan/new/gongdan/peak_venn


perl peak_overlap_venn.pl \
  -peakfile peakfile.txt \
  -outdir . \
  -mode peak

具体脚本

#!/usr/bin/perl
use Getopt::Long;
use File::Basename qw(basename dirname);

my $ver    = "1.0";
my $Writer = "chenzixi\@novogene.com";
my $Data   = "2019/12/25";
#######################################################################################
# ------------------------------------------------------------------
# GetOptions
# ------------------------------------------------------------------
my ($peakfile,$outdir,$mode);
GetOptions(
                        "h|?" =>\&help,
                        "peakfile:s"=>\$peakfile,
                        "outdir:s"=>\$outdir,
						"mode:s"=>\$mode,
                        ) || &help;
&help unless ($peakfile && $outdir );
sub help
{
        print <<"    Usage End.";
        Description:
        Writer  : $Writer
        Data    : $Data
        Version : $ver
        function: ......
        Usage:
                -peakfile    peakfile, eg /TJPROJ1/RNA/WORK/Pipline/aftersale/peak_overlap_venn/testdata/peakfile.txt   Required

                -outdir      output result dir                                                                          Required

				-mode		 peak or dml[peak]																		Optional

                -h           Help                                                                                       document

#################
for DML mode,use both start/end as the position(start=end)
#################

    Usage End.
        exit;
}
# ------------------------------------------------------------------
# GetOptions End
# ------------------------------------------------------------------
my @pallete=qw/#E43B2D #377EB7 #4DAF4A #984EA3 #F27E33 #FEF840 #A65629 #F180BF #999999/;
$mode||="peak";
my $min=1;

if (($mode ne "peak")&&($mode ne "dml")){
	die "only peak/dml mode suppported, please check!\n";
}


my %samplelist;
my @samples;
my $one_dml_file;
open (IN,"< $peakfile") || die $!;
while(<IN>){
    chomp;
    my @line=split /\t/;
    $samplelist{$line[0]}=$line[1];
	$one_dml_file=$line[1];
    push @samples,$line[0];
}
close IN;

### Test start=end if using DML mode
if ($mode eq "dml"){
	open (IN,"$one_dml_file");
	my $line1=<IN>;
	close IN;
	chomp $line1;
	my @line=split(/\t/,$line1);
	die "If using dml mode, the start and end position should be the same. Please check!\n" if($line[1] != $line[2]);

}


my $remove=scalar @pallete - scalar @samples;#print $remove;
for(my $i=0;$i<$remove;$i++){
    pop @pallete;
}
my $colors="\"".join("\",\"",@pallete)."\"";

chdir($outdir);
my $sh="$outdir\/Peak_Overlap.r";
open (SH,"> $sh") || die $!;
print SH <<"  END.";
library(ChIPpeakAnno)

  END.

my $i=0;
foreach my $sample (@samples){
    $i++;
    print SH <<"  END.";
###  read file for $sample
data$i<-read.delim("$samplelist{$sample}",header=F,sep = "\\t")
$sample<-unique(GRanges(seqnames=data$i\[,1],
               ranges=IRanges(start=data$i\[,2],
                              end=data$i\[,3],
                              names=paste(data$i\[,1],data$i\[,2],data$i\[,3],sep=":")),
               strand=rep("+",length(data$i\[,1]))))
  END.
}

my $allsample=join(",",@samples);
print SH <<"  END.";
### overlap peaks
ol <- findOverlapsOfPeaks($allsample,minoverlap=$min,
                          connectedPeaks="merge")
### make venn
pdf("$outdir\/Peak_Overlap.pdf")
makeVennDiagram(ol, col="#00000000",euler.d=TRUE,scaled=TRUE,
                fill=c($colors),
                margin=c(0.05,0.05,0.05,0.05))
dev.off()
system("convert -density 1200 -resize 600 $outdir\/Peak_Overlap.pdf $outdir\/Peak_Overlap.png")
### output overlap peaklist
for (i in names(ol\$peaklist)){
  change<-gsub("///","_",i)
  filename<-paste(change,"all.id.xls",sep=".")
  temp<-as.data.frame(ol\$peaklist[[i]])
  for (j in c(1:length(temp\$peakNames))){
    temp\$samplepeaks[j]<-paste(as.vector(temp\$peakNames[[j]]),collapse = ";")
  }
  temp <- subset(temp, select = -peakNames)
  write.table(temp,filename,sep = "\t",quote=F,row.names = F,col.names = F)
  rm(temp)
}
  END.
close SH;
#`/PUBLIC/software/RNA/R/R-3.5.1/bin/Rscript $sh`;
`source /TJPROJ1/RNA/WORK/software/ChIPpeakAnno_dev/source_before_use;/TJPROJ1/RNA/WORK/software/ChIPpeakAnno_dev/R-4.0.2/bin/Rscript $sh`;
#`echo source /TJPROJ1/RNA/WORK/software/ChIPpeakAnno_dev/source_before_use > $outdir\/Peak_Overlap.sh`;
#`echo /TJPROJ1/RNA/WORK/software/ChIPpeakAnno_dev/R-4.0.2/bin/Rscript $sh >> $outdir\/Peak_Overlap.sh`;
#`sh $outdir\/Peak_Overlap.sh`;
`ls $outdir\/*.xls|xargs sed -i '1ichr\tstart\tend\tlength\tstrand\tsamplepeak'`;
个性化条目/共有peak.txt · 最后更改: 2024/09/27 01:38 由 fengjie