1.hmmer

convalign.py stockholm file.aln(file.fasta)

hmmbuild –amino file.hmm file.sth

hmmsearch -o file.hmm.hit –noali –nobias file.hmm targetPep.fasta

 

 

2.blast

短序列
psiblast -query AT4G13850.1 -db ../../../conservation/subject/AT4G13850.1 -out AT4G13850.1.out -num_iterations 3 -evalue 20000 -matrix PAM30 -comp_based_stats 0

psiblast -query $(basename $@) -db /data7T/mercu-b-backup/pu b-data/NCBI-NR/nr -out $@ -outfmt 0 -num_threads 8 -threshold 0.005 -eval ue 10 -max_target_seqs 1000 -num_iterations 10 -inclusion_ethresh 0.002

#file.fasta由clustralw等多序列比对软件生成

psiblast -in_msa file.fasta ../../../conservation/subject/AT4G13850.1 -out AT4G13850.1.out -num_iterations 3 -evalue 20000 -matrix PAM30 -comp_based_stats 0

 

#返回fasta格式的数据

blastdbcmd -entry NP_172083.1 -db /data7T/mercu-b-backup/pub-data/NCBI-NR/nr

#自定义输出格式

blastp -query 1PP2.L.fasta -db /data7T/mercu-b-backup/pub-data/NCBI-NR/nr -out 1PP2.L.fasta.out.0 -num_threads=8 -outfmt=’6 qseqid sseqid pident length slen evalue’

http://www.ncbi.nlm.nih.gov/blast/html/sub_matrix.html

短序列 psiblast -query AT4G13850.1 -db ../../../conservation/subject/AT4G13850.1 -out AT4G13850.1.out -num_iterations 3 -evalue 20000 -matrix PAM30 -comp_based_stats 0

psiblast -query $(basename $@) -db /data7T/mercu-b-backup/pu b-data/NCBI-NR/nr -out $@ -outfmt 0 -num_threads 8 -threshold 0.005 -eval ue 10 -max_target_seqs 1000 -num_iterations 10 -inclusion_ethresh 0.002

#file.fasta由clustralw等多序列比对软件生成

psiblast -in_msa file.fasta ../../../conservation/subject/AT4G13850.1 -out AT4G13850.1.out -num_iterations 3 -evalue 20000 -matrix PAM30 -comp_based_stats 0

#返回fasta格式的数据

blastdbcmd -entry NP_172083.1 -db /data7T/mercu-b-backup/pub-data/NCBI-NR/nr

#自定义输出格式

blastp -query 1PP2.L.fasta -db /data7T/mercu-b-backup/pub-data/NCBI-NR/nr -out 1PP2.L.fasta.out.0 -num_threads=8 -outfmt=’6 qseqid sseqid pident length slen evalue’

http://www.ncbi.nlm.nih.gov/blast/html/sub_matrix.html

3.meme  [http://meme.sdsc.edu/meme/doc/meme.html]

meme F1_MEF.macs_peaks.pv2000.bed.fa -dna -nmotifs 1000 -evt 0.001 -revcomp \
-mod anr -minsites 50 -maxsites 10000 \
-maxsize `cat F1_MEF.macs_peaks.pv2000.bed.fa | wc -c` \
-oc F1_MEF.macs_peaks.pv2000.meme

 

 

4.meme修改

mcast调用mhhmscan出现错误 sh: line 1: 11764 Aborted

FATAL: mhmmscan failed with exit status 134, command run was:

 

Revise:

run with another parameter –blocksize

 

$(cell).macs_peaks.pv2000.homer: $(cell).macs_peaks.pv2000.bed

findMotifsGenome.pl $< mm9 $@ -size given -p 6
pythonmail2.py $@ $@

$(cell).macs_peaks.pv2000.meme-fimo-uniprobe: $(cell).macs_peaks.pv2000.bed.fa
fimo –output-qthresh 0.1 –max-seq-length 2.5e8 \
–oc $@ –max-stored-scores 1000000000 \
~/soft/meme/db/motif_databases/uniprobe_mouse.meme $<
pythonmail2.py $@ $@
tail -n +2 $@/fimo.txt | cut -f 1 | sort | uniq -c | sed ‘s/^ *//’ \
| awk ‘BEGIN{OFS=”\t”;FS=” “;}{print \(2,\)1}’ | sort -k1,1 \

$@/fimo.txt.motif.pattern.cnt
join -a1 -t ‘ ‘ -o 2.2,1.2 \
$@/fimo.txt.motif.pattern.cnt $(uniprobe_tf) \
$@/fimo.txt.motif.tf.cnt
$(cell).macs_peaks.pv2000.meme-mcast-uniprobe: $(cell).macs_peaks.pv2000.bed.fa
mkdir -p $@
mhmm –type star –keep-unused –verbosity 2 \
/home/chentong/soft/meme/db/motif_databases/uniprobe_mouse.meme \
$@/uniprobe_mouse.meme.mhmm
mhmmscan –fancy –allow-weak-motifs –p-thresh 0.0005 \
–max-gap 50 –e-thresh 10 –eg-cost 1 \
–blocksize \
`gawk ‘{if(x<length()) x = length()}END{print x}’ $<` \
–verbosity 5 –pseudo-weight 4.0 \
$@/uniprobe_mouse.meme.mhmm $< \
$@/mcast.txt
mhmm2html $@/mcast.txt >$@/mcast.html
pythonmail2.py $@ $@

 

5.

6.

7.

8.

9.

10.

11.

12.

13.

14.

15.

16.

17.

18.

19.

20.