SlideShare une entreprise Scribd logo
1  sur  17
•
    •
    •
•
    •
•
•

        GCATGCAT
    A
    C
    G
    T
    T
    C
    G
    T
•
    •
•
    •
•
    •
    •
        •
•
            •
            •
BLASTN 2.2.16 [Mar-25-2007]

Reference: Altschul, Stephen F., Thomas L. Madden, Alejandro A. Schaffer,
Jinghui Zhang, Zheng Zhang, Webb Miller, and David J. Lipman (1997),
quot;Gapped BLAST and PSI-BLAST: a new generation of protein database search
programsquot;, Nucleic Acids Res. 25:3389-3402.

Query= ORFN:12 Multiple, Contig c912 1285-2874 reverse complement
         (1590 letters)
Database: yeast.nt
           17 sequences; 12,155,026 total letters
Searching..................................................done

                                                                 Score    E
Sequences producing significant alignments:                      (bits) Value

ref|NC_001143.1| Saccharomyces cerevisiae chromosome XI, complet...    72   4e-12
ref|NC_001133.1| Saccharomyces cerevisiae chromosome I, complete...    72   4e-12
>ref|NC_001143.1| Saccharomyces cerevisiae chromosome XI, complete chromosome
sequence
           Length = 666445
 Score = 71.9 bits (36), Expect = 4e-12
 Identities = 75/88 (85%)
 Strand = Plus / Plus
Query: 946     attactgttacttcctgtgagtctggtgtctgctctgaaaccgcttctcccgctattgtt 1005
               ||||| |||||||| ||||||||||||||||| || ||||| ||||| || ||||| |||
Sbjct: 648979 attacggttacttcttgtgagtctggtgtctgttccgaaactgcttcacctgctatcgtt 649038

Query: 1006   tccacagccacaaccaccatcaatgatg 1033
              || |||||||| | ||| |||||||||
Sbjct: 649039 tcgacagccactgctaccgtcaatgatg 649066

 Score = 71.9 bits (36), Expect = 4e-12
 Identities = 75/88 (85%)
 Strand = Plus / Plus

Query: 1099   attactgttacttcctgtgagtctggtgtctgctctgaaaccgcttctcccgctattgtt 1158
              ||||| |||||||| ||||||||||||||||| || ||||| ||||| || ||||| |||
Sbjct: 648979 attacggttacttcttgtgagtctggtgtctgttccgaaactgcttcacctgctatcgtt 649038

Query: 1159   tccacagccacaaccaccatcaatgatg 1186
              || |||||||| | ||| |||||||||
Sbjct: 649039 tcgacagccactgctaccgtcaatgatg 649066

 Score = 44.1 bits (22), Expect = 0.001
 Identities = 31/34 (91%)
 Strand = Plus / Plus

Query: 1479   atctagcaccgcctctttagaaatgtcaagctac 1512
              |||||| || ||||||||||| ||||||||||||
$ cd ~/work/blast/bayanus/
$ curl -o 12.genome.fasta quot;http://eutils.ncbi.nlm.nih.gov/entrez/eutils/
efetch.fcgi?
db=genome&id=NC_001143.1&seq_start=648879&seq_stop=649166&strand=1&rettype=fastaquot;




>gi|6322623:648879-649066 Saccharomyces cerevisiae chromosome XI, complete
chromosome sequence
CATCAATGGGATTACCACTGAATATACTACATGGTGCCCTCTTTCTGCTACGGAATTAACAACGGTAAGT
AAATTAGAGTCAGAAGAAAAAACCACCCTAATTACGGTTACTTCTTGTGAGTCTGGTGTCTGTTCCGAAA
CTGCTTCACCTGCTATCGTTTCGACAGCCACTGCTACCGTCAATGATG
•
    •
•
    •
    •
    •
        •
    •
        •

•
•
    •
    •
    •
    •
jsmbp:~ sesejun$ sudo port -d selfupdate
(                      PC


jsmbp:~ sesejun$ sudo port -d install ImageMagick

jsmbp:~ sesejun$ sudo port -d install ghostscript
•
•
•
jsmbp:~ sesejun$ mkdir bin
jsmbp:~ sesejun$ cd bin
jsmbp:~/bin sesejun$ lftp ftp://emboss.open-bio.org/pub/EMBOSS
lftp emboss.open-bio.org:/pub/EMBOSS> mget EMBOSS-5.0.0.tar.gz
(
lftp emboss.open-bio.org:/pub/EMBOSS> quit
jsmbp:~/bin sesejun$ tar zxvf EMBOSS-5.0.0.tar.gz
(
jsmbp:~/bin sesejun$ cd EMBOSS-5.0.0
jsmbp:~/bin sesejun$ ./configure
(
jsmbp:~/bin sesejun$ make
(
•
    •
•
    •
•
    •
    •
•
    •
    •
•
   •



$ ~/bin/EMBOSS-5.0.0/emboss/dotmatcher 12.genome.fasta 12.fasta
-graph ps -threshold 35 -goutfile 12.fasta
  12.fasta.ps
$ convert 12.fasta.ps 12.fasta.png
  ImageMagick
$ open 12.fasta.png
  12.fasta.png
A    T    G    C    S    W    R    Y    K    M    B    V    H    D    N    U
A    5   -4   -4   -4   -4    1    1   -4   -4    1   -4   -1   -1   -1   -2   -4
T   -4    5   -4   -4   -4    1   -4    1    1   -4   -1   -4   -1   -1   -2    5
G   -4   -4    5   -4    1   -4    1   -4    1   -4   -1   -1   -4   -1   -2   -4
C   -4   -4   -4    5    1   -4   -4    1   -4    1   -1   -1   -1   -4   -2   -4
S   -4   -4    1    1   -1   -4   -2   -2   -2   -2   -1   -1   -3   -3   -1   -4
W    1    1   -4   -4   -4   -1   -2   -2   -2   -2   -3   -3   -1   -1   -1    1
R    1   -4    1   -4   -2   -2   -1   -4   -2   -2   -3   -1   -3   -1   -1   -4
Y   -4    1   -4    1   -2   -2   -4   -1   -2   -2   -1   -3   -1   -3   -1    1
K   -4    1    1   -4   -2   -2   -2   -2   -1   -4   -1   -3   -3   -1   -1    1
M    1   -4   -4    1   -2   -2   -2   -2   -4   -1   -3   -1   -1   -3   -1   -4
B   -4   -1   -1   -1   -1   -3   -3   -1   -1   -3   -1   -2   -2   -2   -1   -1
V   -1   -4   -1   -1   -1   -3   -1   -3   -3   -1   -2   -1   -2   -2   -1   -4
H   -1   -1   -4   -1   -3   -1   -3   -1   -3   -1   -2   -2   -1   -2   -1   -1
D   -1   -1   -1   -4   -3   -1   -1   -3   -1   -3   -2   -2   -2   -1   -1   -1
N   -2   -2   -2   -2   -1   -1   -1   -1   -1   -1   -1   -1   -1   -1   -1   -2
U   -4    5   -4   -4   -4    1   -4    1    1   -4   -1   -4   -1   -1   -2    5
•
•
    •
    •
    •
    •
•
    •
        •
    •
        •
#!/bin/bash

for i in *.fasta.result;do
  n=`echo $i | sed 's/..*//'`
  echo $n
  url=`ruby blastparse.rb $n.fasta.result`
  case $url in
       http*)
           echo $url
           curl -s -o $n.genome.fasta $url
           ~/bin/EMBOSS-5.0.0/emboss/dotmatcher $n.genome.fasta
$n.fasta -graph ps -threshold 35 -goutfile $n.fasta
           convert $n.fasta.ps $n.fasta.png
           ;;
  esac
done



10
http://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi?
db=genome&id=NC_001142.1&seq_start=722530&seq_stop=723085&strand
=2&rettype=fasta
Displays a thresholded dotplot of two sequences
Created 10.fasta.ps
101
http://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi?
db=genome&id=NC_001146.1&seq_start=57506&seq_stop=57900&strand=1
&rettype=fasta
Displays a thresholded dotplot of two sequences
Created 101.fasta.ps
•
•
    •
    1.
    2.
    3.
    4.
•

•

Contenu connexe

Similaire à bioinfo_6th_20070720

Genetic Algorithm (GA) Optimization - Step-by-Step Example
Genetic Algorithm (GA) Optimization - Step-by-Step ExampleGenetic Algorithm (GA) Optimization - Step-by-Step Example
Genetic Algorithm (GA) Optimization - Step-by-Step ExampleAhmed Gad
 
2016.09.28TOPIC REVIEW• Exam • PS2 Sequence Alignment .docx
2016.09.28TOPIC REVIEW• Exam • PS2 Sequence Alignment .docx2016.09.28TOPIC REVIEW• Exam • PS2 Sequence Alignment .docx
2016.09.28TOPIC REVIEW• Exam • PS2 Sequence Alignment .docxfelicidaddinwoodie
 
PSLDoc: Protein subcellular localization prediction based on gapped-dipeptide...
PSLDoc: Protein subcellular localization prediction based on gapped-dipeptide...PSLDoc: Protein subcellular localization prediction based on gapped-dipeptide...
PSLDoc: Protein subcellular localization prediction based on gapped-dipeptide...JIA-MING CHANG
 
вестник южно уральского-государственного_университета._серия_математика._меха...
вестник южно уральского-государственного_университета._серия_математика._меха...вестник южно уральского-государственного_университета._серия_математика._меха...
вестник южно уральского-государственного_университета._серия_математика._меха...Иван Иванов
 
Gráfico ponto cruz em PDF
Gráfico ponto cruz em PDFGráfico ponto cruz em PDF
Gráfico ponto cruz em PDFcelsomaria
 
AP EAMCET 2016 Engineering Answer Key
AP EAMCET 2016 Engineering Answer KeyAP EAMCET 2016 Engineering Answer Key
AP EAMCET 2016 Engineering Answer KeyEneutron
 
AP EAMCET 2016 Medical Answer Key
AP EAMCET 2016 Medical Answer KeyAP EAMCET 2016 Medical Answer Key
AP EAMCET 2016 Medical Answer KeyEneutron
 
Mechanical Set Packers
Mechanical Set PackersMechanical Set Packers
Mechanical Set Packersdicoiltools
 
RNASeqR: RNA-Seq workflow for case-control study
RNASeqR: RNA-Seq workflow for case-control studyRNASeqR: RNA-Seq workflow for case-control study
RNASeqR: RNA-Seq workflow for case-control studyKuanHaoChao
 
三菱Plc
三菱Plc三菱Plc
三菱Plcwxm1109
 

Similaire à bioinfo_6th_20070720 (20)

Sequence Analysis.ppt
Sequence Analysis.pptSequence Analysis.ppt
Sequence Analysis.ppt
 
Genetic Algorithm (GA) Optimization - Step-by-Step Example
Genetic Algorithm (GA) Optimization - Step-by-Step ExampleGenetic Algorithm (GA) Optimization - Step-by-Step Example
Genetic Algorithm (GA) Optimization - Step-by-Step Example
 
2016.09.28TOPIC REVIEW• Exam • PS2 Sequence Alignment .docx
2016.09.28TOPIC REVIEW• Exam • PS2 Sequence Alignment .docx2016.09.28TOPIC REVIEW• Exam • PS2 Sequence Alignment .docx
2016.09.28TOPIC REVIEW• Exam • PS2 Sequence Alignment .docx
 
PSLDoc: Protein subcellular localization prediction based on gapped-dipeptide...
PSLDoc: Protein subcellular localization prediction based on gapped-dipeptide...PSLDoc: Protein subcellular localization prediction based on gapped-dipeptide...
PSLDoc: Protein subcellular localization prediction based on gapped-dipeptide...
 
вестник южно уральского-государственного_университета._серия_математика._меха...
вестник южно уральского-государственного_университета._серия_математика._меха...вестник южно уральского-государственного_университета._серия_математика._меха...
вестник южно уральского-государственного_университета._серия_математика._меха...
 
Accelerate performance
Accelerate performanceAccelerate performance
Accelerate performance
 
How to caculus
How to caculusHow to caculus
How to caculus
 
4
44
4
 
Gráfico ponto cruz em PDF
Gráfico ponto cruz em PDFGráfico ponto cruz em PDF
Gráfico ponto cruz em PDF
 
AP EAMCET 2016 Engineering Answer Key
AP EAMCET 2016 Engineering Answer KeyAP EAMCET 2016 Engineering Answer Key
AP EAMCET 2016 Engineering Answer Key
 
AP EAMCET 2016 Medical Answer Key
AP EAMCET 2016 Medical Answer KeyAP EAMCET 2016 Medical Answer Key
AP EAMCET 2016 Medical Answer Key
 
Sanitary Adapters
Sanitary AdaptersSanitary Adapters
Sanitary Adapters
 
Zynga adder
Zynga adderZynga adder
Zynga adder
 
Mechanical Set Packers
Mechanical Set PackersMechanical Set Packers
Mechanical Set Packers
 
งานคอม9 16
งานคอม9 16งานคอม9 16
งานคอม9 16
 
Similarity
SimilaritySimilarity
Similarity
 
Dmxchart
DmxchartDmxchart
Dmxchart
 
RNASeqR: RNA-Seq workflow for case-control study
RNASeqR: RNA-Seq workflow for case-control studyRNASeqR: RNA-Seq workflow for case-control study
RNASeqR: RNA-Seq workflow for case-control study
 
三菱Plc
三菱Plc三菱Plc
三菱Plc
 
Allegato 2
Allegato 2Allegato 2
Allegato 2
 

Plus de sesejun

RNAseqによる変動遺伝子抽出の統計: A Review
RNAseqによる変動遺伝子抽出の統計: A ReviewRNAseqによる変動遺伝子抽出の統計: A Review
RNAseqによる変動遺伝子抽出の統計: A Reviewsesejun
 
バイオインフォマティクスによる遺伝子発現解析
バイオインフォマティクスによる遺伝子発現解析バイオインフォマティクスによる遺伝子発現解析
バイオインフォマティクスによる遺伝子発現解析sesejun
 
次世代シーケンサが求める機械学習
次世代シーケンサが求める機械学習次世代シーケンサが求める機械学習
次世代シーケンサが求める機械学習sesejun
 
20110602labseminar pub
20110602labseminar pub20110602labseminar pub
20110602labseminar pubsesejun
 
20110524zurichngs 2nd pub
20110524zurichngs 2nd pub20110524zurichngs 2nd pub
20110524zurichngs 2nd pubsesejun
 
20110524zurichngs 1st pub
20110524zurichngs 1st pub20110524zurichngs 1st pub
20110524zurichngs 1st pubsesejun
 
20110214nips2010 read
20110214nips2010 read20110214nips2010 read
20110214nips2010 readsesejun
 
Datamining 9th association_rule.key
Datamining 9th association_rule.keyDatamining 9th association_rule.key
Datamining 9th association_rule.keysesejun
 
Datamining 8th hclustering
Datamining 8th hclusteringDatamining 8th hclustering
Datamining 8th hclusteringsesejun
 
Datamining r 4th
Datamining r 4thDatamining r 4th
Datamining r 4thsesejun
 
Datamining r 3rd
Datamining r 3rdDatamining r 3rd
Datamining r 3rdsesejun
 
Datamining r 2nd
Datamining r 2ndDatamining r 2nd
Datamining r 2ndsesejun
 
Datamining r 1st
Datamining r 1stDatamining r 1st
Datamining r 1stsesejun
 
Datamining 6th svm
Datamining 6th svmDatamining 6th svm
Datamining 6th svmsesejun
 
Datamining 5th knn
Datamining 5th knnDatamining 5th knn
Datamining 5th knnsesejun
 
Datamining 4th adaboost
Datamining 4th adaboostDatamining 4th adaboost
Datamining 4th adaboostsesejun
 
Datamining 3rd naivebayes
Datamining 3rd naivebayesDatamining 3rd naivebayes
Datamining 3rd naivebayessesejun
 
Datamining 2nd decisiontree
Datamining 2nd decisiontreeDatamining 2nd decisiontree
Datamining 2nd decisiontreesesejun
 
Datamining 7th kmeans
Datamining 7th kmeansDatamining 7th kmeans
Datamining 7th kmeanssesejun
 
100401 Bioinfoinfra
100401 Bioinfoinfra100401 Bioinfoinfra
100401 Bioinfoinfrasesejun
 

Plus de sesejun (20)

RNAseqによる変動遺伝子抽出の統計: A Review
RNAseqによる変動遺伝子抽出の統計: A ReviewRNAseqによる変動遺伝子抽出の統計: A Review
RNAseqによる変動遺伝子抽出の統計: A Review
 
バイオインフォマティクスによる遺伝子発現解析
バイオインフォマティクスによる遺伝子発現解析バイオインフォマティクスによる遺伝子発現解析
バイオインフォマティクスによる遺伝子発現解析
 
次世代シーケンサが求める機械学習
次世代シーケンサが求める機械学習次世代シーケンサが求める機械学習
次世代シーケンサが求める機械学習
 
20110602labseminar pub
20110602labseminar pub20110602labseminar pub
20110602labseminar pub
 
20110524zurichngs 2nd pub
20110524zurichngs 2nd pub20110524zurichngs 2nd pub
20110524zurichngs 2nd pub
 
20110524zurichngs 1st pub
20110524zurichngs 1st pub20110524zurichngs 1st pub
20110524zurichngs 1st pub
 
20110214nips2010 read
20110214nips2010 read20110214nips2010 read
20110214nips2010 read
 
Datamining 9th association_rule.key
Datamining 9th association_rule.keyDatamining 9th association_rule.key
Datamining 9th association_rule.key
 
Datamining 8th hclustering
Datamining 8th hclusteringDatamining 8th hclustering
Datamining 8th hclustering
 
Datamining r 4th
Datamining r 4thDatamining r 4th
Datamining r 4th
 
Datamining r 3rd
Datamining r 3rdDatamining r 3rd
Datamining r 3rd
 
Datamining r 2nd
Datamining r 2ndDatamining r 2nd
Datamining r 2nd
 
Datamining r 1st
Datamining r 1stDatamining r 1st
Datamining r 1st
 
Datamining 6th svm
Datamining 6th svmDatamining 6th svm
Datamining 6th svm
 
Datamining 5th knn
Datamining 5th knnDatamining 5th knn
Datamining 5th knn
 
Datamining 4th adaboost
Datamining 4th adaboostDatamining 4th adaboost
Datamining 4th adaboost
 
Datamining 3rd naivebayes
Datamining 3rd naivebayesDatamining 3rd naivebayes
Datamining 3rd naivebayes
 
Datamining 2nd decisiontree
Datamining 2nd decisiontreeDatamining 2nd decisiontree
Datamining 2nd decisiontree
 
Datamining 7th kmeans
Datamining 7th kmeansDatamining 7th kmeans
Datamining 7th kmeans
 
100401 Bioinfoinfra
100401 Bioinfoinfra100401 Bioinfoinfra
100401 Bioinfoinfra
 

Dernier

Axa Assurance Maroc - Insurer Innovation Award 2024
Axa Assurance Maroc - Insurer Innovation Award 2024Axa Assurance Maroc - Insurer Innovation Award 2024
Axa Assurance Maroc - Insurer Innovation Award 2024The Digital Insurer
 
presentation ICT roal in 21st century education
presentation ICT roal in 21st century educationpresentation ICT roal in 21st century education
presentation ICT roal in 21st century educationjfdjdjcjdnsjd
 
What Are The Drone Anti-jamming Systems Technology?
What Are The Drone Anti-jamming Systems Technology?What Are The Drone Anti-jamming Systems Technology?
What Are The Drone Anti-jamming Systems Technology?Antenna Manufacturer Coco
 
GenAI Risks & Security Meetup 01052024.pdf
GenAI Risks & Security Meetup 01052024.pdfGenAI Risks & Security Meetup 01052024.pdf
GenAI Risks & Security Meetup 01052024.pdflior mazor
 
Finology Group – Insurtech Innovation Award 2024
Finology Group – Insurtech Innovation Award 2024Finology Group – Insurtech Innovation Award 2024
Finology Group – Insurtech Innovation Award 2024The Digital Insurer
 
Partners Life - Insurer Innovation Award 2024
Partners Life - Insurer Innovation Award 2024Partners Life - Insurer Innovation Award 2024
Partners Life - Insurer Innovation Award 2024The Digital Insurer
 
Strategies for Landing an Oracle DBA Job as a Fresher
Strategies for Landing an Oracle DBA Job as a FresherStrategies for Landing an Oracle DBA Job as a Fresher
Strategies for Landing an Oracle DBA Job as a FresherRemote DBA Services
 
Scaling API-first – The story of a global engineering organization
Scaling API-first – The story of a global engineering organizationScaling API-first – The story of a global engineering organization
Scaling API-first – The story of a global engineering organizationRadu Cotescu
 
ProductAnonymous-April2024-WinProductDiscovery-MelissaKlemke
ProductAnonymous-April2024-WinProductDiscovery-MelissaKlemkeProductAnonymous-April2024-WinProductDiscovery-MelissaKlemke
ProductAnonymous-April2024-WinProductDiscovery-MelissaKlemkeProduct Anonymous
 
Handwritten Text Recognition for manuscripts and early printed texts
Handwritten Text Recognition for manuscripts and early printed textsHandwritten Text Recognition for manuscripts and early printed texts
Handwritten Text Recognition for manuscripts and early printed textsMaria Levchenko
 
TrustArc Webinar - Unlock the Power of AI-Driven Data Discovery
TrustArc Webinar - Unlock the Power of AI-Driven Data DiscoveryTrustArc Webinar - Unlock the Power of AI-Driven Data Discovery
TrustArc Webinar - Unlock the Power of AI-Driven Data DiscoveryTrustArc
 
Data Cloud, More than a CDP by Matt Robison
Data Cloud, More than a CDP by Matt RobisonData Cloud, More than a CDP by Matt Robison
Data Cloud, More than a CDP by Matt RobisonAnna Loughnan Colquhoun
 
Exploring the Future Potential of AI-Enabled Smartphone Processors
Exploring the Future Potential of AI-Enabled Smartphone ProcessorsExploring the Future Potential of AI-Enabled Smartphone Processors
Exploring the Future Potential of AI-Enabled Smartphone Processorsdebabhi2
 
Automating Google Workspace (GWS) & more with Apps Script
Automating Google Workspace (GWS) & more with Apps ScriptAutomating Google Workspace (GWS) & more with Apps Script
Automating Google Workspace (GWS) & more with Apps Scriptwesley chun
 
From Event to Action: Accelerate Your Decision Making with Real-Time Automation
From Event to Action: Accelerate Your Decision Making with Real-Time AutomationFrom Event to Action: Accelerate Your Decision Making with Real-Time Automation
From Event to Action: Accelerate Your Decision Making with Real-Time AutomationSafe Software
 
Real Time Object Detection Using Open CV
Real Time Object Detection Using Open CVReal Time Object Detection Using Open CV
Real Time Object Detection Using Open CVKhem
 
GenCyber Cyber Security Day Presentation
GenCyber Cyber Security Day PresentationGenCyber Cyber Security Day Presentation
GenCyber Cyber Security Day PresentationMichael W. Hawkins
 
A Domino Admins Adventures (Engage 2024)
A Domino Admins Adventures (Engage 2024)A Domino Admins Adventures (Engage 2024)
A Domino Admins Adventures (Engage 2024)Gabriella Davis
 
Boost PC performance: How more available memory can improve productivity
Boost PC performance: How more available memory can improve productivityBoost PC performance: How more available memory can improve productivity
Boost PC performance: How more available memory can improve productivityPrincipled Technologies
 

Dernier (20)

Axa Assurance Maroc - Insurer Innovation Award 2024
Axa Assurance Maroc - Insurer Innovation Award 2024Axa Assurance Maroc - Insurer Innovation Award 2024
Axa Assurance Maroc - Insurer Innovation Award 2024
 
presentation ICT roal in 21st century education
presentation ICT roal in 21st century educationpresentation ICT roal in 21st century education
presentation ICT roal in 21st century education
 
What Are The Drone Anti-jamming Systems Technology?
What Are The Drone Anti-jamming Systems Technology?What Are The Drone Anti-jamming Systems Technology?
What Are The Drone Anti-jamming Systems Technology?
 
GenAI Risks & Security Meetup 01052024.pdf
GenAI Risks & Security Meetup 01052024.pdfGenAI Risks & Security Meetup 01052024.pdf
GenAI Risks & Security Meetup 01052024.pdf
 
Finology Group – Insurtech Innovation Award 2024
Finology Group – Insurtech Innovation Award 2024Finology Group – Insurtech Innovation Award 2024
Finology Group – Insurtech Innovation Award 2024
 
Partners Life - Insurer Innovation Award 2024
Partners Life - Insurer Innovation Award 2024Partners Life - Insurer Innovation Award 2024
Partners Life - Insurer Innovation Award 2024
 
Strategies for Landing an Oracle DBA Job as a Fresher
Strategies for Landing an Oracle DBA Job as a FresherStrategies for Landing an Oracle DBA Job as a Fresher
Strategies for Landing an Oracle DBA Job as a Fresher
 
Scaling API-first – The story of a global engineering organization
Scaling API-first – The story of a global engineering organizationScaling API-first – The story of a global engineering organization
Scaling API-first – The story of a global engineering organization
 
ProductAnonymous-April2024-WinProductDiscovery-MelissaKlemke
ProductAnonymous-April2024-WinProductDiscovery-MelissaKlemkeProductAnonymous-April2024-WinProductDiscovery-MelissaKlemke
ProductAnonymous-April2024-WinProductDiscovery-MelissaKlemke
 
Handwritten Text Recognition for manuscripts and early printed texts
Handwritten Text Recognition for manuscripts and early printed textsHandwritten Text Recognition for manuscripts and early printed texts
Handwritten Text Recognition for manuscripts and early printed texts
 
TrustArc Webinar - Unlock the Power of AI-Driven Data Discovery
TrustArc Webinar - Unlock the Power of AI-Driven Data DiscoveryTrustArc Webinar - Unlock the Power of AI-Driven Data Discovery
TrustArc Webinar - Unlock the Power of AI-Driven Data Discovery
 
Data Cloud, More than a CDP by Matt Robison
Data Cloud, More than a CDP by Matt RobisonData Cloud, More than a CDP by Matt Robison
Data Cloud, More than a CDP by Matt Robison
 
+971581248768>> SAFE AND ORIGINAL ABORTION PILLS FOR SALE IN DUBAI AND ABUDHA...
+971581248768>> SAFE AND ORIGINAL ABORTION PILLS FOR SALE IN DUBAI AND ABUDHA...+971581248768>> SAFE AND ORIGINAL ABORTION PILLS FOR SALE IN DUBAI AND ABUDHA...
+971581248768>> SAFE AND ORIGINAL ABORTION PILLS FOR SALE IN DUBAI AND ABUDHA...
 
Exploring the Future Potential of AI-Enabled Smartphone Processors
Exploring the Future Potential of AI-Enabled Smartphone ProcessorsExploring the Future Potential of AI-Enabled Smartphone Processors
Exploring the Future Potential of AI-Enabled Smartphone Processors
 
Automating Google Workspace (GWS) & more with Apps Script
Automating Google Workspace (GWS) & more with Apps ScriptAutomating Google Workspace (GWS) & more with Apps Script
Automating Google Workspace (GWS) & more with Apps Script
 
From Event to Action: Accelerate Your Decision Making with Real-Time Automation
From Event to Action: Accelerate Your Decision Making with Real-Time AutomationFrom Event to Action: Accelerate Your Decision Making with Real-Time Automation
From Event to Action: Accelerate Your Decision Making with Real-Time Automation
 
Real Time Object Detection Using Open CV
Real Time Object Detection Using Open CVReal Time Object Detection Using Open CV
Real Time Object Detection Using Open CV
 
GenCyber Cyber Security Day Presentation
GenCyber Cyber Security Day PresentationGenCyber Cyber Security Day Presentation
GenCyber Cyber Security Day Presentation
 
A Domino Admins Adventures (Engage 2024)
A Domino Admins Adventures (Engage 2024)A Domino Admins Adventures (Engage 2024)
A Domino Admins Adventures (Engage 2024)
 
Boost PC performance: How more available memory can improve productivity
Boost PC performance: How more available memory can improve productivityBoost PC performance: How more available memory can improve productivity
Boost PC performance: How more available memory can improve productivity
 

bioinfo_6th_20070720

  • 1. • • • •
  • 2.
  • 3. • • GCATGCAT A C G T T C G T
  • 4. • • • • • • •
  • 5. • • BLASTN 2.2.16 [Mar-25-2007] Reference: Altschul, Stephen F., Thomas L. Madden, Alejandro A. Schaffer, Jinghui Zhang, Zheng Zhang, Webb Miller, and David J. Lipman (1997), quot;Gapped BLAST and PSI-BLAST: a new generation of protein database search programsquot;, Nucleic Acids Res. 25:3389-3402. Query= ORFN:12 Multiple, Contig c912 1285-2874 reverse complement (1590 letters) Database: yeast.nt 17 sequences; 12,155,026 total letters Searching..................................................done Score E Sequences producing significant alignments: (bits) Value ref|NC_001143.1| Saccharomyces cerevisiae chromosome XI, complet... 72 4e-12 ref|NC_001133.1| Saccharomyces cerevisiae chromosome I, complete... 72 4e-12
  • 6. >ref|NC_001143.1| Saccharomyces cerevisiae chromosome XI, complete chromosome sequence Length = 666445 Score = 71.9 bits (36), Expect = 4e-12 Identities = 75/88 (85%) Strand = Plus / Plus Query: 946 attactgttacttcctgtgagtctggtgtctgctctgaaaccgcttctcccgctattgtt 1005 ||||| |||||||| ||||||||||||||||| || ||||| ||||| || ||||| ||| Sbjct: 648979 attacggttacttcttgtgagtctggtgtctgttccgaaactgcttcacctgctatcgtt 649038 Query: 1006 tccacagccacaaccaccatcaatgatg 1033 || |||||||| | ||| ||||||||| Sbjct: 649039 tcgacagccactgctaccgtcaatgatg 649066 Score = 71.9 bits (36), Expect = 4e-12 Identities = 75/88 (85%) Strand = Plus / Plus Query: 1099 attactgttacttcctgtgagtctggtgtctgctctgaaaccgcttctcccgctattgtt 1158 ||||| |||||||| ||||||||||||||||| || ||||| ||||| || ||||| ||| Sbjct: 648979 attacggttacttcttgtgagtctggtgtctgttccgaaactgcttcacctgctatcgtt 649038 Query: 1159 tccacagccacaaccaccatcaatgatg 1186 || |||||||| | ||| ||||||||| Sbjct: 649039 tcgacagccactgctaccgtcaatgatg 649066 Score = 44.1 bits (22), Expect = 0.001 Identities = 31/34 (91%) Strand = Plus / Plus Query: 1479 atctagcaccgcctctttagaaatgtcaagctac 1512 |||||| || ||||||||||| ||||||||||||
  • 7. $ cd ~/work/blast/bayanus/ $ curl -o 12.genome.fasta quot;http://eutils.ncbi.nlm.nih.gov/entrez/eutils/ efetch.fcgi? db=genome&id=NC_001143.1&seq_start=648879&seq_stop=649166&strand=1&rettype=fastaquot; >gi|6322623:648879-649066 Saccharomyces cerevisiae chromosome XI, complete chromosome sequence CATCAATGGGATTACCACTGAATATACTACATGGTGCCCTCTTTCTGCTACGGAATTAACAACGGTAAGT AAATTAGAGTCAGAAGAAAAAACCACCCTAATTACGGTTACTTCTTGTGAGTCTGGTGTCTGTTCCGAAA CTGCTTCACCTGCTATCGTTTCGACAGCCACTGCTACCGTCAATGATG
  • 8. • • • • • • • • •
  • 9. • • • • jsmbp:~ sesejun$ sudo port -d selfupdate ( PC jsmbp:~ sesejun$ sudo port -d install ImageMagick jsmbp:~ sesejun$ sudo port -d install ghostscript
  • 10. • • • jsmbp:~ sesejun$ mkdir bin jsmbp:~ sesejun$ cd bin jsmbp:~/bin sesejun$ lftp ftp://emboss.open-bio.org/pub/EMBOSS lftp emboss.open-bio.org:/pub/EMBOSS> mget EMBOSS-5.0.0.tar.gz ( lftp emboss.open-bio.org:/pub/EMBOSS> quit jsmbp:~/bin sesejun$ tar zxvf EMBOSS-5.0.0.tar.gz ( jsmbp:~/bin sesejun$ cd EMBOSS-5.0.0 jsmbp:~/bin sesejun$ ./configure ( jsmbp:~/bin sesejun$ make (
  • 11. • • • • • • • • •
  • 12. • $ ~/bin/EMBOSS-5.0.0/emboss/dotmatcher 12.genome.fasta 12.fasta -graph ps -threshold 35 -goutfile 12.fasta 12.fasta.ps $ convert 12.fasta.ps 12.fasta.png ImageMagick $ open 12.fasta.png 12.fasta.png
  • 13. A T G C S W R Y K M B V H D N U A 5 -4 -4 -4 -4 1 1 -4 -4 1 -4 -1 -1 -1 -2 -4 T -4 5 -4 -4 -4 1 -4 1 1 -4 -1 -4 -1 -1 -2 5 G -4 -4 5 -4 1 -4 1 -4 1 -4 -1 -1 -4 -1 -2 -4 C -4 -4 -4 5 1 -4 -4 1 -4 1 -1 -1 -1 -4 -2 -4 S -4 -4 1 1 -1 -4 -2 -2 -2 -2 -1 -1 -3 -3 -1 -4 W 1 1 -4 -4 -4 -1 -2 -2 -2 -2 -3 -3 -1 -1 -1 1 R 1 -4 1 -4 -2 -2 -1 -4 -2 -2 -3 -1 -3 -1 -1 -4 Y -4 1 -4 1 -2 -2 -4 -1 -2 -2 -1 -3 -1 -3 -1 1 K -4 1 1 -4 -2 -2 -2 -2 -1 -4 -1 -3 -3 -1 -1 1 M 1 -4 -4 1 -2 -2 -2 -2 -4 -1 -3 -1 -1 -3 -1 -4 B -4 -1 -1 -1 -1 -3 -3 -1 -1 -3 -1 -2 -2 -2 -1 -1 V -1 -4 -1 -1 -1 -3 -1 -3 -3 -1 -2 -1 -2 -2 -1 -4 H -1 -1 -4 -1 -3 -1 -3 -1 -3 -1 -2 -2 -1 -2 -1 -1 D -1 -1 -1 -4 -3 -1 -1 -3 -1 -3 -2 -2 -2 -1 -1 -1 N -2 -2 -2 -2 -1 -1 -1 -1 -1 -1 -1 -1 -1 -1 -1 -2 U -4 5 -4 -4 -4 1 -4 1 1 -4 -1 -4 -1 -1 -2 5
  • 14. • • • • • • • • • • •
  • 15.
  • 16. #!/bin/bash for i in *.fasta.result;do n=`echo $i | sed 's/..*//'` echo $n url=`ruby blastparse.rb $n.fasta.result` case $url in http*) echo $url curl -s -o $n.genome.fasta $url ~/bin/EMBOSS-5.0.0/emboss/dotmatcher $n.genome.fasta $n.fasta -graph ps -threshold 35 -goutfile $n.fasta convert $n.fasta.ps $n.fasta.png ;; esac done 10 http://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi? db=genome&id=NC_001142.1&seq_start=722530&seq_stop=723085&strand =2&rettype=fasta Displays a thresholded dotplot of two sequences Created 10.fasta.ps 101 http://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi? db=genome&id=NC_001146.1&seq_start=57506&seq_stop=57900&strand=1 &rettype=fasta Displays a thresholded dotplot of two sequences Created 101.fasta.ps
  • 17. • • • 1. 2. 3. 4. • •