0% found this document useful (0 votes)

319 views

BioInfo2 Assignment - Python

The document describes the process of translating DNA into proteins. It involves: (1) transcribing DNA into RNA; (2) translating RNA into amino acids by reading the RNA codons in groups of three; and (3) defining functions that translate the six reading frames (three on the DNA strand and three on its complement) to find all possible proteins.

Uploaded by

Jin Yeow

Available Formats

Download as DOCX, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

319 views

BioInfo2 Assignment - Python

Uploaded by

Jin Yeow

Available Formats

Download as DOCX, PDF, TXT or read online on Scribd

You are on page 1/ 11

#Task 1: Translating DNA into proteins.

#a. First transcribe DNA to RNA

#b. Translate RNA to amino acids

from string import *  # Python 2 string module; brings maketrans() into scope

# Prompt the user for the DNA sequence (raw_input is the Python 2 line reader).
seq = raw_input("Enter a seqeunce : ")

print("")

# Normalise to uppercase so lowercase input is accepted by the base check
# and matches the uppercase keys used for translation.
seq = seq.upper()

# Amino-acid lookup: RNA codon -> one-letter amino-acid symbol.
# Only the 61 sense codons are listed here; stop codons are added below.
table = {
    'UUU': 'F', 'UUC': 'F', 'UUA': 'L', 'UUG': 'L', 'UCU': 'S',
    'UCC': 'S', 'UCA': 'S', 'UCG': 'S', 'UAU': 'Y', 'UAC': 'Y',
    'UGU': 'C', 'UGC': 'C', 'UGG': 'W', 'CUU': 'L', 'CUC': 'L',
    'CUA': 'L', 'CUG': 'L', 'CCU': 'P', 'CCC': 'P', 'CCA': 'P',
    'CCG': 'P', 'CAU': 'H', 'CAC': 'H', 'CAA': 'Q', 'CAG': 'Q',
    'CGU': 'R', 'CGC': 'R', 'CGA': 'R', 'CGG': 'R', 'AUU': 'I',
    'AUC': 'I', 'AUA': 'I', 'AUG': 'M', 'ACU': 'T', 'ACC': 'T',
    'ACA': 'T', 'ACG': 'T', 'AAU': 'N', 'AAC': 'N', 'AAA': 'K',
    'AAG': 'K', 'AGU': 'S', 'AGC': 'S', 'AGA': 'R', 'AGG': 'R',
    'GUU': 'V', 'GUC': 'V', 'GUA': 'V', 'GUG': 'V', 'GCU': 'A',
    'GCC': 'A', 'GCA': 'A', 'GCG': 'A', 'GAU': 'D', 'GAC': 'D',
    'GAA': 'E', 'GAG': 'E', 'GGU': 'G', 'GGC': 'G', 'GGA': 'G',
    'GGG': 'G',
}

# The three stop codons (kept as a list).
stop_codons = ['UAA', 'UAG', 'UGA']

# Register every stop codon in the lookup table under the symbol '*'.
for codon in stop_codons:
    table[codon] = "*"

# Module-level result lists, one per translation routine. Each translate_*
# function appends one amino-acid symbol per codon to its own list, and the
# output section joins these lists for display.
protein = []  # whole-sequence translation (translate_dna)

protein_complementary = []  # defined here but not referenced by the visible code

protein_base1 = []  # frame starting at the 1st base (translate_dna_base1)

protein_complementary_base1 = []  # same frame on the complementary transcript

protein_base2 = []  # frame starting at the 2nd base (translate_dna_base2)

protein_complementary_base2 = []  # same frame on the complementary transcript

protein_base3 = []  # frame starting at the 3rd base (translate_dna_base3)

protein_complementary_base3 = []  # same frame on the complementary transcript

# Checker for unknown bases: every character of the (uppercased) input must be
# one of A, G, T or C. The script reports the problem and exits with status 1
# at the first character that is not, so no later step sees an invalid sequence.
for base in seq:
    if base not in ("A", "G", "T", "C"):
        print("Error in the sequence, contain unknown bases")
        exit(1)

# Character map DNA -> RNA of the pairing strand: A->U, T->A, G->C, C->G.
c = maketrans("ATGC", "UACG")

# Character map DNA -> complementary DNA: A->T, T->A, G->C, C->G.
t = maketrans("ATGC", "TACG")

# Complement of the input, in the same left-to-right order as the input.
complementary_DNA = seq.translate(t)

# RNA transcript obtained by applying map 'c' to the input sequence.
transcript_DNA = seq.translate(c)

# RNA obtained by applying map 'c' to the complementary DNA.
complementary_RNA = complementary_DNA.translate(c)

# The complementary RNA reversed, so it is read from its other end.
transcript_complementary_DNA = complementary_RNA[::-1]

def translate_dna(transcript_DNA):
    """Translate an RNA string codon by codon without stopping at stop codons.

    The string is read from index 0 in steps of three; one or two leftover
    bases at the end are ignored. Each codon is looked up in the module-level
    ``table``, so stop codons come out as whatever ``table`` maps them to.

    The symbols are stored in the module-level ``protein`` list, which the
    output section of the script reads. The list is emptied first so calling
    this function again does not append to an earlier result.

    Returns:
        The amino-acid symbols concatenated with no separator.

    Raises:
        KeyError: if a codon is not a key of ``table``.
    """
    del protein[:]  # start from an empty result on every call
    usable = len(transcript_DNA) - len(transcript_DNA) % 3
    protein.extend(table[transcript_DNA[i:i + 3]] for i in range(0, usable, 3))
    return "".join(protein)
def translate_dna_base1(transcript_DNA):
    """Translate the frame starting at the 1st base, up to the first stop codon.

    Codons are read from index 0 in steps of three; leftover bases at the end
    are ignored. The stop codon's own symbol from ``table`` is included in
    the result, and translation ends there.

    The symbols are stored in the module-level ``protein_base1`` list, which
    the output section of the script reads. The list is emptied first so a
    repeated call does not append to an earlier result.

    Returns:
        The amino-acid symbols joined by single spaces.

    Raises:
        KeyError: if a codon is not a key of ``table``.
    """
    del protein_base1[:]  # start from an empty result on every call
    usable = len(transcript_DNA) - len(transcript_DNA) % 3
    for i in range(0, usable, 3):
        codon = transcript_DNA[i:i + 3]
        protein_base1.append(table[codon])
        if codon in ('UAA', 'UAG', 'UGA'):
            break  # stop codon recorded; nothing after it is translated
    return " ".join(protein_base1)

def translate_complementary_base1(transcript_complementary_DNA):
    """Translate the complementary transcript from its 1st base to the first stop codon.

    Codons are read from index 0 in steps of three; leftover bases at the end
    are ignored. The stop codon's own symbol from ``table`` is included in
    the result, and translation ends there.

    The symbols are stored in the module-level ``protein_complementary_base1``
    list, which the output section of the script reads. The list is emptied
    first so a repeated call does not append to an earlier result.

    Returns:
        The amino-acid symbols joined by single spaces.

    Raises:
        KeyError: if a codon is not a key of ``table``.
    """
    del protein_complementary_base1[:]  # start from an empty result on every call
    length = len(transcript_complementary_DNA)
    usable = length - length % 3
    for i in range(0, usable, 3):
        codon = transcript_complementary_DNA[i:i + 3]
        protein_complementary_base1.append(table[codon])
        if codon in ('UAA', 'UAG', 'UGA'):
            break  # stop codon recorded; nothing after it is translated
    return " ".join(protein_complementary_base1)

def translate_dna_base2(transcript_DNA):
    """Translate the frame starting at the 2nd base, up to the first stop codon.

    Codons are read from index 1 in steps of three; bases that do not fill a
    complete codon at the end are ignored. The stop codon's own symbol from
    ``table`` is included in the result, and translation ends there.

    The symbols are stored in the module-level ``protein_base2`` list, which
    the output section of the script reads. The list is emptied first so a
    repeated call does not append to an earlier result.

    Returns:
        The amino-acid symbols joined by single spaces.

    Raises:
        KeyError: if a codon is not a key of ``table``.
    """
    del protein_base2[:]  # start from an empty result on every call
    remaining = len(transcript_DNA) - 1  # bases available after skipping one
    # remaining - remaining % 3 is three times the number of whole codons, which
    # is just past the last codon start (1, 4, 7, ...) in this frame.
    limit = remaining - remaining % 3
    for i in range(1, limit, 3):
        codon = transcript_DNA[i:i + 3]
        protein_base2.append(table[codon])
        if codon in ('UAA', 'UAG', 'UGA'):
            break  # stop codon recorded; nothing after it is translated
    return " ".join(protein_base2)

def translate_complementary_base2(transcript_complementary_DNA):
    """Translate the complementary transcript from its 2nd base to the first stop codon.

    Codons are read from index 1 in steps of three; bases that do not fill a
    complete codon at the end are ignored. The stop codon's own symbol from
    ``table`` is included in the result, and translation ends there.

    The symbols are stored in the module-level ``protein_complementary_base2``
    list, which the output section of the script reads. The list is emptied
    first so a repeated call does not append to an earlier result.

    Returns:
        The amino-acid symbols joined by single spaces.

    Raises:
        KeyError: if a codon is not a key of ``table``.
    """
    del protein_complementary_base2[:]  # start from an empty result on every call
    remaining = len(transcript_complementary_DNA) - 1  # bases after skipping one
    # remaining - remaining % 3 is three times the number of whole codons, which
    # is just past the last codon start (1, 4, 7, ...) in this frame.
    limit = remaining - remaining % 3
    for i in range(1, limit, 3):
        codon = transcript_complementary_DNA[i:i + 3]
        protein_complementary_base2.append(table[codon])
        if codon in ('UAA', 'UAG', 'UGA'):
            break  # stop codon recorded; nothing after it is translated
    return " ".join(protein_complementary_base2)

def translate_dna_base3(transcript_DNA):
    """Translate the frame starting at the 3rd base, up to the first stop codon.

    Codons are read from index 2 in steps of three; bases that do not fill a
    complete codon at the end are ignored. The stop codon's own symbol from
    ``table`` is included in the result, and translation ends there.

    The symbols are stored in the module-level ``protein_base3`` list, which
    the output section of the script reads. The list is emptied first so a
    repeated call does not append to an earlier result.

    Returns:
        The amino-acid symbols joined by single spaces.

    Raises:
        KeyError: if a codon is not a key of ``table``.
    """
    del protein_base3[:]  # start from an empty result on every call
    remaining = len(transcript_DNA) - 2  # bases available after skipping two
    # remaining - remaining % 3 is three times the number of whole codons, which
    # is just past the last codon start (2, 5, 8, ...) in this frame.
    limit = remaining - remaining % 3
    for i in range(2, limit, 3):
        codon = transcript_DNA[i:i + 3]
        protein_base3.append(table[codon])
        if codon in ('UAA', 'UAG', 'UGA'):
            break  # stop codon recorded; nothing after it is translated
    return " ".join(protein_base3)

def translate_complementary_base3(transcript_complementary_DNA):
    """Translate the complementary transcript from its 3rd base to the first stop codon.

    Codons are read from index 2 in steps of three; bases that do not fill a
    complete codon at the end are ignored. The stop codon's own symbol from
    ``table`` is included in the result, and translation ends there.

    The symbols are stored in the module-level ``protein_complementary_base3``
    list, which the output section of the script reads. The list is emptied
    first so a repeated call does not append to an earlier result.

    Returns:
        The amino-acid symbols joined by single spaces.

    Raises:
        KeyError: if a codon is not a key of ``table``.
    """
    del protein_complementary_base3[:]  # start from an empty result on every call
    remaining = len(transcript_complementary_DNA) - 2  # bases after skipping two
    # remaining - remaining % 3 is three times the number of whole codons, which
    # is just past the last codon start (2, 5, 8, ...) in this frame.
    limit = remaining - remaining % 3
    for i in range(2, limit, 3):
        codon = transcript_complementary_DNA[i:i + 3]
        protein_complementary_base3.append(table[codon])
        if codon in ('UAA', 'UAG', 'UGA'):
            break  # stop codon recorded; nothing after it is translated
    return " ".join(protein_complementary_base3)

# Calling of the translation functions and interface output.


def _show(label, value):
    """Print ``label`` and ``value`` separated by one space.

    This reproduces the output of the Python 2 statement ``print label, value``
    while remaining valid syntax on Python 3 as well.
    """
    print("%s %s" % (label, value))


_show("Transcription of the DNA sequence: ", transcript_DNA)
_show("The complementary of the DNA sequence is: ", complementary_DNA)
_show("The transcription of complementary DNA sequence is: ", transcript_complementary_DNA)
print("")
print("* stand for the stop codon")
print("")

# Whole-sequence translation. Each translate_* call fills a module-level list,
# which is then joined with spaces for display.
translate_dna(transcript_DNA)
pro = " ".join(protein)
_show("The translation of the DNA is: ", pro)
print("")

# Frame starting at the 1st base, on the transcript and on the complementary transcript.
translate_dna_base1(transcript_DNA)
translate_complementary_base1(transcript_complementary_DNA)
pro = " ".join(protein_base1)
_show("Translation start from the 1st base is : ", pro)
pro = " ".join(protein_complementary_base1)
_show("The translation start from the 1st base of complementary RNA is: ", pro)
print("")

# Frame starting at the 2nd base.
translate_dna_base2(transcript_DNA)
translate_complementary_base2(transcript_complementary_DNA)
pro = " ".join(protein_base2)
_show("Translation start from the 2nd base is : ", pro)
pro = " ".join(protein_complementary_base2)
_show("The translation start from the 2nd base of complementary RNA is: ", pro)
print("")

# Frame starting at the 3rd base.
translate_dna_base3(transcript_DNA)
translate_complementary_base3(transcript_complementary_DNA)
pro = " ".join(protein_base3)
_show("Translation start from the 3rd base is : ", pro)
pro = " ".join(protein_complementary_base3)
_show("The translation start from the 3rd base of complementary RNA is: ", pro)

Joanna R. Freeland - Molecular Ecology-Wiley (2020)
No ratings yet
Joanna R. Freeland - Molecular Ecology-Wiley (2020)
686 pages
Transcription and Translation Worksheet
100% (2)
Transcription and Translation Worksheet
3 pages
Transcription and Translation Worksheet 2
50% (2)
Transcription and Translation Worksheet 2
2 pages
Python_Basics_Exercises
No ratings yet
Python_Basics_Exercises
4 pages
Python
No ratings yet
Python
9 pages
Faculty of Engineering Ain Shams University Name: Ahmed Nashaat Hassanen Department: CESS Bioinformatics ID: 14P6016 Ass1
No ratings yet
Faculty of Engineering Ain Shams University Name: Ahmed Nashaat Hassanen Department: CESS Bioinformatics ID: 14P6016 Ass1
3 pages
In-Linear-Time: Check This Web Site
No ratings yet
In-Linear-Time: Check This Web Site
4 pages
Q04 - Protein Translation - 30 Marks
No ratings yet
Q04 - Protein Translation - 30 Marks
3 pages
solutionsExerciseMaster11 23
No ratings yet
solutionsExerciseMaster11 23
13 pages
The Original Sequence Provided Is
No ratings yet
The Original Sequence Provided Is
2 pages
Computer Engineering Laboratory Solution Primer
From Everand
Computer Engineering Laboratory Solution Primer
Karan Bhandari
No ratings yet
MOOC Project Work - Sequence Analysis - Data Analysis With Python 2021
No ratings yet
MOOC Project Work - Sequence Analysis - Data Analysis With Python 2021
29 pages
p3 Python Project
No ratings yet
p3 Python Project
4 pages
Manual de Ejercicios de Python
No ratings yet
Manual de Ejercicios de Python
1 page
BIO Code Report
No ratings yet
BIO Code Report
6 pages
Ass 2 Bioinformatics
No ratings yet
Ass 2 Bioinformatics
8 pages
INFO390C DNDS Pset05
No ratings yet
INFO390C DNDS Pset05
9 pages
University of Mauritius
No ratings yet
University of Mauritius
9 pages
Introduction to PHP, Part 2, Second Edition
From Everand
Introduction to PHP, Part 2, Second Edition
Adam Majczak
No ratings yet
Oracle Certified Professional Java Programmer OCPJP 1Z0 809
From Everand
Oracle Certified Professional Java Programmer OCPJP 1Z0 809
Manish Soni
No ratings yet
IDC306_Assignment_5_MS21009
No ratings yet
IDC306_Assignment_5_MS21009
4 pages
L3
No ratings yet
L3
48 pages
Protein_Synthesis_Problem
No ratings yet
Protein_Synthesis_Problem
2 pages
Eac - Protein Synthesis Worksheet
No ratings yet
Eac - Protein Synthesis Worksheet
3 pages
Lab 3
No ratings yet
Lab 3
2 pages
p2 Python Project
No ratings yet
p2 Python Project
3 pages
Assignment 01
No ratings yet
Assignment 01
4 pages
Unit 6 Practice-1
No ratings yet
Unit 6 Practice-1
1 page
UNIX Shell Programming Interview Questions You'll Most Likely Be Asked
From Everand
UNIX Shell Programming Interview Questions You'll Most Likely Be Asked
Vibrant Publishers
No ratings yet
Tut3 2022
No ratings yet
Tut3 2022
4 pages
Assignment 1
No ratings yet
Assignment 1
5 pages
g10 Protein Synthesis 2023
No ratings yet
g10 Protein Synthesis 2023
1 page
1009169194
No ratings yet
1009169194
17 pages
Amazing Java: Learn Java Quickly
From Everand
Amazing Java: Learn Java Quickly
Andrei Besedin
No ratings yet
Profound Python Data Science
From Everand
Profound Python Data Science
Onder Teker
No ratings yet
Bioinformatics HW1
No ratings yet
Bioinformatics HW1
3 pages
Exercises - Genetics - USTH2022 Hint To Research
No ratings yet
Exercises - Genetics - USTH2022 Hint To Research
18 pages
The Central Dogma of Molecular Biology
100% (1)
The Central Dogma of Molecular Biology
5 pages
150+ C Pattern Programs
From Everand
150+ C Pattern Programs
Hernando Abella
No ratings yet
HW 13
No ratings yet
HW 13
6 pages
BT3040 - BIOINFORMATICS - Assignment 4: Question 1
No ratings yet
BT3040 - BIOINFORMATICS - Assignment 4: Question 1
9 pages
Polypeptide an Sers
No ratings yet
Polypeptide an Sers
2 pages
Hasil Proyek Elisa
No ratings yet
Hasil Proyek Elisa
9 pages
Bio Python 202111
No ratings yet
Bio Python 202111
63 pages
Activity Protein Synthesis
No ratings yet
Activity Protein Synthesis
2 pages
Balauro Worksheet Protein Synthesis
100% (1)
Balauro Worksheet Protein Synthesis
4 pages
Tutorial Solution Chapter 1+2+3
No ratings yet
Tutorial Solution Chapter 1+2+3
28 pages
Genetic Code Worksheet
No ratings yet
Genetic Code Worksheet
3 pages
BioCentralDogmaWorksheet 1
No ratings yet
BioCentralDogmaWorksheet 1
3 pages
Sequence Listing
No ratings yet
Sequence Listing
11 pages
CSE 5370: Bioinformatics Homework 2: Due Thursday, February 24th, 2022 at 4:59PM CST
No ratings yet
CSE 5370: Bioinformatics Homework 2: Due Thursday, February 24th, 2022 at 4:59PM CST
3 pages
Unit 1-Enzyme Protein Syntheis Questions
100% (2)
Unit 1-Enzyme Protein Syntheis Questions
58 pages
vertopal.com_bioinf575_hw07_dmeghana (1)
No ratings yet
vertopal.com_bioinf575_hw07_dmeghana (1)
34 pages
DNA Replication Transcription and Translation
No ratings yet
DNA Replication Transcription and Translation
2 pages
Act01_OpenReadingFrames
No ratings yet
Act01_OpenReadingFrames
8 pages
CMB Activity 3
No ratings yet
CMB Activity 3
2 pages
Molecular Basis And Biodiversity class 12
No ratings yet
Molecular Basis And Biodiversity class 12
63 pages
Answers
No ratings yet
Answers
6 pages
04-Molecular basis of inheritance
No ratings yet
04-Molecular basis of inheritance
4 pages
Rust Package 100 Knocks: One-Hour Mastery Series 2024 Edition
From Everand
Rust Package 100 Knocks: One-Hour Mastery Series 2024 Edition
Kanto
No ratings yet
Lab 7 Transcription Translation 2
No ratings yet
Lab 7 Transcription Translation 2
5 pages
project
No ratings yet
project
29 pages
Summary 4º ESO - Unit 3 - Genetic Information and Nucleic Acids
No ratings yet
Summary 4º ESO - Unit 3 - Genetic Information and Nucleic Acids
89 pages
Day 3 - Transcription and RNA Processing
No ratings yet
Day 3 - Transcription and RNA Processing
50 pages
Translation Transcription Flinn Activity
No ratings yet
Translation Transcription Flinn Activity
3 pages
Rna and Its Structure, Function and Types
No ratings yet
Rna and Its Structure, Function and Types
12 pages
Chemical Technician - Preliminary Board Exam
100% (2)
Chemical Technician - Preliminary Board Exam
11 pages
DNA Worksheet
No ratings yet
DNA Worksheet
5 pages
Gateway Cloning Manual
No ratings yet
Gateway Cloning Manual
63 pages
Eukaryotic Cell Definition
No ratings yet
Eukaryotic Cell Definition
5 pages
Protein Synthesis Homework Answers
100% (1)
Protein Synthesis Homework Answers
5 pages
Membranes, Proteins, DNA and Gene Expression
No ratings yet
Membranes, Proteins, DNA and Gene Expression
15 pages
Daily Lesson Log: A. References
No ratings yet
Daily Lesson Log: A. References
5 pages
A Level Biology Topic 4 Notes
No ratings yet
A Level Biology Topic 4 Notes
41 pages
Central Dogma
No ratings yet
Central Dogma
4 pages
Structure of Ribosomes
100% (1)
Structure of Ribosomes
15 pages
BACE Exam 3.0 Biochemistry-Chemistry v5
No ratings yet
BACE Exam 3.0 Biochemistry-Chemistry v5
25 pages
Worksheet in Science 10 Q3 Module 4
No ratings yet
Worksheet in Science 10 Q3 Module 4
2 pages
Models of Life
No ratings yet
Models of Life
353 pages
Garbage Dumping Is Not A Good Idea
No ratings yet
Garbage Dumping Is Not A Good Idea
15 pages
Chapter 12 Glencoe Biology Study Guide
No ratings yet
Chapter 12 Glencoe Biology Study Guide
11 pages
Genetics: Analysis & Principles 6th Edition Robert J. Brooker All Chapter Instant Download
100% (5)
Genetics: Analysis & Principles 6th Edition Robert J. Brooker All Chapter Instant Download
53 pages
(Ebook) Study Guide for Understanding Pathophysiology by Sue E. Huether, Kathryn L. McCance & Kathryn L. McCance ISBN 9780323084895, 9789996088346, 9996088340, 0323084893 instant download
100% (2)
(Ebook) Study Guide for Understanding Pathophysiology by Sue E. Huether, Kathryn L. McCance & Kathryn L. McCance ISBN 9780323084895, 9789996088346, 9996088340, 0323084893 instant download
30 pages
Essential Cell Biology 5th Edition Bruce Alberts - The latest ebook is available for instant download now
100% (2)
Essential Cell Biology 5th Edition Bruce Alberts - The latest ebook is available for instant download now
57 pages
2023 Fy13ce Biology Detailed Solution PDF
No ratings yet
2023 Fy13ce Biology Detailed Solution PDF
32 pages
Basic Concepts in Genetics and Common Genetic Disorders
No ratings yet
Basic Concepts in Genetics and Common Genetic Disorders
88 pages
Biology Esei STPM 2017@ 2018
100% (1)
Biology Esei STPM 2017@ 2018
43 pages
Quiz On Central Dogma - BIOCHEMISTRY
No ratings yet
Quiz On Central Dogma - BIOCHEMISTRY
13 pages
01 - Intro To Central Dogma and Structure of DNA-RNA PDF
100% (1)
01 - Intro To Central Dogma and Structure of DNA-RNA PDF
5 pages
Study Guide A: Key Concept
No ratings yet
Study Guide A: Key Concept
17 pages

BioInfo2 Assignment - Python

Uploaded by

BioInfo2 Assignment - Python

Uploaded by

#Task 1: Translating DNA into proteins.

#a. First transcribe DNA to RNA

#b. Translate RNA to amino acids

from string import * //Importing string library

seq = raw_input ("Enter a seqeunce : ") //Create sequence input

seq=seq.upper() //change input sequence to uppercase by ‘.upper()’.

table = { //initialize amino acid dictionary

for codon in stop_codons: //Loop to substitute stop codon with ‘*’.

protein = [] //List of array for proteins translated from every ORF

for base in seq: //Checker for unknown bases

elif base == "G":

elif base == "T":

elif base == "C":

print "Error in the sequence, contain unknown bases"

c = maketrans("ATGC","UACG") //”maketrans()” function to convert sequence to RNA

t = maketrans("ATGC","TACG") //”maketrans()” function to convert sequence

complementary_DNA = seq.translate(t) // apply ‘t’ to create compliment dna

transcript_DNA = seq.translate(c) //apply ‘c’ to transcribe sequence

complementary_RNA = complementary_DNA.translate(c) //RNA of compliment DNA

transcript_complementary_DNA = complementary_RNA[::-1] //reverse compliment of RNA

def translate_dna(transcript_DNA): //function to translate sequence

for i in range(0, len(transcript_DNA)-len(transcript_DNA)%3, 3):

for i in range(0, len(transcript_DNA)-len(transcript_DNA)%3, 3):

elif transcript_DNA[i:i+3] == 'UAG':

elif transcript_DNA[i:i+3] == 'UGA':

return " ".join(protein_base1)

//ORF4 translate with Stop codon include

for i in range(0, len(transcript_complementary_DNA)-len(transcript_complementary_DNA)

elif transcript_complementary_DNA[i:i+3] == 'UAG':

elif transcript_complementary_DNA[i:i+3] == 'UGA':

return " ".join(protein_complementary_base1)

def translate_dna_base2(transcript_DNA): //ORF2 translate with Stop codon include

for i in range(1, ((len(transcript_DNA)-1)-(len(transcript_DNA)-1)%3), 3):

elif transcript_DNA[i:i+3] == 'UGA':

return " ".join(protein_base2)

//ORF5 translate with Stop codon include

for i in range(1, ((len(transcript_complementary_DNA)-1)-

elif transcript_complementary_DNA[i:i+3] == 'UAG':

elif transcript_complementary_DNA[i:i+3] == 'UGA':

return " ".join(protein_complementary_base2)

def translate_dna_base3(transcript_DNA): //ORF3 translate with Stop codon include

for i in range(2, ((len(transcript_DNA)-2)-(len(transcript_DNA)-2)%3), 3):

elif transcript_DNA[i:i+3] == 'UAG':

elif transcript_DNA[i:i+3] == 'UGA':

return " ".join(protein_base3)

//OR6 translate with Stop codon include

for i in range(2, ((len(transcript_complementary_DNA)-2)-

elif transcript_complementary_DNA[i:i+3] == 'UAG':

elif transcript_complementary_DNA[i:i+3] == 'UGA':

return " ".join(protein_complementary_base3)

//Calling of function and interface output

print "Transcription of the DNA sequence: ", transcript_DNA

print "The complementary of the DNA sequence is: ", complementary_DNA

print "The transcription of complementary DNA sequence is: ", transcript_complementary_DNA

print "* stand for the stop codon"

pro = " "

pro = pro.join(protein) // ’.join()’ is to create strings of output

print "The translation of the DNA is: ",pro

pro = " "

print "Translation start from the 1st base is : ", pro

pro = " "

pro = " "

print "Translation start from the 2nd base is : ", pro

pro = " "

pro = " "

pro = " "

You might also like