Jump to content

User:EvoProgrammer

From Wikipedia, the free encyclopedia
This is an old revision of this page, as edited by EvoProgrammer (talk | contribs) at 00:41, 21 May 2015. The present address (URL) is a permanent link to this revision, which may differ significantly from the current revision.

Human Genome Project

Python Source Code

def getCodonList():
	"""Build and return a new codon -> amino-acid lookup table.

	Keys are three-letter uppercase DNA codons (A/C/G/T). Values are
	one-letter amino-acid codes, except for the three stop codons, which
	map to the string 'stop'. A fresh dict is created on every call, so
	callers may modify the result without affecting each other.
	"""
	# One row per amino acid: (code, space-separated codons that encode it).
	groups = (
		('I', 'ATT ATC ATA'),
		('L', 'CTT CTC CTA CTG TTA TTG'),
		('V', 'GTT GTC GTA GTG'),
		('F', 'TTT TTC'),
		('M', 'ATG'),
		('C', 'TGT TGC'),
		('A', 'GCT GCC GCA GCG'),
		('G', 'GGT GGC GGA GGG'),
		('P', 'CCT CCC CCA CCG'),
		('T', 'ACT ACC ACA ACG'),
		('S', 'TCT TCC TCA TCG AGT AGC'),
		('Y', 'TAT TAC'),
		('W', 'TGG'),
		('Q', 'CAA CAG'),
		('N', 'AAT AAC'),
		('H', 'CAT CAC'),
		('E', 'GAA GAG'),
		('D', 'GAT GAC'),
		('K', 'AAA AAG'),
		('R', 'CGT CGC CGA CGG AGA AGG'),
		('stop', 'TAA TAG TGA'),
	)
	table = {}
	for amino, codons in groups:
		for codon in codons.split():
			table[codon] = amino
	return table

def getCodon(s):
	"""Return the amino-acid code for the codon ``s`` as a string.

	The lookup goes through the table produced by getCodonList(); a codon
	that is not a key of that table raises KeyError.
	"""
	table = getCodonList()
	amino = table[s]
	return str(amino)
def readDNA(s):
	"""Translate a DNA string into a string of amino-acid codes.

	The sequence is read in consecutive, non-overlapping three-base codons
	starting at the first base. One or two leftover bases at the end are
	ignored. Leading/trailing whitespace is removed first and the sequence
	is upper-cased, so lines read straight from a file (with "\\n" or
	"\\r\\n" endings) and lowercase sequences are handled.

	Parameters:
		s: the DNA sequence, e.g. one line of a sequence file.

	Returns:
		The concatenated codes from getCodonList() for each codon, in
		order; stop codons contribute the literal text 'stop'.

	Raises:
		KeyError: if a complete codon is not in the codon table (for
			example because it contains a character other than A/C/G/T).
	"""
	# Strip the line ending before measuring the length: otherwise it is
	# counted as a base and can end up inside the final codon.
	s = s.strip().upper()
	# Build the table once per call instead of once per codon.
	table = getCodonList()
	# Largest multiple of three that fits; drops an incomplete last codon.
	usable = len(s) - len(s) % 3
	return "".join(str(table[s[i:i + 3]]) for i in range(0, usable, 3))
	
#program start
# Translate every line of dna.txt and print the result, one output line per
# input line. The file is opened read-only inside a `with` block so the
# handle is always closed, and it is iterated lazily rather than loaded whole.
# NOTE(review): each line is translated on its own, so a codon that straddles
# a line break is dropped and the reading frame restarts on every line --
# confirm whether dna.txt holds one wrapped sequence that should be joined.
with open('dna.txt', 'r') as f:
	for line in f:
		print(readDNA(line))

File: dna.txt

ACATTTGCTTCTGACACAACTGTGTTCACTAGCAACCTCAAACAGACACCATGGTGCATCTGACTCCTGG
GGAGAAGTCTGCCGTTACTGCCCTGTGGGGCAAGGTGAACGTGGATGAAGTTGGTGGTGAGGCCCTGGGC
AGGCTGCTGGTGGTCTACCCTTGGACCCAGAGGTTCTTTGAGTCCTTTGGGGATCTGTCCACTCCTGATG
CTGTTATGGGCAACCCTAAGGTGAAGGCTCATGGCAAGAAAGTGCTCGGTGCCTTTAGTGATGGCCTGGC
TCACCTGGACAACCTCAAGGGCACCTTTGCCACACTGAGTGAGCTGCACTGTGACAAGCTGCACGTGGAT
CCTGAGAACTTCAGGCTCCTGGGCAACGTGCTGGTCTGTGTGCTGGCCCATCACTTTGGCAAAGAATTCA
CCCCACCAGTGCAGGCTGCCTATCAGAAAGTGGTGGCTGGTGTGGCTAATGCCCTGGCCCACAAGTATCA
CTAAGCTCGCTTTCTTGCTGTCCAATTTCTATTAAAGGTTCCTTTGTTCCCTAAGTCCAACTACTAAACT
GGGGGATATTATGAAGGGCCTTGAGCATCTGGATTCTGCCTAATAAAAAACATTTATTTTCATTGC