Professional Documents
Culture Documents
FACULTY OF AGRICULTURE
BSc (Hons) Biotechnology
#Question 1 a
# NOTE(review): `chain_a` (the multi-line protein sequence text) is expected to
# be defined here; its definition is not present in this part of the file.
#Question 1 b
# Sequence length excluding the line breaks embedded in the text.
length = len(chain_a) - chain_a.count("\n")
print("length sequence: ", length)
#Question 1 c
# Same sequence with every line break removed.
new_chain = chain_a.replace("\n", "")
print("New Chain:", new_chain)
#Question 1 d
# Number of 'C' characters in the sequence.
count = chain_a.count("C")
print("Number of C:", count)
#Question 1 e
# Search the newline-free sequence so that a motif wrapped across a line break
# is still found, and so the reported 0-based offset counts residues only.
motif = "NLRVEYLDDRN"
pos = new_chain.find(motif)
if pos != -1:
    print("yes found")
    print("Starting position :", pos)
#Question 2
# DNA sequence as pasted, wrapped over several lines.
dna_seq = """GGGCTTGTGGCGCGAGCTTCTGAAACTAGGCGGCAGAGGCGGAGCCGCT
GTGGCACTGCTGCGCCTCTGCTGCGCCTCGGGTGTCTTTT
GCGGCGGTGGGTCGCCGCCGGGAGAAGCGTGAGGGGACAG
ATTTGTGACCGGCGCGGTTTTTGTCAGCTTACTCCGGCCA AAAAAGAACTGCACCTCTGGAGCGG"""
# Remove the line breaks and the stray space left by wrapping; otherwise they
# are counted as positions by the slices below and end up in the RNA/spliced
# sequences.
dna_seq = "".join(dna_seq.split())
#Question 2 a
#Question 2 b
# Transcribe by replacing every T with U.
rna_seq = dna_seq.replace("T", "U")
#Question 2 c
# The intron occupies 0-based positions 50..155; the exons are the flanks.
exon1 = dna_seq[:50]
intron = dna_seq[50:156]
exon2 = dna_seq[156:]
# Spliced product: the two exons joined with the intron removed.
spliced = exon1 + exon2
#Question 3
import re  # needed by the findall calls below; no import is present in the file

#Question 3 a
# Clustering report: each ">Cluster N" header is followed by its member lines
# of the form "<index> ><gene name> at <identity>%".
clusters = """\
>Cluster 0
0 >YLR106C at 100.00%
>Cluster 50
0 >YPL082C at 100.00%
>Cluster 54
0 >YHL009W-A at 90.80%
1 >YHL009W-B at 100.00%
2 >YJL113W at 98.77%
3 >YJL114W at 97.35%
>Cluster 52
0 >YBR208C at 100.00%
"""
#Question a
# Cluster IDs. The separator after "Cluster" is matched explicitly so only the
# digits are captured (no leading space in the results).
cluster_ids = re.findall(r">Cluster\s+(\d+)", clusters, re.IGNORECASE)
#print("ID :",str(cluster_ids))
#Question b
# Rename the cluster headers so that the only remaining ">" characters are the
# ones introducing gene names.
r = clusters.replace('>Cluster', 'Test')
#print("New :",r)
gene_pattern = re.compile(r"> ?([A-Za-z0-9-]+)", re.IGNORECASE)
identity_pattern = re.compile(r"at ?([\d.]+)", re.IGNORECASE)
# All gene names in the report, in order of appearance.
result = gene_pattern.findall(r)
#print("sd :",str(result))
lines = r.split('\n')
#print(lines)
# One list per line: [gene name, identity]; header and blank lines match
# neither pattern and therefore print an empty list.
for line in lines:
    print(gene_pattern.findall(line) + identity_pattern.findall(line))
#Question 4
# NOTE(review): `ratios` is used as a dictionary below (.values() / .items());
# its definition is not present in this part of the file.
#Question 4 b
# Is 2 (respectively 3) one of the dictionary's values?
contains_2 = 2 in ratios.values()
print(contains_2)
contains_3 = 3 in ratios.values()
print(contains_3)
#Question 4 d
# NOTE(review): the original line here, `2 in ("A", "T"):`, was not valid Python
# and its intent is unclear; only the membership test below is kept.
# Is the key ("A", "T") stored with the value 2?
print((("A", "T"), 2) in ratios.items())
#Question 4 e
# Keys and values as two parallel lists, in the dictionary's iteration order.
keys = list(ratios.keys())
values = list(ratios.values())
#Question 5
# NOTE(review): this section was incomplete as found: `translation=` had no
# right-hand side, the following string was bound to the name `str` (which
# hides the builtin), and `listToString` was called without being defined.
# The repair below is the minimal runnable reading -- confirm it against the
# intended answer.
def listToString(items):
    """Return the strings in *items* joined into one space-separated string."""
    return " ".join(items)


# Base abbreviations, one per letter of the sequence in `s[0]`.
translation = " ade tym tym ade gua tym cyt "
s = ['A, T, T, A, G, T, C ', 'for', ' ade, tym, tym, ade, gua, tym, cyt ']
print(listToString(s))
#Question 6
# FASTA-formatted text with six records (chains A-F of entry 2HMI). Each record
# is a header line starting with ">" followed by one sequence line.
text=""">2HMI:A|PDBID|CHAIN|SEQUENCE
PISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKI
>2HMI:B|PDBID|CHAIN|SEQUENCE
PISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKI
>2HMI:C|PDBID|CHAIN|SEQUENCE
DIQMTQTTSSLSASLGDRVTISCSASQDISSYLNWYQQKPEGTVKLLIYY
>2HMI:D|PDBID|CHAIN|SEQUENCE
QITLKESGPGIVQPSQPFRLTCTFSGFSLSTSGIGVTWIRQPSGKGLEWL
>2HMI:E|PDBID|CHAIN|SEQUENCE
ATGGCGCCCGAACAGGGAC
>2HMI:F|PDBID|CHAIN|SEQUENCE
GTCCCTGTTCGGGCGCCA"""
# Opens 'fasta_file.txt' from the current working directory in the default
# read/text mode; raises an OSError (e.g. FileNotFoundError) if it is missing.
# NOTE(review): the handle is not closed here and the code that uses it is not
# visible in this part of the file -- prefer a `with open(...)` block there.
fastaFile = open('fasta_file.txt')