forked from Shivi91/Rosalind-1
-
Notifications
You must be signed in to change notification settings - Fork 14
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Maximizing the Gap Symbols of an Optimal Alignment
Solution to Rosalind Problem 083: Maximizing the Gap Symbols of an Optimal Alignment
- Loading branch information
Showing
3 changed files
with
227 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,65 @@ | ||
#!/usr/bin/env python | ||
''' | ||
A solution to a ROSALIND bioinformatics problem. | ||
Problem Title: Maximizing the Gap Symbols of an Optimal Alignment | ||
Rosalind ID: MGAP | ||
Rosalind #: 083 | ||
URL: http://rosalind.info/problems/mgap/ | ||
''' | ||
# --------------------------------------------------------------------------------------------- | ||
# SOLUTION COMMENTS AND EXPLANATION | ||
# --------------------------------------------------------------------------------------------- | ||
# This solution deserves more explanation than simple code comments, as the method to solve | ||
# the problem seemingly has nothing to do with what is stated in the problem statement. | ||
# | ||
# The key thing to notice in the problem statement is that we want an optimal alignment | ||
# and that there is no upper bound on the score associated with a match. Thus, we can | ||
# assign an arbitrarily high score to matches and ensure that the maximum score corresponds | ||
# to aligning the maximum number of symbols. | ||
# | ||
# The maximum number of aligned symbols between two sequences is precisely the longest common | ||
# subsequence, and determining the longest common subsequence is a problem that we've already | ||
# solved on Rosalind (it is a prerequisite problem for this one!). | ||
# | ||
# Now, since we have a free choice on the penalties associated with mismatches and gaps, | ||
# choose a lower penalty for gaps, and align every symbol outside the longest common | ||
# subsequence with a gap. Thus, we have one gap symbol for each nucleotide that is not part | ||
# of the longest common subsequence, counted over both sequences. | ||
# | ||
# So: max #Gaps = |seq1| + |seq2| - 2*|longest common subsequence| | ||
# --------------------------------------------------------------------------------------------- | ||
|
||
from scripts import ReadFASTA | ||
|
||
|
||
def maximum_gap_symbols(v, w):
    '''Returns the max number of gap symbols in an optimal alignment of v and w.

    The result is len(v) + len(w) - 2*L, where L is the length of the longest
    common subsequence of v and w: every symbol outside the common
    subsequence is paired with one gap symbol.

    v, w: sequences supporting len() and iteration (e.g. strings).
    '''
    # Longest-common-subsequence DP. Each row only depends on the row directly
    # above it, so two rows are kept instead of the full len(v) x len(w) table.
    # previous[j] is the LCS length of the processed prefix of v and w[:j].
    previous = [0] * (len(w) + 1)
    for v_symbol in v:
        current = [0]  # LCS against the empty prefix of w is always 0.
        for j, w_symbol in enumerate(w):
            if v_symbol == w_symbol:
                # Extend the common subsequence of both shorter prefixes.
                current.append(previous[j] + 1)
            else:
                # Drop the last symbol of either w (current[j]) or v (previous[j+1]).
                current.append(max(current[j], previous[j + 1]))
        previous = current

    # Apply the gap formula with the length of the longest common subsequence.
    return len(v) + len(w) - 2 * previous[-1]
|
||
|
||
def main():
    '''Main call. Reads, runs, and saves problem specific data.'''
    # Parse the input data. The unpacking requires exactly two records;
    # element [1] of each record is presumably the sequence string
    # (verify against ReadFASTA in the scripts module).
    v, w = [fasta[1] for fasta in ReadFASTA('data/rosalind_mgap.txt')]

    # Get the maximum number of gaps.
    max_gaps = str(maximum_gap_symbols(v, w))

    # Print and save the answer. The call form of print with a single
    # argument behaves the same on Python 2 and Python 3.
    print(max_gaps)
    with open('output/083_MGAP.txt', 'w') as output_data:
        output_data.write(max_gaps)


if __name__ == '__main__':
    main()
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,161 @@ | ||
>Rosalind_0508 | ||
TTAGGTTAGGGAATTCTCCGCGTTTGCCCGCTCGTGGCATCCATCAGCGGCTTTATCTAC | ||
AAACATAGGACGACGCTGGAGCCGGTAATTCAGCAGAGCTACACAGCCCCTAGCTTCTCG | ||
GTATCCACGAAGTGTTACGCGGACCAACCATTACGTAGGAGTAGCCAATATCCATAGGTT | ||
TGGACATCAAAGTCGAGTAGATACTGATGTGTGGGGTAAGCAGAACGGACTCGAAAATCG | ||
CAGTGGGTCCAGGGACCATGGGCATCTAGGCGTTACCACCGTACTCACTCCGAACTAGCA | ||
TAACACACGGTCGGTATACTGGTAACCTCTCAAAACACTGGTCGGAAGGATGGTTCCGCT | ||
ATTAGATTATCGTGACTCTCCGTGTTAAACACCCACTAGTAATGCCTATCTTTCTACCGC | ||
TCGCTCAGACCAGTCTCCCGCGTACGGTTCTATGCAAAGGACGTAACAAGACCTAATTTA | ||
TGGGGTGTGTTTGACCTGGTCTGTCGTCACGCGTAGTCGTCGAGGGTGGTAGAACGATTG | ||
GTTAATGACTTATGCATAGAAGCACATCTGTCGGGTCCACAGCCATGGTGGTCTATGTTC | ||
AGACCAACACATGGCCCCAGCTGTGCTTTCCGGACGGGGAAATCTGGAATTCAGAACAGT | ||
GCAAATGTTCCCAATTACCAGGAAAGTAATTTTACCTAGGCTTGGGATACCGATGTAAAC | ||
GGGGCCGTGATGGTCCCGGAGATGCGTTTCGCTCATTTTTTGGCGGCTATAAAGCGTCTG | ||
TGAAACCGTGCACTATGTTTGTGCCGTCAGGAGGTCTCTGGACTTCTATGTTTGGCATAT | ||
TTAGTGACGGCATACCAGGAAGGAACAGGCCTTATTGCGTTGATGCCGGCACAACCCTGC | ||
GAAGGAGTGAAACTGCGGGTTGTGAATAAATGATCACCTGTTCAAGGTCGTTTGTCCCCT | ||
CAACTAAAAGACGGGGGATCCAAACACCTTCCTAGCCGATCAACTAAAGGTGCTTTGCTC | ||
ATCTTTACTTCGAACCCCCCGTTCGCATGCATACCTGCTTGCATCCACCCTCATTGATCT | ||
TCATTATTAACTATTAGGATGCAGATGGCATTGTTACTTTTCGTACAATCGGATACGCTA | ||
GGTGATACCATGTTTATGGCTGCAATCACTGGCTTACGCATGCTTTTACGTCACGGGCAA | ||
GACCCTATAAGATGTTCGCACCTCGCAATCGACTTCAGGGCTTGCGGCGTCAAGCTAGAG | ||
TCCGTTATAATCTTCCATTAGTTCGCCTGACGATTTCCCTACGTGCTGCCGTTAAGAGCC | ||
GCACGTGGAAGAGGAGAACAAGGAGTATTGCCTAAATGCCGTCAATAGCGAGGAATAGAC | ||
CTGCTATCGATGGACCTATGACGTCAAGCCGACATGTGACGTTAGATCTCGACCAATGGC | ||
CGAACGCTTCTCTCGCATGAGGTGCGCAGAACTTTACCGGTTAGTGCAGGACGTCCTAAT | ||
GTTGTCGTGCTGACGGCTACGGGATTAGAGGTTGGATTCATTCAAATCCTACCTAAGCAC | ||
CGCATAGAAATCCAACTGATCGACAGGTTCTACGGGGGGCTCTTTAGCACTAGCTGATAA | ||
AGCGACCTCTTTAACTCATTTCCAATCTTAACAGTCAGGAGAAGTTGATTCTGCATGCAT | ||
TAATTGGAAGGTGCCGCAAAGACTCTGCGCGTTTCCAAAGCTGACTAAGTTTCCCCAAAC | ||
AAATGATTTTATCGGATTGGAGCTGATCCTCAGTCCCGCACATCTTCGGGCGACCTCGCC | ||
CAGCTGTACAGTATATGACTTATCGTCGGGTCTTTTGCATCAACAACTTACGAGAAGCGT | ||
CGACATCCCACATGGTAATCCCCGCTAATATCGGTACGTAGTTGCAAGACGAGGTTTCCC | ||
GGCAGTCCATTTTGATGATTGAGTACTGTTCGAACCATCGATCGCCAGCACAGACGTTCG | ||
TCTCCCCCGGTACCAACAAACAATGTCATTCGAGTTGCACAGCGAACAAAATGCCCGGGC | ||
ATGGTAGACCAGTGATCTCCTTTTCCGACCGCTAGTATCGTTGTAACCAAACGCTCTATG | ||
GATATACGTGGGGCGACCGACAGAAGCTGTGTCGCTTCTAGAGGAGCGCGAAACACGTCT | ||
GATTTCATTTTCTTGACCCAAATCACTCCGTCGCGCCGCAAGTCGAAGATCTAGCCTCCT | ||
GCTAGTCCTAATATCTCAATAAAGGCAATCGTACCGAGGTGCCAGGCGCCGTCGTCGGCG | ||
ACATTAATGAGCGGTTCGATAAAACTCTATACGCCAGTGATGGCCTATCTACCCCGGGGC | ||
ATCCGCTCGACTTATTGAAGACAAAGGAATCCTTAAGCAAGCCTATTTAGTGATTAGCGC | ||
TGTGCGTGAATAGTCTGCGGCCACTGCTCGCGTTCAGCCGCCTCTCGCGGTGGGACTGAC | ||
GCCGCCAGCCCCATATGAATCATCGAGGTAAAGTAGCAATGTAGAACGTTAGATCGCGAC | ||
TATTGTACTGAAGCGACGCCAACAAGGGAAATCTTAGCTGCGGTCATTGATAAAGTCTCG | ||
CCCATCGAACCATAGCGTTTTTAGAGGAGCTAAGCTTGTCGAAACAGCTATTATTAAGCC | ||
AACCACGTATCTTAGGGTCCCCTGGCTCGCGTACCCATCTGCTCATAAACCCGTTGCGAA | ||
TAGAACCAGCACTATCCGATGCTTATAGAGTCGCCAGTACACCATGCATAATTCGTCGCC | ||
AAACCTGCGAGTTTAGAGTAGGATACTCTCAGAATCTTATTCACTTTTGCCGCCAGAGCC | ||
TCCAAGCGTATATTTACGAGAAGCGCAAAAGTTCGATGCCTGGGGAATATAACCTCCCAA | ||
ATGTAAGGCTATAGGGACCGACCAGTCTCCGCTCAAAGTGCTATTGGTGGTCGGTATAAA | ||
AACCCTCGTGTAGCACGTTCTTGTGCAATGATAATACCTGTATCGGGAGGCGTCATCAGC | ||
ACTGCCCGCGTATACCCGTAGTCTCTGCCATTCTTAATAATCAGCAGAGGTAACCAACAA | ||
GAACAGACCATGTACTTTGGCACACGCTGCTTGCACAGTTGACATCCGGGCCTTACCTTG | ||
ATGCCACCAAGAGGCTGCCCATTATGGAGCGTAGACCGGGCAGGGCCCGACTCTAGTTTA | ||
ATAGGATCATCGTAAGGGTATTTTCGATGCGGGCGTACTCCAGATTGCGTAACCGACCAC | ||
CGGGATTACGGCGCATGCGTCGGATTAAAACTCCCCTAAGGCCAACAAATCAGCACGGAG | ||
AAGTCCGTGACTTGGACAACACTGGCCGAATGCTTGTGAATTGCCGCCGTGTTCAAGACA | ||
TACCCGGGGTTGGCGACGACGCCATTGCGTGGCTCCATGAAAGTAGGACGCCGATACGAG | ||
AAATTGTGGACGCCAGAGTGCATCTCTCCCTATATTGAAACTTAAATTAAGTATCTTGTC | ||
TGGTTATCTCCTTCTCCGCTGCTTATAACCCTACATGGTATTGAAAGAGCTTATGCGCGA | ||
GTAGTGTGCCATACAATCTGTCAATTATTAAAACCGGCCAAAGCATAGAGGCCAACCAAT | ||
GACTGTTTAACTGACCGGTATGTACCGGTGGCACCCCAAGACCCGTTGTTATCAGCACTT | ||
GTATATCACCTGTCCTCGTATGCTTTATACGCGCCCAGGCGGGAATGGTAGCATCTGCAA | ||
GCTCTCAGTCATTTACGACGCATATGGGAACGTAGCTACTCGCTATGCTCCACGCACTTC | ||
ATAGCACGAATGAAGGATGGCAAACCCCCCGGGATGAACGAACTATACCATTGGGGCTTA | ||
CCTGTATAAGAGCGTGGAACACGTTGCGCTAGCTTTGTTGATCGCCATTATTTCAGTGTA | ||
CACGATCCCCTGTGACGTACGCATAAATTGATGTCGAACAAGACCCTCCTATTGGCAACT | ||
TCCATTAATCCCAAGATAATAATGCCACTGCCCAACTCCAAGCGGAAGATTCCGACTCTT | ||
CAGGTGTCGTTCCGGTTTTAGCTGCGTTTGAGGCAGCACTCACGCTTCGACATACTATCC | ||
ATGTTGCGATAGAGGTTTTACGCGTTTACATTCTGCTCGTCGATTAATTCAGCAGAAGAG | ||
ATCACGCAATGTAACCTTTCTGCCGAGCAAAGCCGTCGAACCCTGGGCGTTCGGATGACC | ||
GATGGTATATGGTCAGAATAATGAGCGAGCAGGACTACCTCGTCGATAGTTCGCTTAGAA | ||
GATCAATATGAGTCTAATACCTCCGTGCCTTCCCATCGGCTTATTACAGAGAACGTTCAT | ||
AGCGTACGGGGCATTCTGGTTCCAGCTATTATCGCCTTATGTCAGATAATCCATAGTACG | ||
ACGCGACCTATCGCATACCCCATCTTTTACGCCGACCCCTGGCAATGGTGCAACTGGGGG | ||
TCCAATTAGGTCAACGGTGGGACATTTTACGCCAGATACACTCCCGTGTTCCTACCATTA | ||
AGATTCGCTTCGAGGGAGCATCATTCTCGAGGTGTTCTCATAATCTACGATTTATTATAC | ||
CTATTAGTGCGAGTGTCGCGGCCGAAACATAGAAGAGGTACTGGGCCGAATTATAGAGGG | ||
ACGAGAACCCGAGACTCTAGCTACGATCGGCGTTATATAATGGCACACACGCCCGCTCAT | ||
AACCTCCTCTTCTACGACAGCCGGAGAGTCGGTCGAGCACCAGTTCAGGGTAACAAATGA | ||
TACGTGCCAGCGTACACTAGAAACCTTCTATCGCGTTAACTCTGTACCCCGAATATAGGC | ||
TTCGCTCGTGGAACCTTCACCCCCGTTCATTGGGCCCCCGCCGACGACATTGTTCAAGGG | ||
GCAATGTATGTAGAAGACTCACGCGCGTTAAACTACTCTACATTTTGCAGCAAAGTGCTA | ||
TTTAGGCATAACCGGTTATTCGGTTGTCACCCAGCTTAT | ||
>Rosalind_2416 | ||
TATTATATGGTCTTTTGTTAGTTATGACAGCCACGGGCAATAAATAGGCGACGCCGATAG | ||
GTATTTACAAATCATACGAAGGGCCGTCTGCCAGGCTCTACGGATCAAACCGAGAGTTAG | ||
ATGGTGGCGCATCGGGTAATCTTTCGCCGAAATTCGGGCGGGCTCTAAGGGTGACAGCGT | ||
CTATGTGGCCAGAGCTGCTGCATTCTTCATTGAATATGACTTAATATGTCAAGTCTTCTA | ||
TATGCATGAACTCTGCTAAGCAAGGCAAGGCTTGGCTTATATGTGCCTCCCATCACGTAC | ||
AATCCTCCCACAGGTGCGAGAACCTAGCGTGTGGGCACGCGTATGAAGGTGAATCTGACC | ||
GGGCACTCGCAATACGAACCCGCTCGAGAAGCATATAGTCCCGGCCCTGGCGAATTCTGT | ||
CTTGAGGTAGGAAAGTTTTCCATCCGGTGCCCCAACGACGGTAGGACATCTACCTTTAAG | ||
GTGCAACCACCGCCGAATTGAATCTCGTTAGGGTTTTCCGCTCTGTGCATATGACTGCCA | ||
CGGGAGAGGTATTTCCGCCATATAATCATGTGAGTCAAAGTCGACGTATCTAAACGCGTC | ||
AGCTGCAGCAAGGATGGCGGGTTAAGTAGCCTCACTGGTCCTTCGAGCAGATGACCTGGT | ||
GCTCTTGCTAAGCAGGAGCAACTCTGATCCGGCCATCGTGCATGAGGCTATTCGTAGTTT | ||
TCTTCCGCGCATTAAATAGCTAAGATGTCCATTAACCTTTAAGGAATTACTATCACTCAA | ||
GGATACGCGAATTTTTGTCTGAGGGACGACATAATGGCGAATTGGTTTGGGTCCTTAAGT | ||
TGGTCGGTAGCTTATAGTGCTCCCCAGCATATGAATATCGAGACGGGTGGTACTTGCATC | ||
TTATGTATCAGCTCCCGGTCGGTACTGTCAGAACCATTTTTCTAGATGGTCCCATCTTCG | ||
TGTCTGGTCGAGGGATGTCCGTCCGTCTTCTAATCGTTGTAATGGAGGTCACACAGAGGG | ||
CTAGAGAGGTTACGGTGGCACCGCATCGTATAGTGGCCGCCCCCAGGTCAGTGTAGATTA | ||
CAACGGCCCCGTACAGCGCACTAAATTCGGCACGTCGCTTTAAACACTCGCGATTAGCTT | ||
CACGAATATGCGCTGACACAAAAGTTAGCCAGTTTGAGACTATTTTTTCATGTATGTCTG | ||
AATGCTAGCCTCCTTGGTTGCCGAACGAACACTGGGGGCCCACATCTGATAACCCCGAAT | ||
AAAGGGATTACTTAAGCGTATGACCCCAAAACCGCGTGGTAAGGTTCAACGTACCGATAC | ||
ACGTGATACTTCGACGACTTGGGATTCCCCCTCTCAGAGTCCATGGTTGTCTTAATGAGA | ||
AAAAATATCATTAACGACGGTGGGGCAATACCATATTTCGCAGGTTGAGGCCAAGTATCC | ||
GAGGCGCATAAAACTTACTCCGTGAATACGGAGTTCGAACTTTGTCGAAATGCCCCTCGC | ||
TTTGATTCACTCATGTTGCACTGTAGGCGGAACGCCACCCTAGCAACTATTGCTCCCAGA | ||
CCGAGCTCGAACTCTAATATTGCATAACACCACGGTTTAATATGGGAATAGGCGGACGTT | ||
AAGAACCTCATTCGCACGATAGTTGGCTGCAGGACCACACTACGTCTTCCATATTGGACT | ||
AGCTTCAGTTTCACATGATTTAGGTATGCTATTAATGTAATAGCTGGGGGATTACCCTGG | ||
TCGATTCCAAGTGCTCCGCTATGGAGGCTGCGGCGCATATCTTAACCTGAACGTACCGTG | ||
GAGGTAGCCGCCCTACAAACGTCCCCCTAAGCTGTGGATTACTCCACAGGGATTAGGTGT | ||
GCCTTACTCTTTTAATGGGTCTCAGCCGTCTTCCGAGATATCCAGGTGGTTTTGGTAATC | ||
CGGTGCAAGAGTTAATAGAATCAGACCGGACCCAGACCCGAGTAGGCTCCTCTATTAGTT | ||
CGTTGGCGTTGTAAGCGAGTCTAAAGGGCCAGATATTAGAACGGTCCGCATCTGGTGTGA | ||
TAAGCTATTGAGGAAAGACGTCGCGCTCTTTCGGACTCTCGGCCGAATGCTAAAGCTTCT | ||
GTTCTTAATCTCATAGCTTTACACTCCTACTAGGTTCCCGCTGCAGGTTCAGGGGACGCA | ||
TAACGTTCAATGTGCAATGCGAAGCCCAGGAGTCTTCCCTTGAGGAATCCTTATTCGTGC | ||
ACCGGAGTGACCTCGGTGGCGTGAGCCCTACTAGCAAATTAACCTCATGAGATCTATTTG | ||
TAATATAGTCTTAGTGCGTGCGACACCTGAGCGCCCGATACAGTTCGGACCGTGTCACAA | ||
CATTGGGTAGTTCCATGTCTCAGGTGGCTCCGATTTTCAAATAATTCTGGTCGATCAACA | ||
AGGGACCTAGCAGTCTACCCCTGATTTTCGGCGGGAAGGTCGTTGTAGGCAGTGTTCTTC | ||
CACCCTAGTTTACAAGGAAGAGCCCAGCGAAGTAACTTTCAGTGAATCCCATCACTTCCA | ||
ATCATCAACGACACTTGCTTACACGTAGTCTGGGCGTGGAATGGTAGCTAACCATTCAAC | ||
ATCTTCGACTTTATAAGTTTATTTTGCCGTGGTTATTTAGCGTAGGACACAAAGCAGGAC | ||
TAAGACCTGCACTCCCCGACGTACTGCCGGCCGGACCGTGTTCATCTACGGGGATGTCCT | ||
ACATCGCACGAGATTTGCCACGAAGAGGCGCTTATCGGGTCGGGCATACCCTGGTGAACT | ||
ACCCGTTTCTTGGAACTTTCATTTCAGAGCATTCCTGACTGTCCCTTATTAACTCGATAA | ||
TCCATCCACACTCACTAATTGTGTCATCGGCAGCTCACTCATGGAGGTAGTATGGAAACC | ||
GATGGATAGTACCCTGTATTACCCGTCTGTAACTTTTTGCAGTATGAACGCTTGGTCGAG | ||
CAGCATAACTCGTACCTAAAGCTAGCCTAGCCTGACACTCAAGCGCACCGCTCTCAGACG | ||
GCCACCGTTTTGATGATGGTCTGTACACAGATACTTCCTACATGGATGTTACGTTAAAAG | ||
TAATTACTGTGTACTGCACTGGGTAATGGGCACAATGAGACTTATCATTCACCGCATCGG | ||
GCCTATCCACCATTCCTTACCTTGTACGTGACGGTACGCCACACTTATACGCTCTACGTG | ||
ATAAGGTCTCGAGGTCGTGCGTTCAACGAAGCGAGCCCAAACCAGCACTCAGGGAATCTT | ||
TTGCGCATAGGTGAAGAATTGGAATTAACAAGGTGGAGGTGACTGCACGACGTTCTGAGT | ||
CACTTACCGTAGTAAAAATAGAGACCAACCAAACTGGCTGATTACTTATTCAAAACCATG | ||
TGCTTCAATTTTCTGACGCCCCGCCCTGAAAAGCGTTAGCATGGCTACGGAGAGCTGCAT | ||
TGTGAAGGAGATGCGCGTTGAATCAAATTCGCCTGGACGAAAGTCGCGTCTCCCCCTAAT | ||
ATGCTAGCTAGCTTGTGATTCCTCATGTACTACTGGACCCTTGCCTTGCATCACTTAGTG | ||
CCCAAAGCGCGTACCTTTTTGTCCACCGATTTTAATAACGGCTACTTGAGAGTTTGGGGG | ||
GTAAAGGCCTGAAAGGCAGCGCTCTGATACGGTACCCTAGGGTGGTACCCGTAATACTTA | ||
AACATGTAAAGTTCGATCGTACCTTCGCTTATCGGCTGCCTCGACGGCAGAGTCACTCCG | ||
AGCGGTGCAGTGCGCCTCAACAGTAGGGGACTTTGTCTAAACGTAGGGACGCAATGATCT | ||
GGAGAATCGCGAGCATCTCTTCTATTTGGGATGCGGACTGGCTGCCCTGAAGGGCACAAT | ||
AATAGACCCTGCGTTGTAAATACGCCTATTAGACACGCATCCTCCCGTTATACGTTTTGT | ||
TCCCCCCACCATCTCCCAACCAGGCAGTCGTAAGCGTCGGAACCCGGTGCAGTTGTGAAT | ||
CAATTCACGGCTTGTTTAAGAATTAGTCAAGTAAGCCGACTGTTTCCAAGCTAAGGGAGT | ||
TGAACCAGGACATCGATTTTACAAGACAATTGCAGCTCCATCATCTTGAGATGCGCACGG | ||
AGTGGCGATAAAAAGCCAGTCGACACCCGCGAAAACCTCTATACGGCCCAGATCAGTCAC | ||
ACGGAGTCTGACAAGTAGCTTACGGCACTCCGGAATCACAAGAGCTCGGCTGATCTCGAG | ||
GGGCAGCTTTTATCTGACTTGTGCGTTTGGGGTACCAGACTGGCCTTGGGCTGAACGCAT | ||
GTGTCAGTGATGGCGGTGGTAGGCGGGAAAACGTGTCGGACTGACTACTGAAAGTCCAGA | ||
TTGTTCAGAGTCTACTAGTCTGGGGCGATTCTATGCAGCTGCACCGCGCATCCTACTGCA | ||
GACTAGATGATCGCGCCCTGGTCGACTAGGGCAGTGTCACCCCTTACTCACCATCCTCGA | ||
CATGGGCAAATGGTCTATGAGCGTGCTGTGCTGGCGCGGGAGAGCATAAGAAGCAAATTC | ||
CGAGACTTTCCACACACAGACCCCTCTGCTCGACCCCACGGAATGTACATCATT |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1 @@ | ||
3337 |