forked from xuyk/Rosalind
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy path066_CSTR.py
39 lines (30 loc) · 1.18 KB
/
066_CSTR.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
#!/usr/bin/env python
'''
A solution to a ROSALIND bioinformatics problem.
Problem Title: Creating a Character Table from Genetic Strings
Rosalind ID: CSTR
Rosalind #: 066
URL: http://rosalind.info/problems/cstr/
'''
def char_table_from_strings(dna_list):
'''Builds a character table from a given list of strings.'''
ch_table = set()
for i, ch in enumerate(dna_list[0]):
# Mark the on/off taxa based on the ith character of each sequence.
ch_array = [int(dna[i] == ch) for dna in dna_list]
if 1 < sum(ch_array) < len(dna_list)-1: # Check nontrivial.
ch_table.add(''.join(map(str,ch_array)))
return ch_table
def main():
'''Main call. Reads, runs, and saves problem specific data.'''
# Read the input data.
with open('data/rosalind_cstr.txt') as input_data:
dna_list = [line.strip() for line in input_data.readlines()]
# Get the character table.
character_table = char_table_from_strings(dna_list)
# Print and save the answer.
print '\n'.join(character_table)
with open('output/066_CSTR.txt', 'w') as output_data:
output_data.write('\n'.join(character_table))
if __name__ == '__main__':
main()