Python生物信息学数据管理自测题3.5

2018-08-10  本文已影响0人  tianzhanlan
# Self-test 3.1
# Reading and writing files
# Copy neuron_data.txt to neuron_data1.txt by handing the list of lines
# returned by readlines() straight to writelines(). Both files are opened in
# a with-statement so they are closed (and the output flushed) deterministically.
with open('neuron_data1.txt', 'w') as dst, open('neuron_data.txt', 'r') as src:
    dst.writelines(src.readlines())

# Write the same content to neuron_data2.txt as a single str: strip each line,
# collect the pieces in a list, then join them with newlines.
data = []
with open('neuron_data.txt', 'r') as h:
    for i in h:
        print(type(i))      # each line read from the file is a str
        j = i.strip()
        data.append(j)
        print(type(data))   # the accumulator is a list
content = '\n'.join(data)   # no trailing newline after the last line
with open('neuron_data2.txt', 'w') as k:
    k.write(content)

# Compact variant of the same idea, written to neuron_data3.txt.
with open('neuron_data.txt', 'r') as source:
    data = [line.strip() for line in source]
with open('neuron_data3.txt', 'w') as target:
    target.write('\n'.join(data))
# Self-test 3.2
# Compute the mean and standard deviation
import math

# Read one floating-point value per line. The file is closed by the
# with-statement, and blank lines (e.g. a trailing empty line) are skipped
# instead of crashing float('').
data = []
with open('neuron_data.txt') as handle:
    for line in handle:
        line = line.strip()
        if not line:
            continue
        length = float(line)
        data.append(length)
print(type(data))

average = sum(data) / len(data)

# Sum of squared deviations from the mean.
total = 0.0
for value in data:
    total += (value - average) ** 2

# Population standard deviation: the divisor is len(data), not len(data) - 1.
stddev = math.sqrt(total / len(data))
print(average, stddev)
# Self-test 3.3
# Nucleotide frequencies
# Read the whole file as one string, count the occurrences of A, T, C and G
# (in that order), and print the largest of the four counts.
with open('sequence.txt', 'r') as handle:
    sequence = handle.read()
data = [sequence.count(base) for base in 'ATCG']
print(max(data))
# Self-test 3.4
# GC content of a DNA sequence
with open('sequence.txt', 'r') as s:
    # read() keeps newlines and any other whitespace in the file; drop them so
    # they are not counted in the sequence length and do not deflate the ratio.
    sequence = ''.join(s.read().split())
# Fraction of G and C characters; report 0.0 for an empty sequence instead of
# dividing by zero.
if sequence:
    gc = (sequence.count('G') + sequence.count('C')) / len(sequence)
else:
    gc = 0.0
print(str(gc * 100) + '%')
# Self-test 3.5
# Write the results of self-tests 3.3 and 3.4 to a text file
# Line 1: the largest nucleotide count; line 2: the GC content as a percentage.
# Relies on `data` and `gc` computed by the earlier self-tests.
with open('result.txt', 'w') as out:
    report = '\n'.join([str(max(data)), str(gc * 100) + '%'])
    out.write(report)

请关注我的公众号——生信栈,不定期分享实用的生物信息干货!

上一篇 下一篇

猜你喜欢

热点阅读