blob: b558fe2479027be57fc3f2d752d812e0d073ccfd (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
|
reads = $(inputs.readsFA)
subjects = $(inputs.subjects)
relabeled_fasta = open("relabeledSeqs.fasta", "wt")
original_labels = open("originalLabels.ttl", "wt")
for i, r in enumerate(reads):
with open(r["path"], "rt") as fa:
label = fa.readline()
original_labels.write("<%s> <http://biohackathon.org/bh20-seq-schema/original_fasta_label> \\"%s\\" .\\n" % (subjects[i], label[1:].strip().replace('"', '\\\\"')))
relabeled_fasta.write(">"+subjects[i]+"\\n")
data = fa.read(8096)
while data:
relabeled_fasta.write(data)
data = fa.read(8096)
|