Skip to content

Commit

Permalink
Replaced spaces with "_" in the third GTF column (feature field) in response to #29
Browse files: browse the repository at this point in the history
basti committed Jan 3, 2019
1 parent 39cdf16 commit 6016c18
Showing 2 changed files with 2 additions and 3 deletions.
3 changes: 1 addition & 2 deletions bin/3.1_create_gtf/Modules/Ensembl/GTFGen.py
Original file line number Diff line number Diff line change
@@ -51,7 +51,7 @@ def reformat_to_gff(self, activity, release):
# Add RegBuild_ + release
templist.append("RegBuild_"+release)
# Add Description from Description in last ; separated segment
templist.append(splitted_additional[4].split("=")[1].lower())
templist.append(splitted_additional[4].split("=")[1].lower().replace(' ', '_'))
# Add Start / End Data from original
templist.extend(splitted[3:5])
# Add Score, Strand and Frame Data
@@ -68,7 +68,6 @@ def reformat_to_gff(self, activity, release):
@staticmethod
def generate_additional_information(gene_id, activity):
# helper method to concat activity information to string
print(gene_id)
if gene_id.startswith("ID=regulatory_region:"):
gene_id = 'gene_id "'+gene_id.split(':')[1]+'"'
elif gene_id.startswith("ID=E"):
2 changes: 1 addition & 1 deletion bin/3.1_create_gtf/Modules/ucsc/ucsc.py
Original file line number Diff line number Diff line change
@@ -41,7 +41,7 @@ def read_gff_to_gtf(self):
sequence = []
sequence.append(row[0])
sequence.append("UCSC")
sequence.append(row[3].lower())
sequence.append(row[3].lower().replace(' ', '_'))
sequence.append(row[1])
sequence.append(row[2])
sequence.append(".")

0 comments on commit 6016c18

Please sign in to comment.