Skip to content
Permalink
83460e9671
Switch branches/tags

Name already in use

A tag already exists with the provided branch name. Many Git commands accept both tag and branch names, so creating this branch may cause unexpected behavior. Are you sure you want to create this branch?
Go to file
 
 
Cannot retrieve contributors at this time
53 lines (46 sloc) 2.13 KB
import os.path
from Modules.Ensembl.ActivityTableGenerator import ATGenerator
class ActivityTable:
"""
Class for checking activity_table and generating them.
activityTable = byte Representation of activity status
corresponding to the generator schema default:
0, "activity=ACTIVE",
1, "activity=POISED",
2, "activity=REPRESSED",
3, "activity=INACTIVE",
4, "activity=NA"
"""
def __init__(self, organism, current_release, wd, data_dir):
if data_dir:
self.link = os.path.join(data_dir + "/EnsemblData/", current_release, organism, "activity")
else:
self.link = os.path.join(wd + "/data/EnsemblData/", current_release, organism, "activity")
self.folders = next(os.walk(self.link))[1]
self.generator = ATGenerator(["activity=ACTIVE",
"activity=POISED",
"activity=REPRESSED",
"activity=INACTIVE",
"activity=NA"])
def check_and_generate_activity_table(self):
# checks if file already exists and generates new one if missing
for subfolder in self.folders:
folder_link = os.path.join(self.link, subfolder)
sf_link = os.path.join(folder_link, "table.bin")
if not os.path.isfile(sf_link):
print("No ActivityTable for "+subfolder+" found, generating new one.")
self.generate_table(folder_link)
print("All ActivityTables found, proceeding")
def generate_table(self, link):
# generates the table and saves it as table.bin file
for root, dirs, files in os.walk(link):
for file in files:
if file.endswith(".gff.gz"):
originpath = os.path.join(root, file)
file_path = os.path.join(root, "table.bin")
with open(file_path, "wb") as f:
f.write(self.generator.read_table(originpath))
print("New ActivityTable generated in: " + root)
# Debug
#e = ActivityTable("homo_sapiens", "release-94")
#e.check_and_generate_activity_table()