Source code for BLRun.pidcRunner

import os
import pandas as pd

from BLRun.runner import Runner


[docs]class PIDCRunner(Runner): """Concrete runner for the PIDC GRN inference algorithm."""
[docs] def generateInputs(self): ''' Function to generate desired inputs for PIDC. If the folder/files under self.input_dir exist, this function will not do anything. ''' # Create ExpressionData.csv file in the created input directory PIDC_EXPRESSION_FILE = self.working_dir / "ExpressionData.csv" if not PIDC_EXPRESSION_FILE.exists(): ExpressionData = pd.read_csv(self.input_dir / self.exprData, header = 0, index_col = 0) ExpressionData.to_csv(PIDC_EXPRESSION_FILE, sep = '\t', header = True, index = True)
[docs] def run(self): ''' Function to run PIDC algorithm ''' cmdToRun = ' '.join(['docker run --rm', f"-v {self.working_dir}:/usr/working_dir", f'{self.image} /bin/sh -c \"time -v -o', "/usr/working_dir/time.txt", 'julia runPIDC.jl', "/usr/working_dir/ExpressionData.csv", "/usr/working_dir/outFile.txt", '\"']) self._run_docker(cmdToRun)
[docs] def parseOutput(self): ''' Function to parse outputs from PIDC. ''' workDir = self.working_dir outFile = workDir / 'outFile.txt' # Quit if output file does not exist if not outFile.exists(): print(str(outFile) + ' does not exist, skipping...') return # Read output (headerless: col 0 = Gene1, col 1 = Gene2, col 2 = EdgeWeight) OutDF = pd.read_csv(outFile, sep = '\t', header = None) self._write_ranked_edges(pd.DataFrame({ 'Gene1': OutDF[0], 'Gene2': OutDF[1], 'EdgeWeight': OutDF[2], }))