Warning

This document is for an old release of Galaxy. You can alternatively view this page in the latest release if it exists or view the top of the latest release's documentation.

Source code for galaxy.datatypes.converters.lped_to_pbed_converter

# for rgenetics - lped to pbed
# where to stop with converters
# pbed might be central
# eg lped/eigen/fbat/snpmatrix all to pbed
# and pbed to lped/eigen/fbat/snpmatrix ?
# that's a lot of converters
from __future__ import print_function

import os
import subprocess
import sys
import time

prog = os.path.split(sys.argv[0])[-1]
myversion = 'Oct 10 2009'

galhtmlprefix = """<?xml version="1.0" encoding="utf-8" ?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
<head>
<meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
<meta name="generator" content="Galaxy %s tool output - see http://getgalaxy.org" />
<title></title>
<link rel="stylesheet" href="/static/style/base.css" type="text/css" />
</head>
<body>
<div class="document">
"""


[docs]def timenow(): """return current time as a string """ return time.strftime('%d/%m/%Y %H:%M:%S', time.localtime(time.time()))
[docs]def getMissval(inped=''): """ read some lines...ugly hack - try to guess missing value should be N or 0 but might be . or - """ commonmissvals = {'N': 'N', '0': '0', 'n': 'n', '9': '9', '-': '-', '.': '.'} try: f = open(inped, 'r') except: return None # signal no in file missval = None while missval is None: # doggedly continue until we solve the mystery try: l = f.readline() except: break ll = l.split()[6:] # ignore pedigree stuff for c in ll: if commonmissvals.get(c, None): missval = c f.close() return missval if not missval: missval = 'N' # punt f.close() return missval
[docs]def rgConv(inpedfilepath, outhtmlname, outfilepath, plink): """ """ pedf = '%s.ped' % inpedfilepath basename = os.path.split(inpedfilepath)[-1] # get basename outroot = os.path.join(outfilepath, basename) missval = getMissval(inped=pedf) if not missval: print('### lped_to_pbed_converter.py cannot identify missing value in %s' % pedf) missval = '0' subprocess.check_call([plink, '--noweb', '--file', inpedfilepath, '--make-bed', '--out', outroot, '--missing-genotype', missval], cwd=outfilepath)
[docs]def main(): """ need to work with rgenetics composite datatypes so in and out are html files with data in extrafiles path <command>python '$__tool_directory__/lped_to_pbed_converter.py' '$input1/$input1.metadata.base_name' '$output1' '$output1.extra_files_path' '${GALAXY_DATA_INDEX_DIR}/rg/bin/plink' </command> """ nparm = 4 if len(sys.argv) < nparm: sys.stderr.write('## %s called with %s - needs %d parameters \n' % (prog, sys.argv, nparm)) sys.exit(1) inpedfilepath = sys.argv[1] outhtmlname = sys.argv[2] outfilepath = sys.argv[3] try: os.makedirs(outfilepath) except: pass plink = sys.argv[4] rgConv(inpedfilepath, outhtmlname, outfilepath, plink) flist = os.listdir(outfilepath) with open(outhtmlname, 'w') as f: f.write(galhtmlprefix % prog) s = '## Rgenetics: http://rgenetics.org Galaxy Tools %s %s' % (prog, timenow()) # becomes info print(s) f.write('<div>%s\n<ol>' % (s)) for i, data in enumerate( flist ): f.write('<li><a href="%s">%s</a></li>\n' % (os.path.split(data)[-1], os.path.split(data)[-1])) f.write("</ol></div></div></body></html>")
if __name__ == "__main__": main()