-
Constantin Pape authored
update_regestration.py 7.50 KiB
#! /g/arendt/EM_6dpf_segmentation/platy-browser-data/software/conda/miniconda3/envs/platybrowser/bin/python
import os
import json
import argparse
from subprocess import check_output
from concurrent import futures
import imageio
import luigi
import numpy as np
from pybdv import make_bdv
from scripts.files import copy_release_folder, make_folder_structure, make_bdv_server_file
from scripts.release_helper import add_version
from scripts.extension.registration import ApplyRegistrationLocal, ApplyRegistrationSlurm
from scripts.default_config import get_default_shebang
# Names of the region volumes. `get_out_name` labels outputs with one of these
# names as 'segmented' instead of appending the 'MED' suffix.
REGION_NAMES = (
    'AllGlands',
    'CrypticSegment',
    'Glands',
    'Head',
    'PNS',
    'Pygidium',
    'RestOfAnimal',
    'Stomodeum',
    'VNC',
    'ProSPr6-Ref',
)
def get_tags(new_tag):
    """ Return the current release tag and the tag for the new release.

    The current tag is whatever `git describe --abbrev=0` prints. If `new_tag` is None,
    the new tag is derived from the current one by adding one to its last
    dot-separated component, which must be an integer.

    Arguments:
        new_tag [str] - tag for the new release, or None to derive it from the current tag

    Returns:
        tuple[str, str] - the current tag and the new tag
    """
    describe_output = check_output(['git', 'describe', '--abbrev=0'])
    tag = describe_output.decode('utf-8').rstrip('\n')

    # an explicitly requested tag is passed through unchanged
    if new_tag is not None:
        return tag, new_tag

    *leading, last = tag.split('.')
    bumped = '.'.join(leading + [str(int(last) + 1)])
    return tag, bumped
def get_out_name(prefix, name):
    """ Derive the output name of a volume from its input path.

    The directory, the last file extension and everything from the first '--' on
    are removed from `name`. The remainder is joined to `prefix` with '-':
    names in REGION_NAMES get 'segmented' inserted before the name, names
    starting with 'edu' are used as they are, all other names get the suffix 'MED'.

    Arguments:
        prefix [str] - prefix to put in front of the output name
        name [str] - path or file name of the input volume

    Returns:
        str - the output name
    """
    stem = os.path.splitext(os.path.basename(name))[0]
    stem = stem.partition('--')[0]
    # TODO split off further extensions here?
    # name = name.split('-')[0]
    if stem in REGION_NAMES:
        parts = [prefix, 'segmented', stem]
    elif stem.startswith('edu'):  # edus are no meds
        parts = [prefix, stem]
    else:
        parts = [prefix, stem, 'MED']
    return '-'.join(parts)
def copy_file(in_path, out_path, resolution=(.55, .55, .55)):
    """ Convert a single tif volume to the bdv format.

    The volume is read from `in_path + '-ch0.tif'` and written with `make_bdv`,
    passing three downscale factors of [2, 2, 2] and 'micrometer' as unit.
    Nothing is done if `out_path + '.xml'` already exists.

    Arguments:
        in_path [str] - path to the input volume, without the '-ch0.tif' suffix
        out_path [str] - path of the output, without file extension
        resolution [listlike] - resolution of the volume (default: (.55, .55, .55))
    """
    # the output exists already, so this file was converted before
    if os.path.exists(out_path + '.xml'):
        return
    print("Copy", in_path, "to", out_path)
    # NOTE(review): the '-ch0.tif' suffix is presumably added by the registration
    # step that writes the tif files - confirm
    vol = np.asarray(imageio.volread(in_path + '-ch0.tif'))
    downscale_factors = [[2, 2, 2], [2, 2, 2], [2, 2, 2]]
    # the default is an immutable tuple, so that it can't be modified between calls;
    # make_bdv still gets a fresh list, as it did before
    make_bdv(vol, out_path, downscale_factors,
             unit='micrometer', resolution=list(resolution))
def copy_to_h5(inputs, output_folder, n_jobs=48):
    """ Convert tif volumes to the bdv format in parallel.

    Each input is converted with `copy_file` in a process pool. The output is
    written to `output_folder`, using the file name of the input.

    Arguments:
        inputs [list[str]] - paths to the input volumes, as expected by `copy_file`
        output_folder [str] - folder for the converted volumes
        n_jobs [int] - maximal number of worker processes (default: 48)
    """
    print("Copy tifs to bdv/hdf5 in", output_folder)
    # nothing to convert, so don't create a process pool
    if not inputs:
        return
    outputs = [os.path.join(output_folder, os.path.basename(inp)) for inp in inputs]
    # more workers than files would only sit idle
    n_workers = min(n_jobs, len(inputs))
    with futures.ProcessPoolExecutor(n_workers) as pool:
        tasks = [pool.submit(copy_file, inp, outp) for inp, outp in zip(inputs, outputs)]
        # result() re-raises any exception that happened in a worker
        for task in tasks:
            task.result()
def apply_registration(input_folder, new_folder,
                       transformation_file, source_prefix,
                       target, max_jobs):
    """ Apply a transformation to all files in a folder and copy the results to bdv format.

    The registration task writes tif files to './tmp_registration/outputs'. These are
    then converted with `copy_to_h5` into the 'images' sub-folder of `new_folder`.
    Task configs and the json files listing input and output paths are written
    to './tmp_registration' as well.

    Arguments:
        input_folder [str] - folder with the files to transform; all entries are used
        new_folder [str] - folder of the new release
        transformation_file [str] - path to the transformation
        source_prefix [str] - prefix for the output names, see `get_out_name`
        target [str] - 'slurm' runs the slurm task, any other value runs the local task
        max_jobs [int] - max number of jobs passed to the task

    Raises:
        RuntimeError - if `input_folder` is empty or the luigi build fails
    """
    def _dump_json(obj, path):
        # serialize obj to a new json file at path
        with open(path, 'w') as f:
            json.dump(obj, f)

    if target == 'slurm':
        task = ApplyRegistrationSlurm
    else:
        task = ApplyRegistrationLocal

    tmp_folder = './tmp_registration'
    os.makedirs(tmp_folder, exist_ok=True)

    # find all input files
    inputs = [os.path.join(input_folder, entry) for entry in os.listdir(input_folder)]
    if not inputs:
        raise RuntimeError("Did not find any files with prefix %s in %s" % (source_prefix,
                                                                            input_folder))

    # writing multiple hdf5 files in parallel with the elastix plugin is broken,
    # so we write temporary files to tif instead and copy them to hdf5 with python
    # output_folder = os.path.join(new_folder, 'images')
    output_folder = os.path.join(tmp_folder, 'outputs')
    os.makedirs(output_folder, exist_ok=True)
    outputs = [os.path.join(output_folder, get_out_name(source_prefix, inp))
               for inp in inputs]

    # update the task config
    config_dir = os.path.join(tmp_folder, 'config')
    os.makedirs(config_dir, exist_ok=True)

    shebang = get_default_shebang()
    global_config = task.default_global_config()
    global_config.update({'shebang': shebang})
    _dump_json(global_config, os.path.join(config_dir, 'global.config'))

    task_config = task.default_task_config()
    task_config.update({'mem_limit': 16, 'time_limit': 240, 'threads_per_job': 4})
    _dump_json(task_config, os.path.join(config_dir, 'apply_registration.config'))

    # write path name files to json
    input_file = os.path.join(tmp_folder, 'input_files.json')
    inputs = list(map(os.path.abspath, inputs))
    _dump_json(inputs, input_file)

    output_file = os.path.join(tmp_folder, 'output_files.json')
    outputs = list(map(os.path.abspath, outputs))
    _dump_json(outputs, output_file)

    registration = task(tmp_folder=tmp_folder, config_dir=config_dir, max_jobs=max_jobs,
                        input_path_file=input_file, output_path_file=output_file,
                        transformation_file=transformation_file, output_format='tif')
    success = luigi.build([registration], local_scheduler=True)
    if not success:
        raise RuntimeError("Registration failed")

    # convert the temporary tifs into the image folder of the new release
    copy_to_h5(outputs, os.path.join(new_folder, 'images'))
def update_regestration(transformation_file, input_folder, source_prefix, target, max_jobs,
                        new_tag=None):
    """ Update the prospr segmentation.

    This is a special case of 'update_patch', that applies a new prospr registration:
    a new release folder is created, the previous release is copied into it without
    the files of the source prefix, and these are replaced by newly registered files.

    Arguments:
        transformation_file [str] - path to the transformation used to register
        input_folder [str] - folder with unregistered data
        source_prefix [str] - prefix of the source data to apply the registration to
        target [str] - target of computation
        max_jobs [int] - max number of jobs for computation
        new_tag [str] - new version tag (default: None)
    """
    old_tag, new_tag = get_tags(new_tag)
    print("Updating platy browser from", old_tag, "to", new_tag)

    # make new folder structure
    old_folder, new_folder = (os.path.join('data', version)
                              for version in (old_tag, new_tag))
    make_folder_structure(new_folder)

    # copy the release folder
    copy_release_folder(old_folder, new_folder, exclude_prefixes=[source_prefix])

    # apply new registration to all files of the source prefix
    apply_registration(input_folder, new_folder,
                       os.path.abspath(transformation_file), source_prefix,
                       target, max_jobs)

    add_version(new_tag)
    server_file = os.path.join(new_folder, 'misc', 'bdv_server.txt')
    make_bdv_server_file(new_folder, server_file, relative_paths=True)
def build_parser():
    """ Create the command line parser of this script.

    Returns:
        argparse.ArgumentParser - parser with the positional 'transformation_file' and the
            options '--input_folder', '--source_prefix', '--target', '--max_jobs', '--new_tag'
    """
    parser = argparse.ArgumentParser(description='Update prospr registration in platy-browser-data.')
    parser.add_argument('transformation_file', type=str, help="path to transformation file")
    parser.add_argument('--input_folder', type=str, default="data/rawdata/prospr",
                        help="Folder with (not registered) input files")
    help_str = "Prefix for the input data. Please change this if you change the 'input_folder' from its default value"
    parser.add_argument('--source_prefix', type=str, default="prospr-6dpf-1-whole",
                        help=help_str)
    # restrict the target to the supported values; any other value used to
    # fall back to local computation without notice
    parser.add_argument('--target', type=str, default='slurm', choices=('slurm', 'local'),
                        help="Computation platform, can be 'slurm' or 'local'")
    parser.add_argument('--max_jobs', type=int, default=100,
                        help="Maximal number of jobs used for computation")
    parser.add_argument('--new_tag', type=str, default=None,
                        help="New version tag")
    return parser


def main(argv=None):
    """ Parse the command line and run the registration update.

    Arguments:
        argv [list[str]] - command line arguments; sys.argv is used if None (default: None)
    """
    args = build_parser().parse_args(argv)
    # a missing or empty tag means that the new tag is derived from the current one
    new_tag = args.new_tag or None
    update_regestration(args.transformation_file, args.input_folder, args.source_prefix,
                        args.target, args.max_jobs, new_tag)


if __name__ == '__main__':
    main()