-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathrun_luigi_pipeline.py
executable file
·83 lines (74 loc) · 2.96 KB
/
run_luigi_pipeline.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
import argparse
import luigi
from cyto_ml.pipeline.pipeline_decollage import FlowCamPipeline
from cyto_ml.data.flowcam import parse_filename
import logging
logging.basicConfig(level=logging.INFO)


def build_parser():
    """Build the command-line parser for the FlowCam pipeline launcher.

    Returns:
        argparse.ArgumentParser: parser exposing ``--output_directory``,
        ``--directory``, ``--s3_bucket`` and ``--experiment_name``.
    """
    parser = argparse.ArgumentParser(
        prog="Luigi FlowCam pipeline",
        description="Triggers the process of decollaging images, embedding spatio-temporal metadata in headers, and uploading to s3 storage",
    )
    parser.add_argument(
        "-o",
        "--output_directory",
        type=str,
        default="./data/images_decollage",
        help="directory for intermediate data",
    )
    parser.add_argument(
        "-d",
        "--directory",
        type=str,
        default="./tests/fixtures/MicrobialMethane_MESO_Tank10_54.0143_-2.7770_04052023_1",
        help="input directory passed to the FlowCam pipeline",
    )
    parser.add_argument(
        "-s",
        "--s3_bucket",
        type=str,
        default="untagged-images-lana",
        help="name of the s3 bucket passed to the pipeline",
    )
    parser.add_argument(
        "-e",
        "--experiment_name",
        type=str,
        help="experiment name; derived from --directory when omitted",
    )
    return parser


def resolve_experiment_name(experiment_name, directory):
    """Return the experiment name to use for this pipeline run.

    An explicitly supplied name always wins. Otherwise the name is built by
    joining the first and fourth fields returned by ``parse_filename`` for
    ``directory``. If that fails with ``ValueError``, the second-to-last
    ``/``-separated component of ``directory`` is used as a best-effort
    fallback.

    Args:
        experiment_name: value of ``--experiment_name`` (may be ``None`` or
            empty).
        directory: value of ``--directory``.

    Returns:
        str: the experiment name.

    Raises:
        SystemExit: if no usable name can be derived, so the pipeline is
            never started with a missing experiment name.
    """
    if experiment_name:
        return experiment_name

    try:
        prefix, _, _, date, _ = parse_filename(directory)
        return "".join([prefix, date])
    except ValueError as err:
        # NOTE(review): assumes parse_filename signals an unparseable name
        # with ValueError; a wrong-length result also raises ValueError on
        # unpacking and lands here.
        logging.warning(
            "Couldn't figure out experiment name and date from %s"
            " - please call this with --experiment_name to set this",
            directory,
        )
        logging.debug(err)

    # TODO this properly: best-effort guess from the path itself.
    parts = str(directory).split("/")
    fallback = parts[-2] if len(parts) >= 2 else ""
    # "." / ".." are path navigation tokens, not meaningful experiment names.
    if fallback in ("", ".", ".."):
        raise SystemExit(
            f"Unable to derive an experiment name from {directory!r}; "
            "pass --experiment_name explicitly"
        )
    return fallback


def main(argv=None):
    """Parse the command line and submit the FlowCam pipeline to luigi.

    Args:
        argv: optional argument list; ``None`` makes argparse read
            ``sys.argv[1:]``.
    """
    args = build_parser().parse_args(argv)
    experiment = resolve_experiment_name(args.experiment_name, args.directory)

    luigi.build(
        [
            FlowCamPipeline(
                directory=args.directory,
                output_directory=args.output_directory,
                experiment_name=experiment,
                s3_bucket=args.s3_bucket,
            )
        ],
        local_scheduler=False,
    )


if __name__ == "__main__":
    main()