/
__main__.py
301 lines (274 loc) · 15.9 KB
/
__main__.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
import sys, os, argparse, glob, pathlib, time
import subprocess
import numpy as np
from natsort import natsorted
from tqdm import tqdm
from cellpose import utils, models, io
try:
from cellpose.gui import gui
GUI_ENABLED = True
except ImportError as err:
GUI_ERROR = err
GUI_ENABLED = False
GUI_IMPORT = True
except Exception as err:
GUI_ENABLED = False
GUI_ERROR = err
GUI_IMPORT = False
raise
import logging
logger = logging.getLogger(__name__)
def main():
parser = argparse.ArgumentParser(description='cellpose parameters')
parser.add_argument('--check_mkl', action='store_true', help='check if mkl working')
parser.add_argument('--mkldnn', action='store_true', help='for mxnet, force MXNET_SUBGRAPH_BACKEND = "MKLDNN"')
parser.add_argument('--train', action='store_true', help='train network using images in dir')
parser.add_argument('--dir', required=False,
default=[], type=str, help='folder containing data to run or train on')
parser.add_argument('--look_one_level_down', action='store_true',
help='')
parser.add_argument('--mxnet', action='store_true', help='use mxnet')
parser.add_argument('--img_filter', required=False,
default=[], type=str, help='end string for images to run on')
parser.add_argument('--use_gpu', action='store_true', help='use gpu if mxnet with cuda installed')
parser.add_argument('--fast_mode', action='store_true', help="make code run faster by turning off 4 network averaging")
parser.add_argument('--resample', action='store_true', help="run dynamics on full image (slower for images with large diameters)")
parser.add_argument('--no_interp', action='store_true', help='do not interpolate when running dynamics (was default)')
parser.add_argument('--do_3D', action='store_true',
help='process images as 3D stacks of images (nplanes x nchan x Ly x Lx')
# settings for running cellpose
parser.add_argument('--pretrained_model', required=False,
default='cyto', type=str, help='model to use')
parser.add_argument('--unet', required=False,
default=0, type=int, help='run standard unet instead of cellpose flow output')
parser.add_argument('--nclasses', required=False,
default=3, type=int, help='if running unet, choose 2 or 3, otherwise not used')
parser.add_argument('--chan', required=False,
default=0, type=int, help='channel to segment; 0: GRAY, 1: RED, 2: GREEN, 3: BLUE')
parser.add_argument('--chan2', required=False,
default=0, type=int, help='nuclear channel (if cyto, optional); 0: NONE, 1: RED, 2: GREEN, 3: BLUE')
parser.add_argument('--invert', required=False, action='store_true', help='invert grayscale channel')
parser.add_argument('--all_channels', action='store_true', help='use all channels in image if using own model and images with special channels')
parser.add_argument('--diameter', required=False,
default=30., type=float, help='cell diameter, if 0 cellpose will estimate for each image')
parser.add_argument('--flow_threshold', required=False,
default=0.4, type=float, help='flow error threshold, 0 turns off this optional QC step')
parser.add_argument('--cellprob_threshold', required=False,
default=0.0, type=float, help='cell probability threshold, centered at 0.0')
parser.add_argument('--save_png', action='store_true', help='save masks as png')
parser.add_argument('--save_outlines', action='store_true', help='save outlines as text file for ImageJ')
parser.add_argument('--save_tif', action='store_true', help='save masks as tif')
parser.add_argument('--no_npy', action='store_true', help='suppress saving of npy')
parser.add_argument('--channel_axis', required=False,
default=None, type=int, help='axis of image which corresponds to image channels')
parser.add_argument('--z_axis', required=False,
default=None, type=int, help='axis of image which corresponds to Z dimension')
parser.add_argument('--exclude_on_edges', action='store_true',
help='discard masks which touch edges of image')
# settings for training
parser.add_argument('--train_size', action='store_true', help='train size network at end of training')
parser.add_argument('--mask_filter', required=False,
default='_masks', type=str, help='end string for masks to run on')
parser.add_argument('--test_dir', required=False,
default=[], type=str, help='folder containing test data (optional)')
parser.add_argument('--learning_rate', required=False,
default=0.2, type=float, help='learning rate')
parser.add_argument('--n_epochs', required=False,
default=500, type=int, help='number of epochs')
parser.add_argument('--batch_size', required=False,
default=8, type=int, help='batch size')
parser.add_argument('--residual_on', required=False,
default=1, type=int, help='use residual connections')
parser.add_argument('--style_on', required=False,
default=1, type=int, help='use style vector')
parser.add_argument('--concatenation', required=False,
default=0, type=int, help='concatenate downsampled layers with upsampled layers (off by default which means they are added)')
args = parser.parse_args()
if args.check_mkl:
mkl_enabled = models.check_mkl((not args.mxnet))
else:
mkl_enabled = True
if not args.train and (mkl_enabled and args.mkldnn):
os.environ["MXNET_SUBGRAPH_BACKEND"]="MKLDNN"
else:
os.environ["MXNET_SUBGRAPH_BACKEND"]=""
if len(args.dir)==0:
if not GUI_ENABLED:
logger.critical('ERROR: %s'%GUI_ERROR)
if GUI_IMPORT:
logger.critical('GUI FAILED: GUI dependencies may not be installed, to install, run')
logger.critical(' pip install cellpose[gui]')
else:
gui.run()
else:
use_gpu = False
channels = [args.chan, args.chan2]
# find images
if len(args.img_filter)>0:
imf = args.img_filter
else:
imf = None
device, gpu = models.assign_device((not args.mxnet), args.use_gpu)
model_dir = models.model_dir
if not args.train and not args.train_size:
tic = time.time()
if not (args.pretrained_model=='cyto' or args.pretrained_model=='nuclei' or args.pretrained_model=='cyto2'):
cpmodel_path = args.pretrained_model
if not os.path.exists(cpmodel_path):
logger.warning('model path does not exist, using cyto model')
args.pretrained_model = 'cyto'
image_names = io.get_image_files(args.dir,
args.mask_filter,
imf=imf,
look_one_level_down=args.look_one_level_down)
nimg = len(image_names)
if args.diameter==0:
if args.pretrained_model=='cyto' or args.pretrained_model=='nuclei':
diameter = None
logger.info('>>>> estimating diameter for each image')
else:
logger.info('>>>> using user-specified model, no auto-diameter estimation available')
diameter = model.diam_mean
else:
diameter = args.diameter
logger.info('>>>> using diameter %0.2f for all images'%diameter)
cstr0 = ['GRAY', 'RED', 'GREEN', 'BLUE']
cstr1 = ['NONE', 'RED', 'GREEN', 'BLUE']
logger.info('>>>> running cellpose on %d images using chan_to_seg %s and chan (opt) %s'%
(nimg, cstr0[channels[0]], cstr1[channels[1]]))
if args.pretrained_model=='cyto' or args.pretrained_model=='nuclei' or args.pretrained_model=='cyto2':
if args.mxnet and args.pretrained_model=='cyto2':
logger.warning('cyto2 model not available in mxnet, using cyto model')
args.pretrained_model = 'cyto'
model = models.Cellpose(gpu=gpu, device=device, model_type=args.pretrained_model,
torch=(not args.mxnet))
else:
if args.all_channels:
channels = None
model = models.CellposeModel(gpu=gpu, device=device,
pretrained_model=cpmodel_path,
torch=(not args.mxnet))
tqdm_out = utils.TqdmToLogger(logger,level=logging.INFO)
for image_name in tqdm(image_names, file=tqdm_out):
image = io.imread(image_name)
out = model.eval(image, channels=channels, diameter=diameter,
do_3D=args.do_3D, net_avg=(not args.fast_mode),
augment=False,
resample=args.resample,
flow_threshold=args.flow_threshold,
cellprob_threshold=args.cellprob_threshold,
invert=args.invert,
batch_size=args.batch_size,
interp=(not args.no_interp),
channel_axis=args.channel_axis,
z_axis=args.z_axis)
masks, flows = out[:2]
if len(out) > 3:
diams = out[-1]
else:
diams = diameter
if args.exclude_on_edges:
masks = utils.remove_edge_masks(masks)
if not args.no_npy:
io.masks_flows_to_seg(image, masks, flows, diams, image_name, channels)
if args.save_png or args.save_tif or args.save_outlines:
io.save_masks(image, masks, flows, image_name,
png=args.save_png,
tif=args.save_tif,
outlines=args.save_outlines)
logger.info('>>>> completed in %0.3f sec'%(time.time()-tic))
else:
if args.pretrained_model=='cyto' or args.pretrained_model=='nuclei' or args.pretrained_model=='cyto2':
if args.mxnet and args.pretrained_model=='cyto2':
logger.warning('cyto2 model not available in mxnet, using cyto model')
args.pretrained_model = 'cyto'
torch_str = ['torch', '']
cpmodel_path = os.fspath(model_dir.joinpath('%s%s_0'%(args.pretrained_model, torch_str[args.mxnet])))
if args.pretrained_model=='cyto':
szmean = 30.
else:
szmean = 17.
else:
cpmodel_path = os.fspath(args.pretrained_model)
szmean = 30.
test_dir = None if len(args.test_dir)==0 else args.test_dir
output = io.load_train_test_data(args.dir, test_dir, imf, args.mask_filter, args.unet)
images, labels, image_names, test_images, test_labels, image_names_test = output
# training with all channels
if args.all_channels:
img = images[0]
if img.ndim==3:
nchan = min(img.shape)
elif img.ndim==2:
nchan = 1
channels = None
else:
nchan = 2
# model path
if not os.path.exists(cpmodel_path):
if not args.train:
error_message = 'ERROR: model path missing or incorrect - cannot train size model'
logger.critical(error_message)
raise ValueError(error_message)
cpmodel_path = False
logger.info('>>>> training from scratch')
if args.diameter==0:
rescale = False
logger.info('>>>> median diameter set to 0 => no rescaling during training')
else:
rescale = True
szmean = args.diameter
else:
rescale = True
args.diameter = szmean
logger.info('>>>> pretrained model %s is being used'%cpmodel_path)
args.residual_on = 1
args.style_on = 1
args.concatenation = 0
if rescale and args.train:
logger.info('>>>> during training rescaling images to fixed diameter of %0.1f pixels'%args.diameter)
# initialize model
if args.unet:
model = core.UnetModel(device=device,
pretrained_model=cpmodel_path,
diam_mean=szmean,
residual_on=args.residual_on,
style_on=args.style_on,
concatenation=args.concatenation,
nclasses=args.nclasses,
nchan=nchan)
else:
model = models.CellposeModel(device=device,
torch=(not args.mxnet),
pretrained_model=cpmodel_path,
diam_mean=szmean,
residual_on=args.residual_on,
style_on=args.style_on,
concatenation=args.concatenation,
nchan=nchan)
# train segmentation model
if args.train:
cpmodel_path = model.train(images, labels, train_files=image_names,
test_data=test_images, test_labels=test_labels, test_files=image_names_test,
learning_rate=args.learning_rate, channels=channels,
save_path=os.path.realpath(args.dir), rescale=rescale, n_epochs=args.n_epochs,
batch_size=args.batch_size)
model.pretrained_model = cpmodel_path
logger.info('>>>> model trained and saved to %s'%cpmodel_path)
# train size model
if args.train_size:
sz_model = models.SizeModel(cp_model=model, device=device)
sz_model.train(images, labels, test_images, test_labels, channels=channels, batch_size=args.batch_size)
if test_images is not None:
predicted_diams, diams_style = sz_model.eval(test_images, channels=channels)
if test_labels[0].ndim>2:
tlabels = [lbl[0] for lbl in test_labels]
else:
tlabels = test_labels
ccs = np.corrcoef(diams_style, np.array([utils.diameters(lbl)[0] for lbl in tlabels]))[0,1]
cc = np.corrcoef(predicted_diams, np.array([utils.diameters(lbl)[0] for lbl in tlabels]))[0,1]
logger.info('style test correlation: %0.4f; final test correlation: %0.4f'%(ccs,cc))
np.save(os.path.join(args.test_dir, '%s_predicted_diams.npy'%os.path.split(cpmodel_path)[1]),
{'predicted_diams': predicted_diams, 'diams_style': diams_style})
if __name__ == '__main__':
main()