| @@ -0,0 +1,244 @@ | ||
| [net] | ||
| batch=64 | ||
| subdivisions=8 | ||
| height=416 | ||
| width=416 | ||
| channels=3 | ||
| momentum=0.9 | ||
| decay=0.0005 | ||
| angle=0 | ||
| saturation = 1.5 | ||
| exposure = 1.5 | ||
| hue=.1 | ||
|
|
||
| learning_rate=0.0001 | ||
| max_batches = 45000 | ||
| policy=steps | ||
| steps=100,25000,35000 | ||
| scales=10,.1,.1 | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=32 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [maxpool] | ||
| size=2 | ||
| stride=2 | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=64 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [maxpool] | ||
| size=2 | ||
| stride=2 | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=128 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=64 | ||
| size=1 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=128 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [maxpool] | ||
| size=2 | ||
| stride=2 | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=256 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=128 | ||
| size=1 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=256 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [maxpool] | ||
| size=2 | ||
| stride=2 | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=512 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=256 | ||
| size=1 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=512 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=256 | ||
| size=1 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=512 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [maxpool] | ||
| size=2 | ||
| stride=2 | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=1024 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=512 | ||
| size=1 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=1024 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=512 | ||
| size=1 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=1024 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
|
|
||
| ####### | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| filters=1024 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| filters=1024 | ||
| activation=leaky | ||
|
|
||
| [route] | ||
| layers=-9 | ||
|
|
||
| [reorg] | ||
| stride=2 | ||
|
|
||
| [route] | ||
| layers=-1,-3 | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| filters=1024 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| size=1 | ||
| stride=1 | ||
| pad=1 | ||
| filters=125 | ||
| activation=linear | ||
|
|
||
| [region] | ||
| anchors = 1.08,1.19, 3.42,4.41, 6.63,11.38, 9.42,5.11, 16.62,10.52 | ||
| bias_match=1 | ||
| classes=20 | ||
| coords=4 | ||
| num=5 | ||
| softmax=1 | ||
| jitter=.2 | ||
| rescore=1 | ||
|
|
||
| object_scale=5 | ||
| noobject_scale=1 | ||
| class_scale=1 | ||
| coord_scale=1 | ||
|
|
||
| absolute=1 | ||
| thresh = .6 | ||
| random=0 |
| @@ -0,0 +1,257 @@ | ||
| [net] | ||
| batch=1 | ||
| subdivisions=1 | ||
| height=448 | ||
| width=448 | ||
| channels=3 | ||
| momentum=0.9 | ||
| decay=0.0005 | ||
| saturation=1.5 | ||
| exposure=1.5 | ||
| hue=.1 | ||
|
|
||
| learning_rate=0.0005 | ||
| policy=steps | ||
| steps=200,400,600,20000,30000 | ||
| scales=2.5,2,2,.1,.1 | ||
| max_batches = 40000 | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=64 | ||
| size=7 | ||
| stride=2 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [maxpool] | ||
| size=2 | ||
| stride=2 | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=192 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [maxpool] | ||
| size=2 | ||
| stride=2 | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=128 | ||
| size=1 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=256 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=256 | ||
| size=1 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=512 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [maxpool] | ||
| size=2 | ||
| stride=2 | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=256 | ||
| size=1 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=512 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=256 | ||
| size=1 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=512 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=256 | ||
| size=1 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=512 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=256 | ||
| size=1 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=512 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=512 | ||
| size=1 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=1024 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [maxpool] | ||
| size=2 | ||
| stride=2 | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=512 | ||
| size=1 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=1024 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=512 | ||
| size=1 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| filters=1024 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| activation=leaky | ||
|
|
||
| ####### | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| filters=1024 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| size=3 | ||
| stride=2 | ||
| pad=1 | ||
| filters=1024 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| filters=1024 | ||
| activation=leaky | ||
|
|
||
| [convolutional] | ||
| batch_normalize=1 | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| filters=1024 | ||
| activation=leaky | ||
|
|
||
| [local] | ||
| size=3 | ||
| stride=1 | ||
| pad=1 | ||
| filters=256 | ||
| activation=leaky | ||
|
|
||
| [dropout] | ||
| probability=.5 | ||
|
|
||
| [connected] | ||
| output= 1715 | ||
| activation=linear | ||
|
|
||
| [detection] | ||
| classes=20 | ||
| coords=4 | ||
| rescore=1 | ||
| side=7 | ||
| num=3 | ||
| softmax=0 | ||
| sqrt=1 | ||
| jitter=.2 | ||
|
|
||
| object_scale=1 | ||
| noobject_scale=.5 | ||
| class_scale=1 | ||
| coord_scale=5 | ||
|
|
| @@ -0,0 +1,80 @@ | ||
| person | ||
| bicycle | ||
| car | ||
| motorbike | ||
| aeroplane | ||
| bus | ||
| train | ||
| truck | ||
| boat | ||
| traffic light | ||
| fire hydrant | ||
| stop sign | ||
| parking meter | ||
| bench | ||
| bird | ||
| cat | ||
| dog | ||
| horse | ||
| sheep | ||
| cow | ||
| elephant | ||
| bear | ||
| zebra | ||
| giraffe | ||
| backpack | ||
| umbrella | ||
| handbag | ||
| tie | ||
| suitcase | ||
| frisbee | ||
| skis | ||
| snowboard | ||
| sports ball | ||
| kite | ||
| baseball bat | ||
| baseball glove | ||
| skateboard | ||
| surfboard | ||
| tennis racket | ||
| bottle | ||
| wine glass | ||
| cup | ||
| fork | ||
| knife | ||
| spoon | ||
| bowl | ||
| banana | ||
| apple | ||
| sandwich | ||
| orange | ||
| broccoli | ||
| carrot | ||
| hot dog | ||
| pizza | ||
| donut | ||
| cake | ||
| chair | ||
| sofa | ||
| pottedplant | ||
| bed | ||
| diningtable | ||
| toilet | ||
| tvmonitor | ||
| laptop | ||
| mouse | ||
| remote | ||
| keyboard | ||
| cell phone | ||
| microwave | ||
| oven | ||
| toaster | ||
| sink | ||
| refrigerator | ||
| book | ||
| clock | ||
| vase | ||
| scissors | ||
| teddy bear | ||
| hair drier | ||
| toothbrush |
| @@ -5,7 +5,7 @@ | ||
|
|
||
| route_layer make_route_layer(int batch, int n, int *input_layers, int *input_sizes) | ||
| { | ||
| fprintf(stderr,"route "); | ||
| route_layer l = {0}; | ||
| l.type = ROUTE; | ||
| l.batch = batch; | ||