# darknet-yolov3.cfg (8.2 KB)


  # Based on cfg/yolov3-voc.cfg
  #
  # Network-wide settings. The "Testing" pair is commented out, so the
  # "Training" values (batch=64, subdivisions=16) are the ones in effect.
  # To switch modes, comment one pair and uncomment the other.
  [net]
  # Testing
  # batch=1
  # subdivisions=1
  # Training
  batch=64
  subdivisions=16
  width=416
  height=416
  channels=3
  momentum=0.9
  decay=0.0005
  angle=0
  saturation = 1.5
  exposure = 1.5
  hue=.1
  learning_rate=0.001
  burn_in=400
  max_batches=5200
  policy=steps
  # steps and scales each hold a single value here. Presumably the learning
  # rate is multiplied by scales (.1) once batch 3800 is reached - confirm
  # against the Darknet documentation for policy=steps.
  steps=3800
  scales=.1
  # Stem: one 3x3 convolution with 32 filters at stride 1.
  [convolutional]
  batch_normalize=1
  filters=32
  size=3
  stride=1
  pad=1
  activation=leaky

  # Downsample
  # 64-filter stage: a stride-2 convolution, then one group of
  # (1x1 conv with 32 filters, 3x3 conv with 64 filters, shortcut).
  [convolutional]
  batch_normalize=1
  filters=64
  size=3
  stride=2
  pad=1
  activation=leaky

  # Group 1 of 1
  [convolutional]
  batch_normalize=1
  filters=32
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=64
  size=3
  stride=1
  pad=1
  activation=leaky

  # from=-3 presumably counts sections backwards, which would land on the
  # stride-2 convolution above - confirm against the Darknet shortcut layer.
  [shortcut]
  from=-3
  activation=linear
  # Downsample
  # 128-filter stage: a stride-2 convolution, then 2 groups of
  # (1x1 conv with 64 filters, 3x3 conv with 128 filters, shortcut from=-3).
  [convolutional]
  batch_normalize=1
  filters=128
  size=3
  stride=2
  pad=1
  activation=leaky

  # Group 1 of 2
  [convolutional]
  batch_normalize=1
  filters=64
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=128
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear

  # Group 2 of 2
  [convolutional]
  batch_normalize=1
  filters=64
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=128
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear
  # Downsample
  # 256-filter stage: a stride-2 convolution, then 8 groups of
  # (1x1 conv with 128 filters, 3x3 conv with 256 filters, shortcut from=-3).
  [convolutional]
  batch_normalize=1
  filters=256
  size=3
  stride=2
  pad=1
  activation=leaky

  # Group 1 of 8
  [convolutional]
  batch_normalize=1
  filters=128
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=256
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear

  # Group 2 of 8
  [convolutional]
  batch_normalize=1
  filters=128
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=256
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear

  # Group 3 of 8
  [convolutional]
  batch_normalize=1
  filters=128
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=256
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear

  # Group 4 of 8
  [convolutional]
  batch_normalize=1
  filters=128
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=256
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear

  # Group 5 of 8
  [convolutional]
  batch_normalize=1
  filters=128
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=256
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear

  # Group 6 of 8
  [convolutional]
  batch_normalize=1
  filters=128
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=256
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear

  # Group 7 of 8
  [convolutional]
  batch_normalize=1
  filters=128
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=256
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear

  # Group 8 of 8
  [convolutional]
  batch_normalize=1
  filters=128
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=256
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear
  # Downsample
  # 512-filter stage: a stride-2 convolution, then 8 groups of
  # (1x1 conv with 256 filters, 3x3 conv with 512 filters, shortcut from=-3).
  [convolutional]
  batch_normalize=1
  filters=512
  size=3
  stride=2
  pad=1
  activation=leaky

  # Group 1 of 8
  [convolutional]
  batch_normalize=1
  filters=256
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=512
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear

  # Group 2 of 8
  [convolutional]
  batch_normalize=1
  filters=256
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=512
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear

  # Group 3 of 8
  [convolutional]
  batch_normalize=1
  filters=256
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=512
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear

  # Group 4 of 8
  [convolutional]
  batch_normalize=1
  filters=256
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=512
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear

  # Group 5 of 8
  [convolutional]
  batch_normalize=1
  filters=256
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=512
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear

  # Group 6 of 8
  [convolutional]
  batch_normalize=1
  filters=256
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=512
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear

  # Group 7 of 8
  [convolutional]
  batch_normalize=1
  filters=256
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=512
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear

  # Group 8 of 8
  [convolutional]
  batch_normalize=1
  filters=256
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=512
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear
  # Downsample
  # 1024-filter stage: a stride-2 convolution, then 4 groups of
  # (1x1 conv with 512 filters, 3x3 conv with 1024 filters, shortcut from=-3).
  [convolutional]
  batch_normalize=1
  filters=1024
  size=3
  stride=2
  pad=1
  activation=leaky

  # Group 1 of 4
  [convolutional]
  batch_normalize=1
  filters=512
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=1024
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear

  # Group 2 of 4
  [convolutional]
  batch_normalize=1
  filters=512
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=1024
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear

  # Group 3 of 4
  [convolutional]
  batch_normalize=1
  filters=512
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=1024
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear

  # Group 4 of 4
  [convolutional]
  batch_normalize=1
  filters=512
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  filters=1024
  size=3
  stride=1
  pad=1
  activation=leaky

  [shortcut]
  from=-3
  activation=linear
  ######################
  # Detection head 1: three pairs of (1x1 conv with 512 filters, 3x3 conv
  # with 1024 filters), one linear 1x1 convolution with 18 filters, then the
  # [yolo] section that uses mask = 6,7,8.

  # Pair 1 of 3
  [convolutional]
  batch_normalize=1
  filters=512
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  size=3
  stride=1
  pad=1
  filters=1024
  activation=leaky

  # Pair 2 of 3
  [convolutional]
  batch_normalize=1
  filters=512
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  size=3
  stride=1
  pad=1
  filters=1024
  activation=leaky

  # Pair 3 of 3
  [convolutional]
  batch_normalize=1
  filters=512
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  size=3
  stride=1
  pad=1
  filters=1024
  activation=leaky

  # Output convolution for this head (no batch_normalize key, linear activation).
  [convolutional]
  size=1
  stride=1
  pad=1
  # filters = (num/3) * (5+classes)
  # With num=9 and classes=1 from the [yolo] section below: (9/3) * (5+1) = 18.
  # Update this value whenever classes changes.
  filters=18
  activation=linear

  # mask names three of the nine anchor pairs listed in anchors (num=9);
  # presumably 0-based indices, so 6,7,8 would be the last three - confirm.
  [yolo]
  mask = 6,7,8
  anchors = 10,13, 16,30, 33,23, 30,61, 62,45, 59,119, 116,90, 156,198, 373,326
  classes=1
  num=9
  jitter=.3
  ignore_thresh = .5
  truth_thresh = 1
  random=1
  # Detection head 2: route back, 1x1 conv with 256 filters, upsample by 2,
  # route together with an earlier layer, three pairs of (1x1 conv with 256
  # filters, 3x3 conv with 512 filters), one linear 1x1 convolution with 18
  # filters, then the [yolo] section that uses mask = 3,4,5.

  # Counting sections backwards, -4 would be the 512-filter 1x1 convolution
  # that precedes the previous head's last 3x3 convolution - assumes relative
  # indices count from this section; confirm.
  [route]
  layers = -4

  [convolutional]
  batch_normalize=1
  filters=256
  size=1
  stride=1
  pad=1
  activation=leaky

  [upsample]
  stride=2

  # -1 is presumably the upsample section directly above. Counting sections
  # after [net] from 0, index 61 is the last [shortcut] of the 512-filter
  # stage - assumes Darknet's 0-based layer numbering; confirm.
  [route]
  layers = -1, 61

  # Pair 1 of 3
  [convolutional]
  batch_normalize=1
  filters=256
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  size=3
  stride=1
  pad=1
  filters=512
  activation=leaky

  # Pair 2 of 3
  [convolutional]
  batch_normalize=1
  filters=256
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  size=3
  stride=1
  pad=1
  filters=512
  activation=leaky

  # Pair 3 of 3
  [convolutional]
  batch_normalize=1
  filters=256
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  size=3
  stride=1
  pad=1
  filters=512
  activation=leaky

  # Output convolution for this head (no batch_normalize key, linear activation).
  [convolutional]
  size=1
  stride=1
  pad=1
  # filters = (num/3) * (5+classes)
  # With num=9 and classes=1 from the [yolo] section below: (9/3) * (5+1) = 18.
  # Update this value whenever classes changes.
  filters=18
  activation=linear

  # mask names three of the nine anchor pairs listed in anchors (num=9);
  # presumably 0-based indices, so 3,4,5 would be the middle three - confirm.
  [yolo]
  mask = 3,4,5
  anchors = 10,13, 16,30, 33,23, 30,61, 62,45, 59,119, 116,90, 156,198, 373,326
  classes=1
  num=9
  jitter=.3
  ignore_thresh = .5
  truth_thresh = 1
  random=1
  # Detection head 3: route back, 1x1 conv with 128 filters, upsample by 4,
  # route together with an earlier layer, three pairs of (1x1 conv with 128
  # filters, 3x3 conv with 256 filters), one linear 1x1 convolution with 18
  # filters, then the [yolo] section that uses mask = 0,1,2.

  # Counting sections backwards, -4 would be the 256-filter 1x1 convolution
  # that precedes the previous head's last 3x3 convolution - assumes relative
  # indices count from this section; confirm.
  [route]
  layers = -4

  [convolutional]
  batch_normalize=1
  filters=128
  size=1
  stride=1
  pad=1
  activation=leaky

  # NOTE(review): stride=4 here differs from the stride=2 upsample used in the
  # previous head. It appears to be paired with the route to layer 11 below;
  # confirm the two are meant to change together before editing either one.
  [upsample]
  stride=4

  # -1 is presumably the upsample section directly above. Counting sections
  # after [net] from 0, index 11 is the last [shortcut] of the 128-filter
  # stage - assumes Darknet's 0-based layer numbering; confirm.
  [route]
  layers = -1, 11

  # Pair 1 of 3
  [convolutional]
  batch_normalize=1
  filters=128
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  size=3
  stride=1
  pad=1
  filters=256
  activation=leaky

  # Pair 2 of 3
  [convolutional]
  batch_normalize=1
  filters=128
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  size=3
  stride=1
  pad=1
  filters=256
  activation=leaky

  # Pair 3 of 3
  [convolutional]
  batch_normalize=1
  filters=128
  size=1
  stride=1
  pad=1
  activation=leaky

  [convolutional]
  batch_normalize=1
  size=3
  stride=1
  pad=1
  filters=256
  activation=leaky

  # Output convolution for this head (no batch_normalize key, linear activation).
  [convolutional]
  size=1
  stride=1
  pad=1
  # filters = (num/3) * (5+classes)
  # With num=9 and classes=1 from the [yolo] section below: (9/3) * (5+1) = 18.
  # Update this value whenever classes changes.
  filters=18
  activation=linear

  # mask names three of the nine anchor pairs listed in anchors (num=9);
  # presumably 0-based indices, so 0,1,2 would be the first three - confirm.
  [yolo]
  mask = 0,1,2
  anchors = 10,13, 16,30, 33,23, 30,61, 62,45, 59,119, 116,90, 156,198, 373,326
  classes=1
  num=9
  jitter=.3
  ignore_thresh = .5
  truth_thresh = 1
  random=1