darknet-metadata.json 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481
  1. [
  2. {
  3. "name": "avgpool",
  4. "category": "Pool"
  5. },
  6. {
  7. "name": "batchnorm",
  8. "category": "Normalization"
  9. },
  10. {
  11. "name": "connected",
  12. "category": "Layer",
  13. "attributes": [
  14. { "name": "output", "type": "int32", "visible": false, "default": 1 },
  15. { "name": "activation", "type": "string", "default": "logistic", "description": "options are: LOGISTIC, RELU, RELIE, LINEAR, RAMP, TANH, PLSE, LEAKY, ELU, LOGGY, STAIR, HARDTAN, LHTAN, SELU, SWISH, MISH" },
  16. { "name": "batch_normalize", "type": "int32", "default": 0 }
  17. ]
  18. },
  19. {
  20. "name": "conv_lstm",
  21. "category": "Layer",
  22. "attributes": [
  23. { "name": "batch_normalize", "type": "int32", "default": 0 },
  24. { "name": "activation", "type": "string", "default": "linear", "description": "options are: LOGISTIC, RELU, RELIE, LINEAR, RAMP, TANH, PLSE, LEAKY, ELU, LOGGY, STAIR, HARDTAN, LHTAN, SELU, SWISH, MISH" },
  25. { "name": "size", "type": "int32", "default": 3 },
  26. { "name": "stride", "type": "int32", "default": 1 },
  27. { "name": "dilation", "default": 1 },
  28. { "name": "groups", "type": "int32", "default": 1 },
  29. { "name": "padding", "type": "int32", "default": 0 },
  30. { "name": "pad", "type": "int32", "default": 0 },
  31. { "name": "xnor", "type": "int32", "default": 0 },
  32. { "name": "shortcut", "default": 0 },
  33. { "name": "output", "type": "int32", "default": 1 },
  34. { "name": "state_constrain", "type": "int32", "default": 16 },
  35. { "name": "peephole", "type": "int32", "default": 0 }
  36. ]
  37. },
  38. {
  39. "name": "convolutional",
  40. "category": "Layer",
  41. "attributes": [
  42. { "name": "filters", "type": "int32", "default": 1 },
  43. { "name": "size", "type": "int32", "default": 1 },
  44. { "name": "stride", "type": "int32", "default": 1 },
  45. { "name": "stride_x", "type": "int32", "default": -1 },
  46. { "name": "stride_y", "type": "int32", "default": -1 },
  47. { "name": "groups", "type": "int32", "default": 1 },
  48. { "name": "padding", "type": "int32", "default": 0 },
  49. { "name": "pad", "type": "int32", "default": 0 },
  50. { "name": "dilation", "default": 1 },
  51. { "name": "share_index", "default": -1000000000 },
  52. { "name": "binary", "type": "int32", "default": 0 },
  53. { "name": "xnor", "type": "int32", "default": 0 },
  54. { "name": "bin_output", "type": "int32", "default": 0 },
  55. { "name": "flipped", "type": "int32", "default": 0 },
  56. { "name": "dot", "type": "float32", "default": 0 },
  57. { "name": "batch_normalize", "type": "int32", "default": 0 },
  58. { "name": "activation", "type": "string", "default": "logistic", "description": "options are: LOGISTIC, RELU, RELIE, LINEAR, RAMP, TANH, PLSE, LEAKY, ELU, LOGGY, STAIR, HARDTAN, LHTAN, SELU, SWISH, MISH" }
  59. ]
  60. },
  61. {
  62. "name": "cost",
  63. "category": "Activation",
  64. "attributes": [
  65. { "name": "type", "type": "string", "default": "sse" },
  66. { "name": "scale", "type": "float32", "default": 1 },
  67. { "name": "ratio", "type": "float32", "default": 0 }
  68. ]
  69. },
  70. {
  71. "name": "crnn",
  72. "category": "Layer",
  73. "attributes": [
  74. { "name": "batch_normalize", "type": "int32", "default": 0 },
  75. { "name": "activation", "type": "string", "default": "logistic" },
  76. { "name": "dilation", "default": 1 },
  77. { "name": "padding", "default": 0 },
  78. { "name": "pad", "type": "int32", "default": 0 },
  79. { "name": "groups", "type": "int32", "default": 1 },
  80. { "name": "xnor", "type": "int32", "default": 0 },
  81. { "name": "shortcut", "type": "int32", "default": 0 },
  82. { "name": "output_filters", "default": 1 },
  83. { "name": "hidden_filters", "default": 1 }
  84. ]
  85. },
  86. {
  87. "name": "crop",
  88. "category": "Shape",
  89. "attributes": [
  90. { "name": "crop_height", "type": "int32", "default": 1 },
  91. { "name": "crop_width", "type": "int32", "default": 1 },
  92. { "name": "flip", "type": "int32", "default": 0 },
  93. { "name": "exposure", "type": "float32", "default": 1 },
  94. { "name": "saturation", "type": "float32", "default": 1 },
  95. { "name": "angle", "type": "float32", "default": 0 },
  96. { "name": "noadjust", "default": 0 },
  97. { "name": "shift", "type": "float32", "default": 0 }
  98. ]
  99. },
  100. {
  101. "name": "deconvolutional",
  102. "category": "Layer",
  103. "attributes": [
  104. { "name": "filters", "type": "int32", "visible": false, "default": 1 },
  105. { "name": "size", "type": "int32", "default": 1 },
  106. { "name": "stride", "type": "int32", "default": 1 },
  107. { "name": "padding", "type": "int32", "default": 0 },
  108. { "name": "pad", "type": "int32", "default": 0 },
  109. { "name": "batch_normalize", "type": "int32", "default": 0 },
  110. { "name": "activation", "type": "string", "default": "logistic", "description": "options are: LOGISTIC, RELU, RELIE, LINEAR, RAMP, TANH, PLSE, LEAKY, ELU, LOGGY, STAIR, HARDTAN, LHTAN, SELU, SWISH, MISH" }
  111. ]
  112. },
  113. {
  114. "name": "detection",
  115. "category": "Layer",
  116. "attributes": [
  117. { "name": "classes", "type": "int32", "default": 1 },
  118. { "name": "coord", "type": "int32", "default": 1 },
  119. { "name": "num", "type": "int32", "default": 1 },
  120. { "name": "jitter", "type": "float32", "default": 0.2 },
  121. { "name": "coord_scale", "type": "float32", "default": 1 },
  122. { "name": "object_scale", "type": "float32", "default": 1 },
  123. { "name": "noobject_scale", "type": "float32", "default": 1 },
  124. { "name": "class_scale", "type": "float32", "default": 1 },
  125. { "name": "forced", "type": "int32", "default": 0 },
  126. { "name": "side", "type": "int32", "default": 7 },
  127. { "name": "softmax", "type": "int32", "default": 0 },
  128. { "name": "sqrt", "type": "int32", "default": 0 },
  129. { "name": "max", "type": "int32", "default": 30 },
  130. { "name": "rescore", "type": "int32", "default": 0 },
  131. { "name": "random", "type": "int32", "default": 0 },
  132. { "name": "reorg", "type": "int32", "default": 0 }
  133. ]
  134. },
  135. {
  136. "name": "dropout",
  137. "category": "Dropout",
  138. "attributes": [
  139. { "name": "probability", "type": "float32", "default": 0.5 },
  140. { "name": "dropblock", "type": "int32", "default": 0 },
  141. { "name": "dropblock_size_rel", "type": "float32", "default": 0 },
  142. { "name": "dropblock_size_abs", "type": "int32", "default": 7 }
  143. ]
  144. },
  145. {
  146. "name": "elu",
  147. "category": "Activation"
  148. },
  149. {
  150. "name": "gaussian_yolo",
  151. "category": "Layer",
  152. "attributes": [
  153. { "name": "classes", "type": "int32", "default": 20 },
  154. { "name": "num", "type": "int32", "default": 1 },
  155. { "name": "mask", "type": "string", "default": 0 },
  156. { "name": "jitter", "type": "float32", "default": 0.2 },
  157. { "name": "label_smooth_eps", "type": "float32", "default": 0 },
  158. { "name": "scale_x_y", "type": "float32", "default": 1 },
  159. { "name": "uc_normalizer", "type": "float32", "default": 1 },
  160. { "name": "iou_normalizer", "type": "float32", "default": 0.75 },
  161. { "name": "cls_normalizer", "type": "float32", "default": 1 },
  162. { "name": "iou_loss", "type": "string", "default": "mse", "description": "options are: mse, giou, diou, and ciou" },
  163. { "name": "max", "default": 90 },
  164. { "name": "ignore_thresh", "type": "float32", "default": 0.5 },
  165. { "name": "truth_thresh", "default": 1 },
  166. { "name": "iou_thresh", "type": "float32", "default": 1, "description": "recommended to use iou_thresh=0.213" },
  167. { "name": "random", "type": "int32", "default": 0 },
  168. { "name": "map", "type": "string", "default": 0 },
  169. { "name": "beta_nms", "type": "float32", "default": 0.6 },
  170. { "name": "nms_kind", "type": "string", "default": "default", "description": "options are: greedynms, diounms, cornersnms, or defaultnms" },
  171. { "name": "anchors", "type": "string", "default": 0 },
  172. { "name": "yolo_point", "type": "string", "default": "center", "description": "options are: center, left_top, and right_bottom" }
  173. ]
  174. },
  175. {
  176. "name": "gru",
  177. "category": "Layer",
  178. "attributes": [
  179. { "name": "output", "type": "int32", "visible": false, "default": 1 },
  180. { "name": "batch_normalize", "type": "int32", "default": 0 }
  181. ]
  182. },
  183. {
  184. "name": "h_swish",
  185. "category": "Activation"
  186. },
  187. {
  188. "name": "hardtan",
  189. "category": "Activation"
  190. },
  191. {
  192. "name": "leaky",
  193. "category": "Activation"
  194. },
  195. {
  196. "name": "lhtan",
  197. "category": "Activation"
  198. },
  199. {
  200. "name": "linear",
  201. "category": "Activation"
  202. },
  203. {
  204. "name": "local",
  205. "category": "Layer",
  206. "attributes": [
  207. { "name": "filters", "type": "int32", "visible": false, "default": 1 },
  208. { "name": "size", "type": "int32", "default": 1 },
  209. { "name": "stride", "type": "int32", "default": 1 },
  210. { "name": "padding", "type": "int32", "default": 0 },
  211. { "name": "pad", "type": "int32", "default": 0 },
  212. { "name": "activation", "type": "string", "default": "logistic", "description": "options are: LOGISTIC, RELU, RELIE, LINEAR, RAMP, TANH, PLSE, LEAKY, ELU, LOGGY, STAIR, HARDTAN, LHTAN, SELU, SWISH, MISH" }
  213. ]
  214. },
  215. {
  216. "name": "loggy",
  217. "category": "Activation"
  218. },
  219. {
  220. "name": "logistic",
  221. "category": "Activation"
  222. },
  223. {
  224. "name": "lstm",
  225. "category": "Layer",
  226. "attributes": [
  227. { "name": "output", "type": "int32", "visible": false, "default": 1 },
  228. { "name": "batch_normalize", "type": "int32", "default": 0 }
  229. ]
  230. },
  231. {
  232. "name": "maxpool",
  233. "category": "Pool",
  234. "attributes": [
  235. { "name": "stride", "type": "int32", "default": 1 },
  236. { "name": "stride_x", "type": "int32", "default": 1 },
  237. { "name": "stride_y", "type": "int32", "default": 1 },
  238. { "name": "size", "type": "int32", "default": 1 },
  239. { "name": "padding", "type": "int32", "default": 0 },
  240. { "name": "maxpool_depth", "type": "int32", "default": 0 },
  241. { "name": "out_channels", "default": 1 },
  242. { "name": "antialiasing", "type": "int32", "default": 0 }
  243. ]
  244. },
  245. {
  246. "name": "mish",
  247. "category": "Activation"
  248. },
  249. {
  250. "name": "net",
  251. "attributes": [
  252. { "name": "batch", "type": "int32", "default": 1 },
  253. { "name": "max_batches", "type": "int32", "default": 0, "description": "Limits the maximum number of iterations" },
  254. { "name": "learning_rate", "type": "float32", "default": 0.001 },
  255. { "name": "momentum", "type": "float32", "default": 0.9 },
  256. { "name": "decay", "type": "float32", "default": 0.0001 },
  257. { "name": "subdivisions", "type": "int32", "default": 1, "description": "In concert with the batch property, this greatly affects memory usage; the minimal working number is recommended" },
  258. { "name": "time_steps", "type": "int32", "default": 1 },
  259. { "name": "notruth", "type": "int32", "default": 0 },
  260. { "name": "random", "type": "int32", "default": 0 },
  261. { "name": "adam", "type": "int32", "default": 0 },
  262. { "name": "B1", "type": "float32", "default": 0.9 },
  263. { "name": "B2", "type": "float32", "default": 0.999 },
  264. { "name": "eps", "type": "float32", "default": 1e-7 },
  265. { "name": "height", "type": "int32", "default": 0 },
  266. { "name": "width", "type": "int32", "default": 0 },
  267. { "name": "channels", "type": "int32", "default": 0 },
  268. { "name": "inputs", "type": "int32" },
  269. { "name": "max_crop", "type": "int32" },
  270. { "name": "min_crop", "type": "int32" },
  271. { "name": "max_ratio", "type": "float32" },
  272. { "name": "min_ratio", "type": "float32" },
  273. { "name": "center", "type": "int32", "default": 0 },
  274. { "name": "clip", "type": "int32", "default": 0 },
  275. { "name": "angle", "type": "float32", "default": 0 },
  276. { "name": "aspect", "type": "float32", "default": 1 },
  277. { "name": "saturation", "type": "float32", "default": 1 },
  278. { "name": "exposure", "type": "float32", "default": 1 },
  279. { "name": "hue", "type": "float32", "default": 0 },
  280. { "name": "power", "type": "float32", "default": 4 },
  281. { "name": "flip", "type": "int32", "default": 1, "description": "Enables augmentation method: horizontal flip" },
  282. { "name": "blur", "type": "int32", "default": 0, "description": "Enables augmentation method: background blurring" },
  283. { "name": "mixup", "type": "int32", "default": 0, "description": "Enables augmentation method: images mixup" },
  284. { "name": "cutmix", "type": "int32", "default": 0, "description": "Enables augmentation method: images cutmix" },
  285. { "name": "mosaic", "type": "int32", "default": 0, "description": "Enables augmentation method: images mosaicing" },
  286. { "name": "letter_box", "type": "int32", "default": 0, "description": "Enables letter-box resizing (keeping the aspect ratio)" },
  287. { "name": "policy", "type": "string", "default": "constant" },
  288. { "name": "burn_in", "type": "int32", "default": 0, "description": "Is used for MAP calculation: permits a minimal number of iterations before the first MAP check" },
  289. { "name": "letter_box", "type": "int32", "default": 0 },
  290. { "name": "optimized_memory", "type": "int32", "default": 0, "description": "Can offload memory from GPU into CPU at the cost of speed; 3 options are possible, please look at: https://github.com/AlexeyAB/darknet/issues/4386" },
  291. { "name": "workspace_size_limit_MB", "type": "float32", "default": 1024 }
  292. ]
  293. },
  294. {
  295. "name": "norm_chan",
  296. "category": "Activation"
  297. },
  298. {
  299. "name": "norm_chan_softmax",
  300. "category": "Activation"
  301. },
  302. {
  303. "name": "normalization",
  304. "category": "Normalization",
  305. "attributes": [
  306. { "name": "alpha", "type": "float32", "default": 0.0001 },
  307. { "name": "beta", "type": "float32", "default": 0.75 },
  308. { "name": "kappa", "type": "float32", "default": 1 },
  309. { "name": "size", "default": 5 }
  310. ]
  311. },
  312. {
  313. "name": "plse",
  314. "category": "Activation"
  315. },
  316. {
  317. "name": "ramp",
  318. "category": "Activation"
  319. },
  320. {
  321. "name": "region",
  322. "category": "Layer",
  323. "attributes": [
  324. { "name": "classes", "type": "int32", "default": 20 },
  325. { "name": "coord", "default": 4 },
  326. { "name": "num", "default": 1 },
  327. { "name": "mask", "type": "string", "default": 0 },
  328. { "name": "jitter", "type": "float32", "default": 0.2 },
  329. { "name": "classfix", "type": "int32", "default": 0 },
  330. { "name": "coord_scale", "type": "float32", "default": 1 },
  331. { "name": "object_scale", "type": "float32", "default": 1 },
  332. { "name": "noobject_scale", "type": "float32", "default": 1 },
  333. { "name": "mask_scale", "type": "float32", "default": 1 },
  334. { "name": "class_scale", "type": "float32", "default": 1 },
  335. { "name": "bias_match", "type": "int32", "default": 0 },
  336. { "name": "focal_loss", "type": "int32", "default": 0 },
  337. { "name": "max", "type": "int32", "default": 90 },
  338. { "name": "softmax", "type": "int32", "default": 0 },
  339. { "name": "rescore", "type": "int32", "default": 0 },
  340. { "name": "thresh", "type": "float32", "default": 0.5 },
  341. { "name": "random", "type": "int32", "default": 0 },
  342. { "name": "map", "type": "string", "default": 0 },
  343. { "name": "tree", "type": "string", "default": 0 },
  344. { "name": "anchors", "type": "string", "default": 0 },
  345. { "name": "absolute", "default": 0 },
  346. { "name": "log", "default": 0 },
  347. { "name": "sqrt", "default": 0 }
  348. ]
  349. },
  350. {
  351. "name": "relie",
  352. "category": "Activation"
  353. },
  354. {
  355. "name": "relu",
  356. "category": "Activation"
  357. },
  358. {
  359. "name": "relu6",
  360. "category": "Activation"
  361. },
  362. {
  363. "name": "reorg",
  364. "category": "Shape",
  365. "attributes": [
  366. { "name": "stride", "default": 1 },
  367. { "name": "reverse", "type": "int32", "default": 0 }
  368. ]
  369. },
  370. {
  371. "name": "rnn",
  372. "category": "Layer",
  373. "attributes": [
  374. { "name": "output", "type": "int32", "visible": false },
  375. { "name": "hidden", "visible": false, "default": 1 },
  376. { "name": "activation", "type": "string", "default": "logistic", "description": "options are: LOGISTIC, RELU, RELIE, LINEAR, RAMP, TANH, PLSE, LEAKY, ELU, LOGGY, STAIR, HARDTAN, LHTAN, SELU, SWISH, MISH" },
  377. { "name": "groups", "type": "int32", "default": 1 },
  378. { "name": "xnor", "type": "int32", "default": 0 },
  379. { "name": "shortcut", "default": 0 },
  380. { "name": "logistic", "default": 0 },
  381. { "name": "batch_normalize", "type": "int32", "default": 0 }
  382. ]
  383. },
  384. {
  385. "name": "route",
  386. "category": "Tensor",
  387. "attributes": [
  388. { "name": "groups_id", "type": "int32", "default": 0 },
  389. { "name": "groups", "type": "int32", "default": 1 }
  390. ]
  391. },
  392. {
  393. "name": "sam",
  394. "category": "Tensor",
  395. "attributes": [
  396. { "name": "activation", "type": "string", "default": "linear", "description": "options are: LOGISTIC, RELU, RELIE, LINEAR, RAMP, TANH, PLSE, LEAKY, ELU, LOGGY, STAIR, HARDTAN, LHTAN, SELU" },
  397. { "name": "from", "description": "This param links the layer to another one; the index of the layer is either positive, in which case it's a direct address, or negative, in which case it's relative to the layer position" }
  398. ]
  399. },
  400. {
  401. "name": "scale_channels",
  402. "category": "Tensor",
  403. "attributes": [
  404. { "name": "activation", "type": "string", "default": "linear", "description": "options are: LOGISTIC, RELU, RELIE, LINEAR, RAMP, TANH, PLSE, LEAKY, ELU, LOGGY, STAIR, HARDTAN, LHTAN, SELU" },
  405. { "name": "scale_wh", "default": 0 },
  406. { "name": "from", "description": "This param links the layer to another one; the index of the layer is either positive, in which case it's a direct address, or negative, in which case it's relative to the layer position" }
  407. ]
  408. },
  409. {
  410. "name": "selu",
  411. "category": "Activation"
  412. },
  413. {
  414. "name": "silu",
  415. "category": "Activation"
  416. },
  417. {
  418. "name": "shortcut",
  419. "category": "Tensor",
  420. "attributes": [
  421. { "name": "activation", "type": "string", "default": "logistic", "description": "options are: LOGISTIC, RELU, RELIE, LINEAR, RAMP, TANH, PLSE, LEAKY, ELU, LOGGY, STAIR, HARDTAN, LHTAN, SELU, SWISH, MISH" },
  422. { "name": "assisted_excitation", "default": 0 },
  423. { "name": "from", "description": "This param links the layer to another one; the index of the layer is either positive, in which case it's a direct address, or negative, in which case it's relative to the layer position" }
  424. ]
  425. },
  426. {
  427. "name": "softmax",
  428. "category": "Activation",
  429. "attributes": [
  430. { "name": "groups", "type": "int32", "default": 1 },
  431. { "name": "temperature", "type": "float32", "default": 1 },
  432. { "name": "tree", "type": "string", "default": 0 },
  433. { "name": "spatial", "type": "int32", "default": 0 },
  434. { "name": "noloss", "type": "int32", "default": 0 }
  435. ]
  436. },
  437. {
  438. "name": "stair",
  439. "category": "Activation"
  440. },
  441. {
  442. "name": "swish",
  443. "category": "Activation"
  444. },
  445. {
  446. "name": "tanh",
  447. "category": "Activation"
  448. },
  449. {
  450. "name": "upsample",
  451. "category": "Shape",
  452. "attributes": [
  453. { "name": "stride", "type": "int32", "default": 2 },
  454. { "name": "scale", "type": "float32", "default": 1 }
  455. ]
  456. },
  457. {
  458. "name": "yolo",
  459. "category": "Layer",
  460. "attributes": [
  461. { "name": "classes", "type": "int32", "default": 20 },
  462. { "name": "num", "type": "int32", "default": 1 },
  463. { "name": "mask", "type": "int32[]", "default": 0 },
  464. { "name": "jitter", "type": "float32", "default": 0.2 },
  465. { "name": "label_smooth_eps", "type": "float32", "default": 0 },
  466. { "name": "scale_x_y", "type": "float32", "default": 1 },
  467. { "name": "iou_normalizer", "type": "float32", "default": 0.75 },
  468. { "name": "cls_normalizer", "type": "float32", "default": 1 },
  469. { "name": "iou_loss", "type": "string", "default": "mse", "description": "options are: mse, giou, diou, and ciou" },
  470. { "name": "focal_loss", "type": "int32", "default": 0 },
  471. { "name": "max", "type": "int32", "default": 90 },
  472. { "name": "ignore_thresh", "type": "float32", "default": 0.5 },
  473. { "name": "truth_thresh", "type": "float32", "default": 1 },
  474. { "name": "iou_thresh", "type": "float32", "default": 1, "description": "recommended to use iou_thresh=0.213" },
  475. { "name": "random", "type": "int32", "default": 0 },
  476. { "name": "map", "type": "string", "default": 0 },
  477. { "name": "nms_kind", "type": "string", "default": "default", "description": "options are: greedynms, diounms, cornersnms, or defaultnms" },
  478. { "name": "anchors", "type": "int32[]", "default": 0 }
  479. ]
  480. }
  481. ]