# questions.yaml 15 KB
  # Named groups; each question's `group:` value refers to one of these names.
  groups:
  - name: FSCrawler Configuration
    description: Configure FSCrawler
  - name: Network Configuration
    description: Configure Network for FSCrawler
  - name: Storage Configuration
    description: Configure Storage for FSCrawler
  - name: Resources Configuration
    description: Configure Resources for FSCrawler
  questions:
  # Timezone: a required string that defaults to Etc/UTC.
  - variable: TZ
    group: FSCrawler Configuration
    label: Timezone
    schema:
      type: string
      default: Etc/UTC
      required: true
      # `definitions/timezone` is not defined in this file; presumably it is
      # resolved by the platform that consumes the schema - confirm.
      $ref:
      - definitions/timezone
  # FSCrawler settings: image flavour, job name, loop count, restart flag and
  # extra environment variables.
  - variable: fscrawlerConfig
    label: ''
    group: FSCrawler Configuration
    schema:
      type: dict
      attrs:
      # Image flavour; one of the two enum values below, default `ocrImage`.
      - variable: imageSelector
        label: Image
        description: |
          The image to use for FSCrawler.</br>
          Images with OCR support are a lot larger than images without OCR support.</br>
          Approximate image sizes:</br>
          - With OCR Support: 1.2GB</br>
          - Without OCR Support: 0.5GB
        schema:
          type: string
          default: 'ocrImage'
          required: true
          enum:
          - value: 'ocrImage'
            description: With OCR Support - Elasticsearch 7 and 8
          - value: 'noocrImage'
            description: Without OCR Support - Elasticsearch 7 and 8
      # Required job name; the default is the empty string, so the user has to
      # supply a value.
      - variable: jobName
        label: Job Name
        description: |
          The name of the FSCrawler job to run. </br>
          A _settings.yaml file in the directory named after the job name will have to be manually created.
        schema:
          type: string
          default: ''
          required: true
      # Loop count; -1 (the default and the minimum) means run forever.
      - variable: loop
        label: Loop
        description: |
          The number of times to run the job.</br>
          https://fscrawler.readthedocs.io/en/latest/admin/cli-options.html#loop </br>
          -1 means run forever. </br>
          0 means never run. </br>
        schema:
          type: int
          default: -1
          required: true
          min: -1
      # Optional flag, off by default.
      - variable: restart
        label: Restart
        description: |
          Restart the job from the beginning.</br>
          https://fscrawler.readthedocs.io/en/latest/admin/cli-options.html#restart
        schema:
          type: boolean
          default: false
      # List of name/value pairs; empty by default, both fields required per
      # entry.
      - variable: additionalEnvs
        label: Additional Environment Variables
        description: Configure additional environment variables for FSCrawler.
        schema:
          type: list
          default: []
          items:
          - variable: env
            label: Environment Variable
            schema:
              type: dict
              attrs:
              - variable: name
                label: Name
                schema:
                  type: string
                  required: true
              - variable: value
                label: Value
                schema:
                  type: string
                  required: true
  # Network settings: optional REST API service, its port, and host networking.
  - variable: fscrawlerNetwork
    label: ''
    group: Network Configuration
    schema:
      type: dict
      attrs:
      # Off by default; `restPort` below is only shown when this is true.
      - variable: enableRestApiService
        label: Enable Rest API Service
        description: |
          Enable Rest API Service for FSCrawler.</br>
          https://fscrawler.readthedocs.io/en/latest/admin/fs/rest.html</br>
          Additional configuration is needed in the job file. Check the Notes card
          after installation for more information.
        schema:
          type: boolean
          default: false
      # Port in the range 9000-65535, default 30084.
      - variable: restPort
        label: Rest Port
        description: The port to use for the Rest API Service.
        schema:
          type: int
          # `'='` must stay quoted: a bare `=` is not a plain string for every
          # YAML 1.1 loader.
          show_if: [['enableRestApiService', '=', true]]
          default: 30084
          min: 9000
          max: 65535
          required: true
      # Off by default.
      - variable: hostNetwork
        label: Host Network
        description: |
          Bind to the host network. It's recommended to keep this disabled.
        schema:
          type: boolean
          default: false
  # Storage settings: the mandatory jobs volume plus a user-defined list of
  # additional volumes.
  - variable: fscrawlerStorage
    label: ''
    group: Storage Configuration
    schema:
      type: dict
      attrs:
      # Jobs volume: either an ixVolume or an existing host path.
      - variable: jobs
        label: FSCrawler Jobs Storage
        description: The path to store FSCrawler Jobs.
        schema:
          type: dict
          attrs:
          # Storage backend selector; immutable, defaults to `ixVolume`.
          - variable: type
            label: Type
            description: |
              ixVolume: Is dataset created automatically by the system.</br>
              Host Path: Is a path that already exists on the system.
            schema:
              type: string
              required: true
              immutable: true
              default: 'ixVolume'
              enum:
              - value: 'hostPath'
                description: Host Path (Path that already exists on the system)
              - value: 'ixVolume'
                description: ixVolume (Dataset created automatically by the system)
          # Shown only when `type` is `ixVolume`.
          - variable: ixVolumeConfig
            label: ixVolume Configuration
            description: The configuration for the ixVolume dataset.
            schema:
              type: dict
              show_if: [['type', '=', 'ixVolume']]
              # `normalize/ixVolume` is not defined in this file; presumably
              # handled by the consuming platform - confirm.
              $ref:
              - 'normalize/ixVolume'
              attrs:
              - variable: aclEnable
                label: Enable ACL
                description: Enable ACL for the dataset.
                schema:
                  type: boolean
                  default: false
              # Hidden, immutable dataset name fixed to `jobs`.
              - variable: datasetName
                label: Dataset Name
                description: The name of the dataset to use for storage.
                schema:
                  type: string
                  required: true
                  immutable: true
                  hidden: true
                  default: 'jobs'
              # Shown only when `aclEnable` is true; no attrs are declared here.
              - variable: aclEntries
                label: ACL Configuration
                schema:
                  type: dict
                  show_if: [['aclEnable', '=', true]]
                  attrs: []
          # Shown only when `type` is `hostPath`.
          - variable: hostPathConfig
            label: Host Path Configuration
            schema:
              type: dict
              show_if: [['type', '=', 'hostPath']]
              attrs:
              - variable: aclEnable
                label: Enable ACL
                description: Enable ACL for the dataset.
                schema:
                  type: boolean
                  default: false
              # `acl` and `hostPath` are mutually exclusive: the first shows
              # when `aclEnable` is true, the second when it is false.
              - variable: acl
                label: ACL Configuration
                schema:
                  type: dict
                  show_if: [['aclEnable', '=', true]]
                  attrs: []
                  $ref:
                  - 'normalize/acl'
              - variable: hostPath
                label: Host Path
                description: The host path to use for storage.
                schema:
                  type: hostpath
                  show_if: [['aclEnable', '=', false]]
                  required: true
      # Additional volumes; empty list by default.
      - variable: additionalStorages
        label: Additional Storage
        description: Additional storage for FSCrawler.
        schema:
          type: list
          default: []
          items:
          - variable: storageEntry
            label: Storage Entry
            schema:
              type: dict
              attrs:
              # Storage backend selector; immutable, defaults to `ixVolume`.
              # Adds an SMB option on top of the two offered for the jobs
              # volume.
              - variable: type
                label: Type
                description: |
                  ixVolume: Is dataset created automatically by the system.</br>
                  Host Path: Is a path that already exists on the system.</br>
                  SMB Share: Is a SMB share that is mounted to a persistent volume claim.
                schema:
                  type: string
                  required: true
                  default: 'ixVolume'
                  immutable: true
                  enum:
                  - value: 'hostPath'
                    description: Host Path (Path that already exists on the system)
                  - value: 'ixVolume'
                    description: ixVolume (Dataset created automatically by the system)
                  - value: 'smb-pv-pvc'
                    description: SMB Share (Mounts a persistent volume claim to a SMB share)
              - variable: readOnly
                label: Read Only
                description: Mount the volume as read only.
                schema:
                  type: boolean
                  default: false
              - variable: mountPath
                label: Mount Path
                description: The path inside the container to mount the storage.
                schema:
                  type: path
                  required: true
              # Shown only when `type` is `hostPath`.
              - variable: hostPathConfig
                label: Host Path Configuration
                schema:
                  type: dict
                  show_if: [['type', '=', 'hostPath']]
                  attrs:
                  - variable: aclEnable
                    label: Enable ACL
                    description: Enable ACL for the dataset.
                    schema:
                      type: boolean
                      default: false
                  # `acl` and `hostPath` are mutually exclusive: the first
                  # shows when `aclEnable` is true, the second when it is
                  # false.
                  - variable: acl
                    label: ACL Configuration
                    schema:
                      type: dict
                      show_if: [['aclEnable', '=', true]]
                      attrs: []
                      $ref:
                      - 'normalize/acl'
                  - variable: hostPath
                    label: Host Path
                    description: The host path to use for storage.
                    schema:
                      type: hostpath
                      show_if: [['aclEnable', '=', false]]
                      required: true
              # Shown only when `type` is `ixVolume`.
              - variable: ixVolumeConfig
                label: ixVolume Configuration
                description: The configuration for the ixVolume dataset.
                schema:
                  type: dict
                  show_if: [['type', '=', 'ixVolume']]
                  $ref:
                  - 'normalize/ixVolume'
                  attrs:
                  - variable: aclEnable
                    label: Enable ACL
                    description: Enable ACL for the dataset.
                    schema:
                      type: boolean
                      default: false
                  # Visible here (no `hidden` flag), unlike the jobs volume.
                  - variable: datasetName
                    label: Dataset Name
                    description: The name of the dataset to use for storage.
                    schema:
                      type: string
                      required: true
                      immutable: true
                      default: 'storage_entry'
                  - variable: aclEntries
                    label: ACL Configuration
                    schema:
                      type: dict
                      show_if: [['aclEnable', '=', true]]
                      attrs: []
              # Shown only when `type` is `smb-pv-pvc`.
              - variable: smbConfig
                label: SMB Share Configuration
                description: The configuration for the SMB Share.
                schema:
                  type: dict
                  show_if: [['type', '=', 'smb-pv-pvc']]
                  attrs:
                  - variable: server
                    label: Server
                    description: The server for the SMB share.
                    schema:
                      type: string
                      required: true
                  - variable: share
                    label: Share
                    description: The share name for the SMB share.
                    schema:
                      type: string
                      required: true
                  # The only SMB field without `required: true`.
                  - variable: domain
                    label: Domain (Optional)
                    description: The domain for the SMB share.
                    schema:
                      type: string
                  - variable: username
                    label: Username
                    description: The username for the SMB share.
                    schema:
                      type: string
                      required: true
                  # Marked `private`; presumably masked by the UI - confirm.
                  - variable: password
                    label: Password
                    description: The password for the SMB share.
                    schema:
                      type: string
                      required: true
                      private: true
                  # Whole number of Gi, at least 1.
                  - variable: size
                    label: Size (in Gi)
                    description: The size of the volume quota.
                    schema:
                      type: int
                      required: true
                      min: 1
                      default: 1
  # Resource limits for FSCrawler: CPU (default 4000m) and memory (default
  # 8Gi). Both are required strings validated by the regexes below.
  # NOTE(review): the formats look like Kubernetes resource quantities -
  # confirm how the values are consumed.
  - variable: resources
    group: Resources Configuration
    label: ''
    schema:
      type: dict
      attrs:
      - variable: limits
        label: Limits
        schema:
          type: dict
          attrs:
          - variable: cpu
            label: CPU
            description: CPU limit for FSCrawler.
            schema:
              type: string
              max_length: 6
              # Accepts 0.1-0.9, a positive integer, an integer with one
              # decimal digit, or an integer followed by `m`. The optional
              # suffix is bound to the integer branch only, so malformed
              # values such as `0.5.5` or `0.5m` no longer pass validation.
              valid_chars: '^(0\.[1-9]|[1-9][0-9]*(\.[0-9]|m)?)$'
              valid_chars_error: |
                Valid CPU limit formats are</br>
                - Plain Integer - eg. 1</br>
                - Float - eg. 0.5</br>
                - Millicpu - eg. 500m
              default: '4000m'
              required: true
          - variable: memory
            label: Memory
            description: Memory limit for FSCrawler.
            schema:
              type: string
              max_length: 12
              # Accepts a positive integer, optionally followed by one of
              # E/P/T/G/M/K (each with an optional `i`) or an `e<digits>`
              # exponent.
              # NOTE(review): Kubernetes documents lowercase `k` for the
              # decimal kilo suffix; confirm whether a bare `K` is accepted
              # downstream before changing this pattern.
              valid_chars: '^[1-9][0-9]*([EPTGMK]i?|e[0-9]+)?$'
              valid_chars_error: |
                Valid Memory limit formats are</br>
                - Suffixed with E/P/T/G/M/K - eg. 1G</br>
                - Suffixed with Ei/Pi/Ti/Gi/Mi/Ki - eg. 1Gi</br>
                - Plain Integer in bytes - eg. 1024</br>
                - Exponent - eg. 134e6
              default: '8Gi'
              required: true