_settings.json 4.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214
  {
    "settings": {
      "number_of_shards": 1,
      "index.mapping.total_fields.limit": 2000,
      "analysis": {
        "analyzer": {
          "fscrawler_path": {
            "tokenizer": "fscrawler_path"
          }
        },
        "tokenizer": {
          "fscrawler_path": {
            "type": "path_hierarchy"
          }
        }
      }
    },
    "mappings": {
      "dynamic_templates": [
        {
          "raw_as_text": {
            "path_match": "meta.raw.*",
            "mapping": {
              "type": "text",
              "fields": {
                "keyword": {
                  "type": "keyword",
                  "ignore_above": 256
                }
              }
            }
          }
        }
      ],
      "properties": {
        "attachment": {
          "type": "binary",
          "doc_values": false
        },
        "attributes": {
          "properties": {
            "group": {
              "type": "keyword"
            },
            "owner": {
              "type": "keyword"
            }
          }
        },
        "content": {
          "type": "text"
        },
        "file": {
          "properties": {
            "content_type": {
              "type": "keyword"
            },
            "filename": {
              "type": "keyword",
              "store": true
            },
            "extension": {
              "type": "keyword"
            },
            "filesize": {
              "type": "long"
            },
            "indexed_chars": {
              "type": "long"
            },
            "indexing_date": {
              "type": "date",
              "format": "date_optional_time"
            },
            "created": {
              "type": "date",
              "format": "date_optional_time"
            },
            "last_modified": {
              "type": "date",
              "format": "date_optional_time"
            },
            "last_accessed": {
              "type": "date",
              "format": "date_optional_time"
            },
            "checksum": {
              "type": "keyword"
            },
            "url": {
              "type": "keyword",
              "index": false
            }
          }
        },
        "meta": {
          "properties": {
            "author": {
              "type": "text"
            },
            "date": {
              "type": "date",
              "format": "date_optional_time"
            },
            "keywords": {
              "type": "text"
            },
            "title": {
              "type": "text"
            },
            "language": {
              "type": "keyword"
            },
            "format": {
              "type": "text"
            },
            "identifier": {
              "type": "text"
            },
            "contributor": {
              "type": "text"
            },
            "coverage": {
              "type": "text"
            },
            "modifier": {
              "type": "text"
            },
            "creator_tool": {
              "type": "keyword"
            },
            "publisher": {
              "type": "text"
            },
            "relation": {
              "type": "text"
            },
            "rights": {
              "type": "text"
            },
            "source": {
              "type": "text"
            },
            "type": {
              "type": "text"
            },
            "description": {
              "type": "text"
            },
            "created": {
              "type": "date",
              "format": "date_optional_time"
            },
            "print_date": {
              "type": "date",
              "format": "date_optional_time"
            },
            "metadata_date": {
              "type": "date",
              "format": "date_optional_time"
            },
            "latitude": {
              "type": "text"
            },
            "longitude": {
              "type": "text"
            },
            "altitude": {
              "type": "text"
            },
            "rating": {
              "type": "byte"
            },
            "comments": {
              "type": "text"
            }
          }
        },
        "path": {
          "properties": {
            "real": {
              "type": "keyword",
              "fields": {
                "tree": {
                  "type": "text",
                  "analyzer": "fscrawler_path",
                  "fielddata": true
                },
                "fulltext": {
                  "type": "text"
                }
              }
            },
            "root": {
              "type": "keyword"
            },
            "virtual": {
              "type": "keyword",
              "fields": {
                "tree": {
                  "type": "text",
                  "analyzer": "fscrawler_path",
                  "fielddata": true
                },
                "fulltext": {
                  "type": "text"
                }
              }
            }
          }
        }
      }
    }
  }