libis-format 0.9.5-java

Sign up to get free protection for your applications and to get access to all the features.
Files changed (207) hide show
  1. checksums.yaml +7 -0
  2. data/.coveralls.yml +2 -0
  3. data/.gitignore +18 -0
  4. data/.travis.yml +41 -0
  5. data/Gemfile +5 -0
  6. data/LICENSE.txt +22 -0
  7. data/README.md +39 -0
  8. data/Rakefile +8 -0
  9. data/bin/droid +15 -0
  10. data/bin/fido +12 -0
  11. data/bin/pdf_copy +13 -0
  12. data/data/ISOcoated_v2_eci.icc +0 -0
  13. data/data/PDFA_def.ps +40 -0
  14. data/data/ead.xsd +2728 -0
  15. data/data/eciRGB_v2.icc +0 -0
  16. data/data/lias_formats.xml +106 -0
  17. data/data/types.yml +217 -0
  18. data/lib/libis/format/config.rb +35 -0
  19. data/lib/libis/format/converter/base.rb +101 -0
  20. data/lib/libis/format/converter/chain.rb +167 -0
  21. data/lib/libis/format/converter/image_converter.rb +214 -0
  22. data/lib/libis/format/converter/office_converter.rb +50 -0
  23. data/lib/libis/format/converter/pdf_converter.rb +139 -0
  24. data/lib/libis/format/converter/repository.rb +98 -0
  25. data/lib/libis/format/converter.rb +11 -0
  26. data/lib/libis/format/droid.rb +45 -0
  27. data/lib/libis/format/fido.rb +102 -0
  28. data/lib/libis/format/identifier.rb +189 -0
  29. data/lib/libis/format/office_to_pdf.rb +52 -0
  30. data/lib/libis/format/pdf_copy.rb +40 -0
  31. data/lib/libis/format/pdf_merge.rb +41 -0
  32. data/lib/libis/format/pdf_split.rb +39 -0
  33. data/lib/libis/format/pdf_to_pdfa.rb +76 -0
  34. data/lib/libis/format/pdfa_validator.rb +61 -0
  35. data/lib/libis/format/type_database.rb +170 -0
  36. data/lib/libis/format/version.rb +5 -0
  37. data/lib/libis/format.rb +23 -0
  38. data/lib/libis-format.rb +1 -0
  39. data/libis-format.gemspec +34 -0
  40. data/spec/converter_spec.rb +212 -0
  41. data/spec/data/Cevennes2.bmp +0 -0
  42. data/spec/data/Cevennes2.jp2 +0 -0
  43. data/spec/data/Cevennes2.ppm +22492 -0
  44. data/spec/data/test-ead.xml +392 -0
  45. data/spec/data/test-jpg.tif +0 -0
  46. data/spec/data/test-lzw.tif +0 -0
  47. data/spec/data/test-options.jpg +0 -0
  48. data/spec/data/test.bmp +0 -0
  49. data/spec/data/test.doc +0 -0
  50. data/spec/data/test.docx +0 -0
  51. data/spec/data/test.gif +0 -0
  52. data/spec/data/test.jpg +0 -0
  53. data/spec/data/test.ods +0 -0
  54. data/spec/data/test.odt +0 -0
  55. data/spec/data/test.pdf +0 -0
  56. data/spec/data/test.pdf.tif +0 -0
  57. data/spec/data/test.png +0 -0
  58. data/spec/data/test.ps +8631 -0
  59. data/spec/data/test.psd +0 -0
  60. data/spec/data/test.rtf +1455 -0
  61. data/spec/data/test.tif +0 -0
  62. data/spec/data/test.txt +12 -0
  63. data/spec/data/test.xcf +0 -0
  64. data/spec/data/test.xls +0 -0
  65. data/spec/data/test.xlsx +0 -0
  66. data/spec/data/test.xml +4 -0
  67. data/spec/data/test_pdfa.pdf +0 -0
  68. data/spec/identifier_spec.rb +60 -0
  69. data/spec/spec_helper.rb +9 -0
  70. data/spec/test_types.yml +12 -0
  71. data/spec/type_database_spec.rb +140 -0
  72. data/tools/PdfTool.jar +0 -0
  73. data/tools/bcpkix-jdk15on-1.49.jar +0 -0
  74. data/tools/bcprov-jdk15on-1.49.jar +0 -0
  75. data/tools/droid/DROID_SignatureFile_V82.xml +32681 -0
  76. data/tools/droid/container-signature-20150307.xml +2235 -0
  77. data/tools/droid/droid-command-line-6.1.5.jar +0 -0
  78. data/tools/droid/droid.bat +154 -0
  79. data/tools/droid/droid.sh +138 -0
  80. data/tools/droid/lib/XmlSchema-1.4.7.jar +0 -0
  81. data/tools/droid/lib/activation-1.1.jar +0 -0
  82. data/tools/droid/lib/antlr-2.7.7.jar +0 -0
  83. data/tools/droid/lib/antlr-3.2.jar +0 -0
  84. data/tools/droid/lib/antlr-runtime-3.2.jar +0 -0
  85. data/tools/droid/lib/aopalliance-1.0.jar +0 -0
  86. data/tools/droid/lib/asm-2.2.3.jar +0 -0
  87. data/tools/droid/lib/aspectjrt-1.7.2.jar +0 -0
  88. data/tools/droid/lib/aspectjweaver-1.7.2.jar +0 -0
  89. data/tools/droid/lib/bcmail-jdk14-138.jar +0 -0
  90. data/tools/droid/lib/bcprov-jdk14-138.jar +0 -0
  91. data/tools/droid/lib/beansbinding-1.2.1.jar +0 -0
  92. data/tools/droid/lib/byteseek-1.1.1.jar +0 -0
  93. data/tools/droid/lib/cglib-nodep-2.2.2.jar +0 -0
  94. data/tools/droid/lib/classmate-1.0.0.jar +0 -0
  95. data/tools/droid/lib/commons-cli-1.2.jar +0 -0
  96. data/tools/droid/lib/commons-codec-1.4.jar +0 -0
  97. data/tools/droid/lib/commons-collections-3.2.1.jar +0 -0
  98. data/tools/droid/lib/commons-compress-1.4.1.jar +0 -0
  99. data/tools/droid/lib/commons-configuration-1.8.jar +0 -0
  100. data/tools/droid/lib/commons-dbcp-1.4.jar +0 -0
  101. data/tools/droid/lib/commons-httpclient-3.1.jar +0 -0
  102. data/tools/droid/lib/commons-io-2.4.jar +0 -0
  103. data/tools/droid/lib/commons-lang-2.6.jar +0 -0
  104. data/tools/droid/lib/commons-logging-1.1.1.jar +0 -0
  105. data/tools/droid/lib/commons-pool-1.5.4.jar +0 -0
  106. data/tools/droid/lib/cxf-api-2.2.12.jar +0 -0
  107. data/tools/droid/lib/cxf-common-schemas-2.2.12.jar +0 -0
  108. data/tools/droid/lib/cxf-common-utilities-2.2.12.jar +0 -0
  109. data/tools/droid/lib/cxf-rt-bindings-http-2.2.12.jar +0 -0
  110. data/tools/droid/lib/cxf-rt-bindings-soap-2.2.12.jar +0 -0
  111. data/tools/droid/lib/cxf-rt-bindings-xml-2.2.12.jar +0 -0
  112. data/tools/droid/lib/cxf-rt-core-2.2.12.jar +0 -0
  113. data/tools/droid/lib/cxf-rt-databinding-jaxb-2.2.12.jar +0 -0
  114. data/tools/droid/lib/cxf-rt-frontend-jaxws-2.2.12.jar +0 -0
  115. data/tools/droid/lib/cxf-rt-frontend-simple-2.2.12.jar +0 -0
  116. data/tools/droid/lib/cxf-rt-transports-http-2.2.12.jar +0 -0
  117. data/tools/droid/lib/cxf-rt-ws-addr-2.2.12.jar +0 -0
  118. data/tools/droid/lib/cxf-tools-common-2.2.12.jar +0 -0
  119. data/tools/droid/lib/de.huxhorn.lilith.3rdparty.flyingsaucer.core-renderer-8RC1.jar +0 -0
  120. data/tools/droid/lib/derby-10.10.2.0.jar +0 -0
  121. data/tools/droid/lib/dom4j-1.6.1.jar +0 -0
  122. data/tools/droid/lib/droid-container-6.1.5.jar +0 -0
  123. data/tools/droid/lib/droid-core-6.1.5.jar +0 -0
  124. data/tools/droid/lib/droid-core-interfaces-6.1.5.jar +0 -0
  125. data/tools/droid/lib/droid-export-6.1.5.jar +0 -0
  126. data/tools/droid/lib/droid-export-interfaces-6.1.5.jar +0 -0
  127. data/tools/droid/lib/droid-help-6.1.5.jar +0 -0
  128. data/tools/droid/lib/droid-report-6.1.5.jar +0 -0
  129. data/tools/droid/lib/droid-report-interfaces-6.1.5.jar +0 -0
  130. data/tools/droid/lib/droid-results-6.1.5.jar +0 -0
  131. data/tools/droid/lib/ejb3-persistence-1.0.2.GA.jar +0 -0
  132. data/tools/droid/lib/geronimo-activation_1.1_spec-1.0.2.jar +0 -0
  133. data/tools/droid/lib/geronimo-annotation_1.0_spec-1.1.1.jar +0 -0
  134. data/tools/droid/lib/geronimo-javamail_1.4_spec-1.6.jar +0 -0
  135. data/tools/droid/lib/geronimo-jaxws_2.1_spec-1.0.jar +0 -0
  136. data/tools/droid/lib/geronimo-stax-api_1.0_spec-1.0.1.jar +0 -0
  137. data/tools/droid/lib/geronimo-ws-metadata_2.0_spec-1.1.2.jar +0 -0
  138. data/tools/droid/lib/hibernate-commons-annotations-4.0.4.Final.jar +0 -0
  139. data/tools/droid/lib/hibernate-core-4.3.5.Final.jar +0 -0
  140. data/tools/droid/lib/hibernate-entitymanager-4.3.5.Final.jar +0 -0
  141. data/tools/droid/lib/hibernate-jpa-2.1-api-1.0.0.Final.jar +0 -0
  142. data/tools/droid/lib/hibernate-validator-5.1.0.Final.jar +0 -0
  143. data/tools/droid/lib/itext-2.0.8.jar +0 -0
  144. data/tools/droid/lib/jandex-1.1.0.Final.jar +0 -0
  145. data/tools/droid/lib/javahelp-2.0.05.jar +0 -0
  146. data/tools/droid/lib/javassist-3.18.1-GA.jar +0 -0
  147. data/tools/droid/lib/jaxb-api-2.1.jar +0 -0
  148. data/tools/droid/lib/jaxb-impl-2.1.13.jar +0 -0
  149. data/tools/droid/lib/jboss-logging-3.1.3.GA.jar +0 -0
  150. data/tools/droid/lib/jboss-logging-annotations-1.2.0.Beta1.jar +0 -0
  151. data/tools/droid/lib/jboss-transaction-api_1.2_spec-1.0.0.Final.jar +0 -0
  152. data/tools/droid/lib/joda-time-1.6.2.jar +0 -0
  153. data/tools/droid/lib/jra-1.0-alpha-4.jar +0 -0
  154. data/tools/droid/lib/jta-1.1.jar +0 -0
  155. data/tools/droid/lib/log4j-1.2.13.jar +0 -0
  156. data/tools/droid/lib/neethi-2.0.4.jar +0 -0
  157. data/tools/droid/lib/opencsv-2.3.jar +0 -0
  158. data/tools/droid/lib/org-netbeans-swing-outline-7.2.jar +0 -0
  159. data/tools/droid/lib/org-openide-util-7.2.jar +0 -0
  160. data/tools/droid/lib/org-openide-util-lookup-7.2.jar +0 -0
  161. data/tools/droid/lib/poi-3.7.jar +0 -0
  162. data/tools/droid/lib/saaj-api-1.3.jar +0 -0
  163. data/tools/droid/lib/saaj-impl-1.3.2.jar +0 -0
  164. data/tools/droid/lib/slf4j-api-1.4.2.jar +0 -0
  165. data/tools/droid/lib/slf4j-log4j12-1.4.2.jar +0 -0
  166. data/tools/droid/lib/spring-aop-4.0.3.RELEASE.jar +0 -0
  167. data/tools/droid/lib/spring-beans-4.0.3.RELEASE.jar +0 -0
  168. data/tools/droid/lib/spring-context-4.0.3.RELEASE.jar +0 -0
  169. data/tools/droid/lib/spring-core-4.0.3.RELEASE.jar +0 -0
  170. data/tools/droid/lib/spring-expression-4.0.3.RELEASE.jar +0 -0
  171. data/tools/droid/lib/spring-jdbc-4.0.3.RELEASE.jar +0 -0
  172. data/tools/droid/lib/spring-orm-4.0.3.RELEASE.jar +0 -0
  173. data/tools/droid/lib/spring-tx-4.0.3.RELEASE.jar +0 -0
  174. data/tools/droid/lib/spring-web-2.5.6.jar +0 -0
  175. data/tools/droid/lib/stax-api-1.0-2.jar +0 -0
  176. data/tools/droid/lib/stringtemplate-3.2.jar +0 -0
  177. data/tools/droid/lib/truezip-6.8.4.jar +0 -0
  178. data/tools/droid/lib/validation-api-1.1.0.Final.jar +0 -0
  179. data/tools/droid/lib/wsdl4j-1.6.2.jar +0 -0
  180. data/tools/droid/lib/wstx-asl-3.2.9.jar +0 -0
  181. data/tools/droid/lib/xercesImpl-2.9.1.jar +0 -0
  182. data/tools/droid/lib/xml-apis-1.3.04.jar +0 -0
  183. data/tools/droid/lib/xml-resolver-1.2.jar +0 -0
  184. data/tools/droid/lib/xz-1.0.jar +0 -0
  185. data/tools/fido/__init__.py +0 -0
  186. data/tools/fido/argparselocal.py +2355 -0
  187. data/tools/fido/conf/DROID_SignatureFile-v81.xml +2 -0
  188. data/tools/fido/conf/container-signature-20150307.xml +2238 -0
  189. data/tools/fido/conf/dc.xsd +119 -0
  190. data/tools/fido/conf/dcmitype.xsd +53 -0
  191. data/tools/fido/conf/dcterms.xsd +383 -0
  192. data/tools/fido/conf/fido-formats.xsd +173 -0
  193. data/tools/fido/conf/format_extension_template.xml +105 -0
  194. data/tools/fido/conf/format_extensions.xml +498 -0
  195. data/tools/fido/conf/formats-v81.xml +38355 -0
  196. data/tools/fido/conf/pronom-xml-v81.zip +0 -0
  197. data/tools/fido/conf/versions.xml +8 -0
  198. data/tools/fido/fido.bat +4 -0
  199. data/tools/fido/fido.py +854 -0
  200. data/tools/fido/fido.sh +5 -0
  201. data/tools/fido/prepare.py +616 -0
  202. data/tools/fido/pronomutils.py +115 -0
  203. data/tools/fido/toxml.py +52 -0
  204. data/tools/fido/update_signatures.py +171 -0
  205. data/tools/pdfbox/pdfbox-app-1.8.10.jar +0 -0
  206. data/tools/pdfbox/preflight-app-1.8.10.jar +0 -0
  207. metadata +396 -0
@@ -0,0 +1,498 @@
1
+ <?xml version="1.0"?>
2
+ <formats xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:dcterms="http://purl.org/dc/terms/" xsi:noNamespaceSchemaLocation="fido-formats.xsd" version="0.3">
3
+ <format>
4
+ <puid>fido-fmt/189.word</puid>
5
+ <name>Microsoft Office Open XML - Word</name>
6
+ <extension>docx</extension>
7
+ <has_priority_over>x-fmt/263</has_priority_over>
8
+ <has_priority_over>fmt/189</has_priority_over>
9
+ <signature>
10
+ <name>Microsoft Office Open XML - Word</name>
11
+ <pattern>
12
+ <position>BOF</position>
13
+ <regex>(?s)\APK\x03\x04</regex>
14
+ </pattern>
15
+ <pattern>
16
+ <position>BOF</position>
17
+ <regex>(?s)\A.{30}\[Content_Types\]\.xml \xa2</regex>
18
+ </pattern>
19
+ <pattern>
20
+ <position>EOF</position>
21
+ <regex>(?s)\x00\x00word/.{1,20}\.xmlPK\x01\x02\x2d.{0,2000}\Z</regex>
22
+ </pattern>
23
+ </signature>
24
+ </format>
25
+ <format>
26
+ <puid>fido-fmt/189.xl</puid>
27
+ <name>Microsoft Office Open XML - Excel</name>
28
+ <extension>xlsx</extension>
29
+ <has_priority_over>x-fmt/263</has_priority_over>
30
+ <has_priority_over>fmt/189</has_priority_over>
31
+ <signature>
32
+ <name>Microsoft Office Open XML - Excel</name>
33
+ <pattern>
34
+ <position>BOF</position>
35
+ <regex>(?s)\APK\x03\x04</regex>
36
+ </pattern>
37
+ <pattern>
38
+ <position>BOF</position>
39
+ <regex>(?s)\A.{30}\[Content_Types\]\.xml \xa2</regex>
40
+ </pattern>
41
+ <pattern>
42
+ <position>EOF</position>
43
+ <regex>(?s)\x00xl/.{1,20}\.xmlPK\x01\x02\x2d.{0,2000}\Z</regex>
44
+ </pattern>
45
+ </signature>
46
+ </format>
47
+ <format>
48
+ <puid>fido-fmt/189.ppt</puid>
49
+ <name>Microsoft Office Open XML - Powerpoint</name>
50
+ <extension>pptx</extension>
51
+ <has_priority_over>x-fmt/263</has_priority_over>
52
+ <has_priority_over>fmt/189</has_priority_over>
53
+ <signature>
54
+ <name>Microsoft Office Open XML - Powerpoint</name>
55
+ <pattern>
56
+ <position>BOF</position>
57
+ <regex>(?s)\APK\x03\x04</regex>
58
+ </pattern>
59
+ <pattern>
60
+ <position>BOF</position>
61
+ <regex>(?s)\A.{30}\[Content_Types\]\.xml \xa2</regex>
62
+ </pattern>
63
+ <pattern>
64
+ <position>EOF</position>
65
+ <!-- ppt/presentation.xml might be better, but it can be far from the end. -->
66
+ <regex>(?s)\x00ppt/.{1,20}\.xmlPK\x01\x02\x2d.{0,2000}\Z</regex>
67
+ </pattern>
68
+ </signature>
69
+ </format>
70
+ <format>
71
+ <puid>fmt/134</puid>
72
+ <mime>audio/mpeg</mime>
73
+ <name>MPEG 1/2 Audio Layer 3 - fido update</name>
74
+ <pronom_id>687</pronom_id>
75
+ <extension>mp3</extension>
76
+ <signature>
77
+ <name>MPEG-1/2 Audio Layer 3</name>
78
+ <note>The pronom signatures for fmt/134 were horrendous. This is an attempt to consolidate several
79
+ nearly identical patterns into one. It is not clear if they should be BOF or EOF or both.
80
+ Regularly-spaced frame headers should always be discoverable near EOF. An ID3v1
81
+ tag of up to 355 bytes may be present at EOF.</note>
82
+ <pattern>
83
+ <position>EOF</position>
84
+ <regex>(?s)\xff[\xfa\xfb\xf2\xf3][\x10-\xeb].{46,1439}\xff[\xfa\xfb\xf2\xf3][\x10-\xeb].{46,1439}\Z</regex>
85
+ </pattern>
86
+ <pattern>
87
+ <position>BOF</position>
88
+ <pronom_pattern>494433</pronom_pattern>
89
+ <regex>(?s)\AID3</regex>
90
+ </pattern>
91
+ </signature>
92
+ </format>
93
+ <format>
94
+ <puid>fido-x-fmt/384</puid>
95
+ <mime>video/quicktime</mime>
96
+ <name>Quicktime</name>
97
+ <extension>mov</extension>
98
+ <signature>
99
+ <name>QuickTime</name>
100
+ <note>Simple addition to cover the case in the fido test suite. Needs research to correct and merge with x-fmt/384</note>
101
+ <pattern>
102
+ <position>BOF</position>
103
+ <regex>(?s)\A\x00{3} ftypqt.{0,25}qt.{0,20}moov.{4}mvhd</regex>
104
+ </pattern>
105
+ </signature>
106
+ </format>
107
+ <format>
108
+ <puid>fmt/40</puid>
109
+ <mime>application/msword</mime>
110
+ <name>Microsoft Word for Windows Document</name>
111
+ <pronom_id>690</pronom_id>
112
+ <extension>doc</extension>
113
+ <has_priority_over>fmt/111</has_priority_over>
114
+ <signature>
115
+ <name>Microsoft Word for Windows 97 - 2002</name>
116
+ <note>2010.12 - AF: Some of my test files do not have 8.0, but 97-2003.</note>
117
+ <note>Compound document header + WordDocument user stream + version number</note>
118
+ <pattern>
119
+ <position>BOF</position>
120
+ <pronom_pattern>D0CF11E0A1B11AE1{20}FEFF</pronom_pattern>
121
+ <regex>(?s)\A\xd0\xcf\x11\xe0\xa1\xb1\x1a\xe1.{20}\xfe\xff</regex>
122
+ </pattern>
123
+ <pattern>
124
+ <position>VAR</position>
125
+ <pronom_pattern>57006F007200640044006F00630075006D0065006E007400{42}02(00|01)</pronom_pattern>
126
+ <regex>(?s)W\x00o\x00r\x00d\x00D\x00o\x00c\x00u\x00m\x00e\x00n\x00t\x00.{42}\x02(?:\x00|\x01)</regex>
127
+ </pattern>
128
+ <pattern>
129
+ <position>VAR</position>
130
+ <pronom_pattern>4D6963726F736F667420576F7264(20382E30|20392E30|2031302E30|2D446F6B756D656E74)</pronom_pattern>
131
+ <regex>(?s)Microsoft (?:Office Word|Word)(?: 8\.0| 9\.0| 10\.0|-Dokument| 97-2003)</regex>
132
+ </pattern>
133
+ </signature>
134
+ </format>
135
+ <!-- RTF -->
136
+ <format>
137
+ <puid>fmt/45</puid>
138
+ <mime>application/rtf</mime>
139
+ <mime>text/rtf</mime>
140
+ <name>Rich Text Format</name>
141
+ <pronom_id>626</pronom_id>
142
+ <extension>rtf</extension>
143
+ <signature>
144
+ <name>RTF 1.0 - 1.4 (generic)</name>
145
+ <note>Pronom has FIVE RTF formats (fmt/45-49) with identical patterns that don't match my sample.</note>
146
+ <pattern>
147
+ <position>BOF</position>
148
+ <pronom_pattern>7B5C7274(66|6631)5C(616E7369|6D6163|7063|706361)</pronom_pattern>
149
+ <regex>(?s)\A\{\\rt(?:f|f1)\\(?:adeflang1025|ansi|mac|pc|pca)</regex>
150
+ </pattern>
151
+ </signature>
152
+ </format>
153
+ <format>
154
+ <puid>fmt/46</puid>
155
+ <mime>application/rtf</mime>
156
+ <mime>text/rtf</mime>
157
+ <name>Rich Text Format</name>
158
+ <pronom_id>627</pronom_id>
159
+ <extension>rtf</extension>
160
+ <signature>
161
+ <name>RTF 1.0 - 1.4 (generic)</name>
162
+ <note>\rtf control word</note>
163
+ <pattern>
164
+ <position>BOF</position>
165
+ <pronom_pattern>7B5C7274(66|6631)5C(616E7369|6D6163|7063|706361)</pronom_pattern>
166
+ <!-- HACK. This should fail any non-empty buffer. All of the RTF signatures have the same pattern.
167
+ This version of fido does not have a 'delete' method.
168
+ -->
169
+ <regex>\A\Z</regex>
170
+ </pattern>
171
+ </signature>
172
+ </format>
173
+ <format>
174
+ <puid>fmt/47</puid>
175
+ <mime>application/rtf</mime>
176
+ <mime>text/rtf</mime>
177
+ <name>Rich Text Format</name>
178
+ <pronom_id>628</pronom_id>
179
+ <extension>rtf</extension>
180
+ <signature>
181
+ <name>RTF 1.0 - 1.4 (generic)</name>
182
+ <note>\rtf control word</note>
183
+ <pattern>
184
+ <position>BOF</position>
185
+ <pronom_pattern>7B5C7274(66|6631)5C(616E7369|6D6163|7063|706361)</pronom_pattern>
186
+ <regex>\A\Z</regex>
187
+ </pattern>
188
+ </signature>
189
+ </format>
190
+ <format>
191
+ <puid>fmt/48</puid>
192
+ <mime>application/rtf</mime>
193
+ <mime>text/rtf</mime>
194
+ <name>Rich Text Format</name>
195
+ <pronom_id>629</pronom_id>
196
+ <extension>rtf</extension>
197
+ <signature>
198
+ <name>RTF 1.0 - 1.4 (generic)</name>
199
+ <note>\rtf control word</note>
200
+ <pattern>
201
+ <position>BOF</position>
202
+ <pronom_pattern>7B5C7274(66|6631)5C(616E7369|6D6163|7063|706361)</pronom_pattern>
203
+ <regex>\A\Z</regex>
204
+ </pattern>
205
+ </signature>
206
+ </format>
207
+ <format>
208
+ <puid>fmt/49</puid>
209
+ <mime>application/rtf</mime>
210
+ <mime>text/rtf</mime>
211
+ <name>Rich Text Format</name>
212
+ <pronom_id>630</pronom_id>
213
+ <extension>rtf</extension>
214
+ <signature>
215
+ <name>RTF 1.0 - 1.4 (generic)</name>
216
+ <note>\rtf control word</note>
217
+ <pattern>
218
+ <position>BOF</position>
219
+ <pronom_pattern>7B5C7274(66|6631)5C(616E7369|6D6163|7063|706361)</pronom_pattern>
220
+ <regex>\A\Z</regex>
221
+ </pattern>
222
+ </signature>
223
+ </format>
224
+ <format>
225
+ <!-- .cayra format added by <maurice.de.rooij@nationaalarchief.nl> -->
226
+ <puid>fido-fmt/cayra</puid>
227
+ <name>Intalev Cayra Mindmap file</name>
228
+ <extension>cayra</extension>
229
+ <has_priority_over>x-fmt/263</has_priority_over>
230
+ <signature>
231
+ <name>Intalev Cayra Mindmap file</name>
232
+ <pattern>
233
+ <position>BOF</position>
234
+ <regex>(?s)\APK\x03\x04</regex>
235
+ </pattern>
236
+ <pattern>
237
+ <position>BOF</position>
238
+ <regex>(?s)\A.{30}bin\/[a-z0-9]{8}\-[a-z0-9]{4}\-[a-z0-9]{4}\-[a-z0-9]{4}\-[a-z0-9]{12}\x20\xa2</regex>
239
+ </pattern>
240
+ <pattern>
241
+ <position>EOF</position>
242
+ <regex>(?s)\[Content_Types\]\.xmlPK\x05\x06\x00.{17}\Z</regex>
243
+ </pattern>
244
+ </signature>
245
+ </format>
246
+ <format>
247
+ <!-- .py format added by <maurice.de.rooij@nationaalarchief.nl> -->
248
+ <puid>fido-fmt/python</puid>
249
+ <name>Python script file</name>
250
+ <extension>py</extension>
251
+ <signature>
252
+ <name>Python script file</name>
253
+ <pattern>
254
+ <position>BOF</position>
255
+ <regex>(?s)\A.{0,1024}\x23\x21(?:python|\/usr\/local\/bin\/python|\/usr\/bin\/env python)</regex>
256
+ </pattern>
257
+ </signature>
258
+ </format>
259
+ <format>
260
+ <!-- SPSS format added by <maurice.de.rooij@nationaalarchief.nl>, February 2012 -->
261
+ <puid>fido-fmt/SPSS</puid>
262
+ <mime>application/x-spss</mime>
263
+ <name>SPSS file</name>
264
+ <extension>sav</extension>
265
+ <extension>spp</extension>
266
+ <extension>sbs</extension>
267
+ <extension>sps</extension>
268
+ <extension>spo</extension>
269
+ <extension>spv</extension>
270
+ <signature>
271
+ <name>SPSS Statistical Data File</name>
272
+ <pattern>
273
+ <position>BOF</position>
274
+ <regex>(?s)\A\$FL2@\(#\) (IBM SPSS STATISTICS DATA FILE|PASW STATISTICS DATA FILE)</regex>
275
+ </pattern>
276
+ </signature>
277
+ </format>
278
+ <format>
279
+ <!-- NEXUS format added by <maurice.de.rooij@nationaalarchief.nl> @SPRUCE London 2012 -->
280
+ <!-- http://wiki.opf-labs.org/display/SPR/NeXus+Data+Collection+ISIS+-+STFC+-+solution -->
281
+ <puid>fido-fmt/nexus</puid>
282
+ <mime>application/octet-stream</mime>
283
+ <name>Nexus</name>
284
+ <extension>nxs</extension>
285
+ <signature>
286
+ <name>FIDO Nexus Signature</name>
287
+ <pattern>
288
+ <position>BOF</position>
289
+ <regex>(?s)\A\x89\x48\x44\x46\x0d\x0a\x1a\x0a\x00{5}\x08\x08\x00\x04\x00\x10\x00{13}\xff{8}</regex>
290
+ </pattern>
291
+ </signature>
292
+ </format>
293
+ <!-- iPer Advanced Embedded Hypertext format (AEH) -->
294
+ <!-- contributed by L. Hurley and A. Ogier -->
295
+ <format>
296
+ <puid>fido-fmt/aeh</puid>
297
+ <mime>text/html</mime>
298
+ <name>iPer Advanced Embedded Hypertext</name>
299
+ <alias>AEH</alias>
300
+ <extension>aeh</extension>
301
+ <apple_uti>public.data</apple_uti>
302
+ <signature>
303
+ <name>AEH</name>
304
+ <note>at BOF "ALDO"</note>
305
+ <pattern>
306
+ <position>BOF</position>
307
+ <pronom_pattern>414C444F</pronom_pattern>
308
+ <regex>(?s)\AALDO</regex>
309
+ </pattern>
310
+ </signature>
311
+ <note>iPer Advanced Embedded Hypertext is a proprietary file format, owned by Visual Vision, and used with the default software HyperPublish applications (formerly iPer), a comprehensive hypermedia publishing program for both Website and CDROM.</note>
312
+ <details>
313
+ <dc:description>iPer Advanced Embedded Hypertext is a proprietary file format owned by Visual Vision.</dc:description>
314
+ <dc:creator>Visual Vision</dc:creator>
315
+ <dcterms:publisher>Visual Vision</dcterms:publisher>
316
+ <content_type>hypertext</content_type>
317
+ <reference>
318
+ <dcterms:title>iPer Advanced Embedded Hypertext</dcterms:title>
319
+ <dc:creator>Visual Vision</dc:creator>
320
+ <dc:publisher>Visual Vision</dc:publisher>
321
+ <dcterms:available>1999</dcterms:available>
322
+ <dc:identifier>http://www.visualvision.com/</dc:identifier>
323
+ <dc:description>iPer Advanced Embedded Hypertext is a proprietary file format owned by Visual Vision.</dc:description>
324
+ <dc:type>Authoratative</dc:type>
325
+ </reference>
326
+ <record_metadata>
327
+ <status>unknown</status>
328
+ <dc:creator>L. Hurley and A. Ogier</dc:creator>
329
+ <dcterms:created>01 Dec 2011</dcterms:created>
330
+ </record_metadata>
331
+ </details>
332
+ </format>
333
+ <!-- MobiPocket Reader format (MOBI) -->
334
+ <!-- contributed by L. Hurley and A. Ogier -->
335
+ <format>
336
+ <puid>fido-fmt/mobi</puid>
337
+ <mime>application/x-mobipocket-ebook</mime>
338
+ <name>MobiPocket Reader</name>
339
+ <version></version>
340
+ <alias>MOBI</alias>
341
+ <extension>mobi</extension>
342
+ <extension>prc</extension>
343
+ <apple_uti>public.data</apple_uti>
344
+ <signature>
345
+ <name>Mobi</name>
346
+ <note>Header contains BOOK at offset 60 and MOBI at offset 64</note>
347
+ <pattern>
348
+ <position>BOF</position>
349
+ <pronom_pattern>.{60}424F4F4B4D4F4249</pronom_pattern>
350
+ <regex>(?s)\A(\.|\x00){60}BOOKMOBI</regex>
351
+ </pattern>
352
+ </signature>
353
+ <details>
354
+ <dc:description>MOBI is an ebook format created by a French company, MobiPocket Reader, and bought by Amazon in 2005. Since 2005 the mobi standard has not been updated as Amazon has focused all its attention on the azw format, which is based on the mobi format. Mobi has a high and a low compression version, although the low compression version can be used on more e-reader devices. The mobi format was based on the PalmDOC (Palm Database) Format.</dc:description>
355
+ <dcterms:available>2000</dcterms:available>
356
+ <dc:creator>MobiPocket</dc:creator>
357
+ <dcterms:publisher>Amazon.com</dcterms:publisher>
358
+ <record_metadata>
359
+ <status>unknown</status>
360
+ <dc:creator>L. Hurley and A. Ogier</dc:creator>
361
+ <dcterms:created>01 Dec 2011</dcterms:created>
362
+ </record_metadata>
363
+ </details>
364
+ </format>
365
+ <!-- Protein Data Bank format (PDB) -->
366
+ <!-- contributed by L. Hurley and A. Ogier -->
367
+ <format>
368
+ <puid>fido-fmt/x-pdb</puid>
369
+ <mime>chemical/x-pdb</mime>
370
+ <name>Protein Data Bank</name>
371
+ <version>3.30</version>
372
+ <alias>PDB (3.30)</alias>
373
+ <extension>pdb</extension>
374
+ <apple_uti>public.data</apple_uti>
375
+ <has_priority_over>x-fmt/283</has_priority_over>
376
+ <has_priority_over>x-fmt/111</has_priority_over>
377
+ <signature>
378
+ <name>PDB</name>
379
+ <note>80 byte header record: BOF contains "HEADER" and date field (DD-MMM-YY at offset 50) and IDCode (1 digit followed by 3 alphanumeric at offset 63). Also: "END " chunk at beginning of 80 byte footer record </note>
380
+ <pattern>
381
+ <position>BOF</position>
382
+ <!-- <regex>(?s)\AHEADER.{44}\d\d\-[A-Z]{3}-\d\d.{3}\d\w{3}</regex>-->
383
+ <regex>(?s)\AHEADER.{44}[0-9]{3}\-[a-z]{3}\-[0-9]{3}.{3}[0-9]{1}[a-z]{3}</regex>
384
+ </pattern>
385
+ <pattern>
386
+ <position>VAR</position>
387
+ <pronom_pattern>454E442020202020202020202020202020202020202020202020202020202020202020202020202020202020202020202020202020 2020202020202020202020202020202020202020202020202020200A</pronom_pattern>
388
+ <regex>(?s)END\x20{77}\x0A\Z</regex>
389
+ </pattern>
390
+ </signature>
391
+ <note>The Protein Data Bank (pdb) file format is the legacy file format of the Worldwide Protein Data Bank. The mission of the wwPDB is to maintain a single Protein Data Bank Archive of macromolecular structural data that is freely and publicly available to the global community. PDB is a flat textual file format describing the three dimensional structures of molecules held in the Protein Data Bank. The file consists of 80 byte records, beginning with a header and ending with an END record.</note>
392
+ <details>
393
+ <dc:description>PDB is a flat textual file format of macromolecular structural data in the Worldwide Protein Data Bank.</dc:description>
394
+ <dcterms:available>1972</dcterms:available>
395
+ <dc:creator>Brookhaven National Laboratory</dc:creator>
396
+ <dcterms:publisher>Worldwide Protein Data Bank</dcterms:publisher>
397
+ <content_type>ASCII text</content_type>
398
+ <reference>
399
+ <dc:title>Protein Data Bank</dc:title>
400
+ <dc:creator>Brookhaven National Laboratory</dc:creator>
401
+ <dc:publisher>Worldwide Protein Data Bank</dc:publisher>
402
+ <dcterms:available>1972</dcterms:available>
403
+ <dc:identifier>http://www.wwpdb.org/documentation/format33/v3.3.html</dc:identifier>
404
+ <dc:description>PDB is a flat textual file format of macromolecular structural data in the Worldwide Protein Data Bank</dc:description>
405
+ <dc:type>Authoratative</dc:type>
406
+ </reference>
407
+ <record_metadata>
408
+ <status>unknown</status>
409
+ <dc:creator>L. Hurley and A. Ogier</dc:creator>
410
+ <dcterms:created>01 Dec 2011</dcterms:created>
411
+ </record_metadata>
412
+ </details>
413
+ </format>
414
+ <!-- Progressive Graphics File format (PGF) -->
415
+ <!-- contributed by L. Hurley and A. Ogier -->
416
+ <format>
417
+ <puid>fido-fmt/pgf</puid>
418
+ <name>Progressive Graphics File</name>
419
+ <version></version>
420
+ <alias>PGF</alias>
421
+ <extension>pgf</extension>
422
+ <apple_uti>public.data</apple_uti>
423
+ <signature>
424
+ <name>PGF (little-endian)</name>
425
+ <note>Header begins with PGF at offset 00</note>
426
+ <pattern>
427
+ <position>BOF</position>
428
+ <pronom_pattern>504746</pronom_pattern>
429
+ <regex>(?s)\APGF</regex>
430
+ </pattern>
431
+ </signature>
432
+ <details>
433
+ <dc:description>Progressive Graphics Format (PGF) is an image format developed with a focus on speed rather than on compression ratio. It features both lossy (more than 10 without any visual quality loss) and lossless compression (about 3.1 according to the documentation), is based on a fast wavelet transform, and performs best with natural and aerial photos. In comparison with JPEG 2000, it has a slightly worse compression efficiency; however, JPEG 2000 is about 10 times slower than PGF.</dc:description>
434
+ <dcterms:available>18 June 2006</dcterms:available>
435
+ <dc:creator>xerania GmbH</dc:creator>
436
+ <dcterms:publisher>libpgf.org</dcterms:publisher>
437
+ <reference>
438
+ <dcterms:title>PGF: A new progressive file format for lossy and lossless compression</dcterms:title>
439
+ <dc:creator>Christoph Stamm</dc:creator>
440
+ <dcterms:publisher>libpgf.org</dcterms:publisher>
441
+ <dcterms:available></dcterms:available>
442
+ <dc:identifier>http://www.libpgf.org/uploads/media/PGF_Overview_V1_01.pdf</dc:identifier>
443
+ <dc:description>This is the initial presentation of PGF, describing the process used to create the file and summarizing the testing methodology.</dc:description>
444
+ <dc:type>Authoratative</dc:type>
445
+ </reference>
446
+ <reference>
447
+ <dcterms:title>PGF-Progressive Graphics File Version 6</dcterms:title>
448
+ <dc:creator>Christoph Stamm</dc:creator>
449
+ <dcterms:publisher>libpgf.org</dcterms:publisher>
450
+ <dcterms:available></dcterms:available>
451
+ <dc:identifier>http://www.libpgf.org/uploads/media/PGF_Header_ROI_V6_02.pdf</dc:identifier>
452
+ <dc:description>This is documentation for the PGF Header Structure and ROI coding scheme.</dc:description>
453
+ <dc:type>Authoratative</dc:type>
454
+ </reference>
455
+ <record_metadata>
456
+ <status>unknown</status>
457
+ <dc:creator>L. Hurley and A. Ogier</dc:creator>
458
+ <dcterms:created>01 Dec 2011</dcterms:created>
459
+ </record_metadata>
460
+ </details>
461
+ </format>
462
+ <!-- ePub File format (ePub) -->
463
+ <!-- contributed by Kris Dekeyser (LIBIS, Leuven, Belgium) -->
464
+ <!--
465
+ *** NOTE: commented out for the time being as the bugfix for container signatures
466
+ *** which has been committed with version 1.1.8 seems to do the trick
467
+ -->
468
+ <!--
469
+ <format>
470
+ <puid>fmt/483</puid>
471
+ <name>ePub format</name>
472
+ <version>1.0</version>
473
+ <alias>EPUB</alias>
474
+ <mime>application/epub+zip</mime>
475
+ <extension>epub</extension>
476
+ <has_priority_over>x-fmt/263</has_priority_over>
477
+ <has_priority_over>fmt/61</has_priority_over>
478
+ <signature>
479
+ <name>EPUB file</name>
480
+ <pattern>
481
+ <position>BOF</position>
482
+ <regex>(?s)\APK\x03\x04</regex>
483
+ </pattern>
484
+ <pattern>
485
+ <position>BOF</position>
486
+ <regex>(?s)\A.{30}mimetypeapplication/epub\+zip</regex>
487
+ </pattern>
488
+ </signature>
489
+ <details>
490
+ <record_metadata>
491
+ <status>unknown</status>
492
+ <dc:creator>Kris Dekeyser (LIBIS, Leuven, Belgium)</dc:creator>
493
+ <dcterms:created>09 July 2013</dcterms:created>
494
+ </record_metadata>
495
+ </details>
496
+ </format>
497
+ -->
498
+ </formats>