tensorbored 2.21.0rc1769983804__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (271) hide show
  1. tensorbored/__init__.py +112 -0
  2. tensorbored/_vendor/__init__.py +0 -0
  3. tensorbored/_vendor/bleach/__init__.py +125 -0
  4. tensorbored/_vendor/bleach/_vendor/__init__.py +0 -0
  5. tensorbored/_vendor/bleach/_vendor/html5lib/__init__.py +35 -0
  6. tensorbored/_vendor/bleach/_vendor/html5lib/_ihatexml.py +289 -0
  7. tensorbored/_vendor/bleach/_vendor/html5lib/_inputstream.py +918 -0
  8. tensorbored/_vendor/bleach/_vendor/html5lib/_tokenizer.py +1735 -0
  9. tensorbored/_vendor/bleach/_vendor/html5lib/_trie/__init__.py +5 -0
  10. tensorbored/_vendor/bleach/_vendor/html5lib/_trie/_base.py +40 -0
  11. tensorbored/_vendor/bleach/_vendor/html5lib/_trie/py.py +67 -0
  12. tensorbored/_vendor/bleach/_vendor/html5lib/_utils.py +159 -0
  13. tensorbored/_vendor/bleach/_vendor/html5lib/constants.py +2946 -0
  14. tensorbored/_vendor/bleach/_vendor/html5lib/filters/__init__.py +0 -0
  15. tensorbored/_vendor/bleach/_vendor/html5lib/filters/alphabeticalattributes.py +29 -0
  16. tensorbored/_vendor/bleach/_vendor/html5lib/filters/base.py +12 -0
  17. tensorbored/_vendor/bleach/_vendor/html5lib/filters/inject_meta_charset.py +73 -0
  18. tensorbored/_vendor/bleach/_vendor/html5lib/filters/lint.py +93 -0
  19. tensorbored/_vendor/bleach/_vendor/html5lib/filters/optionaltags.py +207 -0
  20. tensorbored/_vendor/bleach/_vendor/html5lib/filters/sanitizer.py +916 -0
  21. tensorbored/_vendor/bleach/_vendor/html5lib/filters/whitespace.py +38 -0
  22. tensorbored/_vendor/bleach/_vendor/html5lib/html5parser.py +2795 -0
  23. tensorbored/_vendor/bleach/_vendor/html5lib/serializer.py +409 -0
  24. tensorbored/_vendor/bleach/_vendor/html5lib/treeadapters/__init__.py +30 -0
  25. tensorbored/_vendor/bleach/_vendor/html5lib/treeadapters/genshi.py +54 -0
  26. tensorbored/_vendor/bleach/_vendor/html5lib/treeadapters/sax.py +50 -0
  27. tensorbored/_vendor/bleach/_vendor/html5lib/treebuilders/__init__.py +88 -0
  28. tensorbored/_vendor/bleach/_vendor/html5lib/treebuilders/base.py +417 -0
  29. tensorbored/_vendor/bleach/_vendor/html5lib/treebuilders/dom.py +239 -0
  30. tensorbored/_vendor/bleach/_vendor/html5lib/treebuilders/etree.py +343 -0
  31. tensorbored/_vendor/bleach/_vendor/html5lib/treebuilders/etree_lxml.py +392 -0
  32. tensorbored/_vendor/bleach/_vendor/html5lib/treewalkers/__init__.py +154 -0
  33. tensorbored/_vendor/bleach/_vendor/html5lib/treewalkers/base.py +252 -0
  34. tensorbored/_vendor/bleach/_vendor/html5lib/treewalkers/dom.py +43 -0
  35. tensorbored/_vendor/bleach/_vendor/html5lib/treewalkers/etree.py +131 -0
  36. tensorbored/_vendor/bleach/_vendor/html5lib/treewalkers/etree_lxml.py +215 -0
  37. tensorbored/_vendor/bleach/_vendor/html5lib/treewalkers/genshi.py +69 -0
  38. tensorbored/_vendor/bleach/_vendor/parse.py +1078 -0
  39. tensorbored/_vendor/bleach/callbacks.py +32 -0
  40. tensorbored/_vendor/bleach/html5lib_shim.py +757 -0
  41. tensorbored/_vendor/bleach/linkifier.py +633 -0
  42. tensorbored/_vendor/bleach/parse_shim.py +1 -0
  43. tensorbored/_vendor/bleach/sanitizer.py +638 -0
  44. tensorbored/_vendor/bleach/six_shim.py +19 -0
  45. tensorbored/_vendor/webencodings/__init__.py +342 -0
  46. tensorbored/_vendor/webencodings/labels.py +231 -0
  47. tensorbored/_vendor/webencodings/mklabels.py +59 -0
  48. tensorbored/_vendor/webencodings/x_user_defined.py +325 -0
  49. tensorbored/assets.py +36 -0
  50. tensorbored/auth.py +102 -0
  51. tensorbored/backend/__init__.py +0 -0
  52. tensorbored/backend/application.py +604 -0
  53. tensorbored/backend/auth_context_middleware.py +38 -0
  54. tensorbored/backend/client_feature_flags.py +113 -0
  55. tensorbored/backend/empty_path_redirect.py +46 -0
  56. tensorbored/backend/event_processing/__init__.py +0 -0
  57. tensorbored/backend/event_processing/data_ingester.py +276 -0
  58. tensorbored/backend/event_processing/data_provider.py +535 -0
  59. tensorbored/backend/event_processing/directory_loader.py +142 -0
  60. tensorbored/backend/event_processing/directory_watcher.py +272 -0
  61. tensorbored/backend/event_processing/event_accumulator.py +950 -0
  62. tensorbored/backend/event_processing/event_file_inspector.py +463 -0
  63. tensorbored/backend/event_processing/event_file_loader.py +292 -0
  64. tensorbored/backend/event_processing/event_multiplexer.py +521 -0
  65. tensorbored/backend/event_processing/event_util.py +68 -0
  66. tensorbored/backend/event_processing/io_wrapper.py +223 -0
  67. tensorbored/backend/event_processing/plugin_asset_util.py +104 -0
  68. tensorbored/backend/event_processing/plugin_event_accumulator.py +721 -0
  69. tensorbored/backend/event_processing/plugin_event_multiplexer.py +522 -0
  70. tensorbored/backend/event_processing/reservoir.py +266 -0
  71. tensorbored/backend/event_processing/tag_types.py +29 -0
  72. tensorbored/backend/experiment_id.py +71 -0
  73. tensorbored/backend/experimental_plugin.py +51 -0
  74. tensorbored/backend/http_util.py +263 -0
  75. tensorbored/backend/json_util.py +70 -0
  76. tensorbored/backend/path_prefix.py +67 -0
  77. tensorbored/backend/process_graph.py +74 -0
  78. tensorbored/backend/security_validator.py +202 -0
  79. tensorbored/compat/__init__.py +69 -0
  80. tensorbored/compat/proto/__init__.py +0 -0
  81. tensorbored/compat/proto/allocation_description_pb2.py +35 -0
  82. tensorbored/compat/proto/api_def_pb2.py +82 -0
  83. tensorbored/compat/proto/attr_value_pb2.py +80 -0
  84. tensorbored/compat/proto/cluster_pb2.py +58 -0
  85. tensorbored/compat/proto/config_pb2.py +271 -0
  86. tensorbored/compat/proto/coordination_config_pb2.py +45 -0
  87. tensorbored/compat/proto/cost_graph_pb2.py +87 -0
  88. tensorbored/compat/proto/cpp_shape_inference_pb2.py +70 -0
  89. tensorbored/compat/proto/debug_pb2.py +65 -0
  90. tensorbored/compat/proto/event_pb2.py +149 -0
  91. tensorbored/compat/proto/full_type_pb2.py +74 -0
  92. tensorbored/compat/proto/function_pb2.py +157 -0
  93. tensorbored/compat/proto/graph_debug_info_pb2.py +111 -0
  94. tensorbored/compat/proto/graph_pb2.py +41 -0
  95. tensorbored/compat/proto/histogram_pb2.py +39 -0
  96. tensorbored/compat/proto/meta_graph_pb2.py +254 -0
  97. tensorbored/compat/proto/node_def_pb2.py +61 -0
  98. tensorbored/compat/proto/op_def_pb2.py +81 -0
  99. tensorbored/compat/proto/resource_handle_pb2.py +48 -0
  100. tensorbored/compat/proto/rewriter_config_pb2.py +93 -0
  101. tensorbored/compat/proto/rpc_options_pb2.py +35 -0
  102. tensorbored/compat/proto/saved_object_graph_pb2.py +193 -0
  103. tensorbored/compat/proto/saver_pb2.py +38 -0
  104. tensorbored/compat/proto/step_stats_pb2.py +116 -0
  105. tensorbored/compat/proto/struct_pb2.py +144 -0
  106. tensorbored/compat/proto/summary_pb2.py +111 -0
  107. tensorbored/compat/proto/tensor_description_pb2.py +38 -0
  108. tensorbored/compat/proto/tensor_pb2.py +68 -0
  109. tensorbored/compat/proto/tensor_shape_pb2.py +46 -0
  110. tensorbored/compat/proto/tfprof_log_pb2.py +307 -0
  111. tensorbored/compat/proto/trackable_object_graph_pb2.py +90 -0
  112. tensorbored/compat/proto/types_pb2.py +105 -0
  113. tensorbored/compat/proto/variable_pb2.py +62 -0
  114. tensorbored/compat/proto/verifier_config_pb2.py +38 -0
  115. tensorbored/compat/proto/versions_pb2.py +35 -0
  116. tensorbored/compat/tensorflow_stub/__init__.py +38 -0
  117. tensorbored/compat/tensorflow_stub/app.py +124 -0
  118. tensorbored/compat/tensorflow_stub/compat/__init__.py +131 -0
  119. tensorbored/compat/tensorflow_stub/compat/v1/__init__.py +20 -0
  120. tensorbored/compat/tensorflow_stub/dtypes.py +692 -0
  121. tensorbored/compat/tensorflow_stub/error_codes.py +169 -0
  122. tensorbored/compat/tensorflow_stub/errors.py +507 -0
  123. tensorbored/compat/tensorflow_stub/flags.py +124 -0
  124. tensorbored/compat/tensorflow_stub/io/__init__.py +17 -0
  125. tensorbored/compat/tensorflow_stub/io/gfile.py +1011 -0
  126. tensorbored/compat/tensorflow_stub/pywrap_tensorflow.py +285 -0
  127. tensorbored/compat/tensorflow_stub/tensor_shape.py +1035 -0
  128. tensorbored/context.py +129 -0
  129. tensorbored/data/__init__.py +0 -0
  130. tensorbored/data/grpc_provider.py +365 -0
  131. tensorbored/data/ingester.py +46 -0
  132. tensorbored/data/proto/__init__.py +0 -0
  133. tensorbored/data/proto/data_provider_pb2.py +517 -0
  134. tensorbored/data/proto/data_provider_pb2_grpc.py +374 -0
  135. tensorbored/data/provider.py +1365 -0
  136. tensorbored/data/server_ingester.py +301 -0
  137. tensorbored/data_compat.py +159 -0
  138. tensorbored/dataclass_compat.py +224 -0
  139. tensorbored/default.py +124 -0
  140. tensorbored/errors.py +130 -0
  141. tensorbored/lazy.py +99 -0
  142. tensorbored/main.py +48 -0
  143. tensorbored/main_lib.py +62 -0
  144. tensorbored/manager.py +487 -0
  145. tensorbored/notebook.py +441 -0
  146. tensorbored/plugin_util.py +266 -0
  147. tensorbored/plugins/__init__.py +0 -0
  148. tensorbored/plugins/audio/__init__.py +0 -0
  149. tensorbored/plugins/audio/audio_plugin.py +229 -0
  150. tensorbored/plugins/audio/metadata.py +69 -0
  151. tensorbored/plugins/audio/plugin_data_pb2.py +37 -0
  152. tensorbored/plugins/audio/summary.py +230 -0
  153. tensorbored/plugins/audio/summary_v2.py +124 -0
  154. tensorbored/plugins/base_plugin.py +367 -0
  155. tensorbored/plugins/core/__init__.py +0 -0
  156. tensorbored/plugins/core/core_plugin.py +981 -0
  157. tensorbored/plugins/custom_scalar/__init__.py +0 -0
  158. tensorbored/plugins/custom_scalar/custom_scalars_plugin.py +320 -0
  159. tensorbored/plugins/custom_scalar/layout_pb2.py +85 -0
  160. tensorbored/plugins/custom_scalar/metadata.py +35 -0
  161. tensorbored/plugins/custom_scalar/summary.py +79 -0
  162. tensorbored/plugins/debugger_v2/__init__.py +0 -0
  163. tensorbored/plugins/debugger_v2/debug_data_multiplexer.py +631 -0
  164. tensorbored/plugins/debugger_v2/debug_data_provider.py +634 -0
  165. tensorbored/plugins/debugger_v2/debugger_v2_plugin.py +504 -0
  166. tensorbored/plugins/distribution/__init__.py +0 -0
  167. tensorbored/plugins/distribution/compressor.py +158 -0
  168. tensorbored/plugins/distribution/distributions_plugin.py +116 -0
  169. tensorbored/plugins/distribution/metadata.py +19 -0
  170. tensorbored/plugins/graph/__init__.py +0 -0
  171. tensorbored/plugins/graph/graph_util.py +129 -0
  172. tensorbored/plugins/graph/graphs_plugin.py +336 -0
  173. tensorbored/plugins/graph/keras_util.py +328 -0
  174. tensorbored/plugins/graph/metadata.py +42 -0
  175. tensorbored/plugins/histogram/__init__.py +0 -0
  176. tensorbored/plugins/histogram/histograms_plugin.py +144 -0
  177. tensorbored/plugins/histogram/metadata.py +63 -0
  178. tensorbored/plugins/histogram/plugin_data_pb2.py +34 -0
  179. tensorbored/plugins/histogram/summary.py +234 -0
  180. tensorbored/plugins/histogram/summary_v2.py +292 -0
  181. tensorbored/plugins/hparams/__init__.py +14 -0
  182. tensorbored/plugins/hparams/_keras.py +93 -0
  183. tensorbored/plugins/hparams/api.py +130 -0
  184. tensorbored/plugins/hparams/api_pb2.py +208 -0
  185. tensorbored/plugins/hparams/backend_context.py +606 -0
  186. tensorbored/plugins/hparams/download_data.py +158 -0
  187. tensorbored/plugins/hparams/error.py +26 -0
  188. tensorbored/plugins/hparams/get_experiment.py +71 -0
  189. tensorbored/plugins/hparams/hparams_plugin.py +206 -0
  190. tensorbored/plugins/hparams/hparams_util_pb2.py +69 -0
  191. tensorbored/plugins/hparams/json_format_compat.py +38 -0
  192. tensorbored/plugins/hparams/list_metric_evals.py +57 -0
  193. tensorbored/plugins/hparams/list_session_groups.py +1040 -0
  194. tensorbored/plugins/hparams/metadata.py +125 -0
  195. tensorbored/plugins/hparams/metrics.py +41 -0
  196. tensorbored/plugins/hparams/plugin_data_pb2.py +69 -0
  197. tensorbored/plugins/hparams/summary.py +205 -0
  198. tensorbored/plugins/hparams/summary_v2.py +597 -0
  199. tensorbored/plugins/image/__init__.py +0 -0
  200. tensorbored/plugins/image/images_plugin.py +232 -0
  201. tensorbored/plugins/image/metadata.py +65 -0
  202. tensorbored/plugins/image/plugin_data_pb2.py +34 -0
  203. tensorbored/plugins/image/summary.py +159 -0
  204. tensorbored/plugins/image/summary_v2.py +130 -0
  205. tensorbored/plugins/mesh/__init__.py +14 -0
  206. tensorbored/plugins/mesh/mesh_plugin.py +292 -0
  207. tensorbored/plugins/mesh/metadata.py +152 -0
  208. tensorbored/plugins/mesh/plugin_data_pb2.py +37 -0
  209. tensorbored/plugins/mesh/summary.py +251 -0
  210. tensorbored/plugins/mesh/summary_v2.py +214 -0
  211. tensorbored/plugins/metrics/__init__.py +0 -0
  212. tensorbored/plugins/metrics/metadata.py +17 -0
  213. tensorbored/plugins/metrics/metrics_plugin.py +623 -0
  214. tensorbored/plugins/pr_curve/__init__.py +0 -0
  215. tensorbored/plugins/pr_curve/metadata.py +75 -0
  216. tensorbored/plugins/pr_curve/plugin_data_pb2.py +34 -0
  217. tensorbored/plugins/pr_curve/pr_curves_plugin.py +241 -0
  218. tensorbored/plugins/pr_curve/summary.py +574 -0
  219. tensorbored/plugins/profile_redirect/__init__.py +0 -0
  220. tensorbored/plugins/profile_redirect/profile_redirect_plugin.py +49 -0
  221. tensorbored/plugins/projector/__init__.py +67 -0
  222. tensorbored/plugins/projector/metadata.py +26 -0
  223. tensorbored/plugins/projector/projector_config_pb2.py +54 -0
  224. tensorbored/plugins/projector/projector_plugin.py +795 -0
  225. tensorbored/plugins/projector/tf_projector_plugin/index.js +32 -0
  226. tensorbored/plugins/projector/tf_projector_plugin/projector_binary.html +524 -0
  227. tensorbored/plugins/projector/tf_projector_plugin/projector_binary.js +15536 -0
  228. tensorbored/plugins/scalar/__init__.py +0 -0
  229. tensorbored/plugins/scalar/metadata.py +60 -0
  230. tensorbored/plugins/scalar/plugin_data_pb2.py +34 -0
  231. tensorbored/plugins/scalar/scalars_plugin.py +181 -0
  232. tensorbored/plugins/scalar/summary.py +109 -0
  233. tensorbored/plugins/scalar/summary_v2.py +124 -0
  234. tensorbored/plugins/text/__init__.py +0 -0
  235. tensorbored/plugins/text/metadata.py +62 -0
  236. tensorbored/plugins/text/plugin_data_pb2.py +34 -0
  237. tensorbored/plugins/text/summary.py +114 -0
  238. tensorbored/plugins/text/summary_v2.py +124 -0
  239. tensorbored/plugins/text/text_plugin.py +288 -0
  240. tensorbored/plugins/wit_redirect/__init__.py +0 -0
  241. tensorbored/plugins/wit_redirect/wit_redirect_plugin.py +49 -0
  242. tensorbored/program.py +910 -0
  243. tensorbored/summary/__init__.py +35 -0
  244. tensorbored/summary/_output.py +124 -0
  245. tensorbored/summary/_tf/__init__.py +14 -0
  246. tensorbored/summary/_tf/summary/__init__.py +178 -0
  247. tensorbored/summary/_writer.py +105 -0
  248. tensorbored/summary/v1.py +51 -0
  249. tensorbored/summary/v2.py +25 -0
  250. tensorbored/summary/writer/__init__.py +13 -0
  251. tensorbored/summary/writer/event_file_writer.py +291 -0
  252. tensorbored/summary/writer/record_writer.py +50 -0
  253. tensorbored/util/__init__.py +0 -0
  254. tensorbored/util/encoder.py +116 -0
  255. tensorbored/util/grpc_util.py +311 -0
  256. tensorbored/util/img_mime_type_detector.py +40 -0
  257. tensorbored/util/io_util.py +20 -0
  258. tensorbored/util/lazy_tensor_creator.py +110 -0
  259. tensorbored/util/op_evaluator.py +104 -0
  260. tensorbored/util/platform_util.py +20 -0
  261. tensorbored/util/tb_logging.py +24 -0
  262. tensorbored/util/tensor_util.py +617 -0
  263. tensorbored/util/timing.py +122 -0
  264. tensorbored/version.py +21 -0
  265. tensorbored/webfiles.zip +0 -0
  266. tensorbored-2.21.0rc1769983804.dist-info/METADATA +49 -0
  267. tensorbored-2.21.0rc1769983804.dist-info/RECORD +271 -0
  268. tensorbored-2.21.0rc1769983804.dist-info/WHEEL +5 -0
  269. tensorbored-2.21.0rc1769983804.dist-info/entry_points.txt +6 -0
  270. tensorbored-2.21.0rc1769983804.dist-info/licenses/LICENSE +739 -0
  271. tensorbored-2.21.0rc1769983804.dist-info/top_level.txt +1 -0
@@ -0,0 +1,342 @@
1
+ # coding: utf-8
2
+ """
3
+
4
+ webencodings
5
+ ~~~~~~~~~~~~
6
+
7
+ This is a Python implementation of the `WHATWG Encoding standard
8
+ <http://encoding.spec.whatwg.org/>`. See README for details.
9
+
10
+ :copyright: Copyright 2012 by Simon Sapin
11
+ :license: BSD, see LICENSE for details.
12
+
13
+ """
14
+
15
+ from __future__ import unicode_literals
16
+
17
+ import codecs
18
+
19
+ from .labels import LABELS
20
+
21
+
22
+ VERSION = '0.5.1'
23
+
24
+
25
+ # Some names in Encoding are not valid Python aliases. Remap these.
26
+ PYTHON_NAMES = {
27
+ 'iso-8859-8-i': 'iso-8859-8',
28
+ 'x-mac-cyrillic': 'mac-cyrillic',
29
+ 'macintosh': 'mac-roman',
30
+ 'windows-874': 'cp874'}
31
+
32
+ CACHE = {}
33
+
34
+
35
+ def ascii_lower(string):
36
+ r"""Transform (only) ASCII letters to lower case: A-Z is mapped to a-z.
37
+
38
+ :param string: An Unicode string.
39
+ :returns: A new Unicode string.
40
+
41
+ This is used for `ASCII case-insensitive
42
+ <http://encoding.spec.whatwg.org/#ascii-case-insensitive>`_
43
+ matching of encoding labels.
44
+ The same matching is also used, among other things,
45
+ for `CSS keywords <http://dev.w3.org/csswg/css-values/#keywords>`_.
46
+
47
+ This is different from the :meth:`~py:str.lower` method of Unicode strings
48
+ which also affect non-ASCII characters,
49
+ sometimes mapping them into the ASCII range:
50
+
51
+ >>> keyword = u'Bac\N{KELVIN SIGN}ground'
52
+ >>> assert keyword.lower() == u'background'
53
+ >>> assert ascii_lower(keyword) != keyword.lower()
54
+ >>> assert ascii_lower(keyword) == u'bac\N{KELVIN SIGN}ground'
55
+
56
+ """
57
+ # This turns out to be faster than unicode.translate()
58
+ return string.encode('utf8').lower().decode('utf8')
59
+
60
+
61
+ def lookup(label):
62
+ """
63
+ Look for an encoding by its label.
64
+ This is the spec’s `get an encoding
65
+ <http://encoding.spec.whatwg.org/#concept-encoding-get>`_ algorithm.
66
+ Supported labels are listed there.
67
+
68
+ :param label: A string.
69
+ :returns:
70
+ An :class:`Encoding` object, or :obj:`None` for an unknown label.
71
+
72
+ """
73
+ # Only strip ASCII whitespace: U+0009, U+000A, U+000C, U+000D, and U+0020.
74
+ label = ascii_lower(label.strip('\t\n\f\r '))
75
+ name = LABELS.get(label)
76
+ if name is None:
77
+ return None
78
+ encoding = CACHE.get(name)
79
+ if encoding is None:
80
+ if name == 'x-user-defined':
81
+ from .x_user_defined import codec_info
82
+ else:
83
+ python_name = PYTHON_NAMES.get(name, name)
84
+ # Any python_name value that gets to here should be valid.
85
+ codec_info = codecs.lookup(python_name)
86
+ encoding = Encoding(name, codec_info)
87
+ CACHE[name] = encoding
88
+ return encoding
89
+
90
+
91
+ def _get_encoding(encoding_or_label):
92
+ """
93
+ Accept either an encoding object or label.
94
+
95
+ :param encoding: An :class:`Encoding` object or a label string.
96
+ :returns: An :class:`Encoding` object.
97
+ :raises: :exc:`~exceptions.LookupError` for an unknown label.
98
+
99
+ """
100
+ if hasattr(encoding_or_label, 'codec_info'):
101
+ return encoding_or_label
102
+
103
+ encoding = lookup(encoding_or_label)
104
+ if encoding is None:
105
+ raise LookupError('Unknown encoding label: %r' % encoding_or_label)
106
+ return encoding
107
+
108
+
109
+ class Encoding(object):
110
+ """Reresents a character encoding such as UTF-8,
111
+ that can be used for decoding or encoding.
112
+
113
+ .. attribute:: name
114
+
115
+ Canonical name of the encoding
116
+
117
+ .. attribute:: codec_info
118
+
119
+ The actual implementation of the encoding,
120
+ a stdlib :class:`~codecs.CodecInfo` object.
121
+ See :func:`codecs.register`.
122
+
123
+ """
124
+ def __init__(self, name, codec_info):
125
+ self.name = name
126
+ self.codec_info = codec_info
127
+
128
+ def __repr__(self):
129
+ return '<Encoding %s>' % self.name
130
+
131
+
132
+ #: The UTF-8 encoding. Should be used for new content and formats.
133
+ UTF8 = lookup('utf-8')
134
+
135
+ _UTF16LE = lookup('utf-16le')
136
+ _UTF16BE = lookup('utf-16be')
137
+
138
+
139
+ def decode(input, fallback_encoding, errors='replace'):
140
+ """
141
+ Decode a single string.
142
+
143
+ :param input: A byte string
144
+ :param fallback_encoding:
145
+ An :class:`Encoding` object or a label string.
146
+ The encoding to use if :obj:`input` does note have a BOM.
147
+ :param errors: Type of error handling. See :func:`codecs.register`.
148
+ :raises: :exc:`~exceptions.LookupError` for an unknown encoding label.
149
+ :return:
150
+ A ``(output, encoding)`` tuple of an Unicode string
151
+ and an :obj:`Encoding`.
152
+
153
+ """
154
+ # Fail early if `encoding` is an invalid label.
155
+ fallback_encoding = _get_encoding(fallback_encoding)
156
+ bom_encoding, input = _detect_bom(input)
157
+ encoding = bom_encoding or fallback_encoding
158
+ return encoding.codec_info.decode(input, errors)[0], encoding
159
+
160
+
161
+ def _detect_bom(input):
162
+ """Return (bom_encoding, input), with any BOM removed from the input."""
163
+ if input.startswith(b'\xFF\xFE'):
164
+ return _UTF16LE, input[2:]
165
+ if input.startswith(b'\xFE\xFF'):
166
+ return _UTF16BE, input[2:]
167
+ if input.startswith(b'\xEF\xBB\xBF'):
168
+ return UTF8, input[3:]
169
+ return None, input
170
+
171
+
172
+ def encode(input, encoding=UTF8, errors='strict'):
173
+ """
174
+ Encode a single string.
175
+
176
+ :param input: An Unicode string.
177
+ :param encoding: An :class:`Encoding` object or a label string.
178
+ :param errors: Type of error handling. See :func:`codecs.register`.
179
+ :raises: :exc:`~exceptions.LookupError` for an unknown encoding label.
180
+ :return: A byte string.
181
+
182
+ """
183
+ return _get_encoding(encoding).codec_info.encode(input, errors)[0]
184
+
185
+
186
+ def iter_decode(input, fallback_encoding, errors='replace'):
187
+ """
188
+ "Pull"-based decoder.
189
+
190
+ :param input:
191
+ An iterable of byte strings.
192
+
193
+ The input is first consumed just enough to determine the encoding
194
+ based on the precense of a BOM,
195
+ then consumed on demand when the return value is.
196
+ :param fallback_encoding:
197
+ An :class:`Encoding` object or a label string.
198
+ The encoding to use if :obj:`input` does note have a BOM.
199
+ :param errors: Type of error handling. See :func:`codecs.register`.
200
+ :raises: :exc:`~exceptions.LookupError` for an unknown encoding label.
201
+ :returns:
202
+ An ``(output, encoding)`` tuple.
203
+ :obj:`output` is an iterable of Unicode strings,
204
+ :obj:`encoding` is the :obj:`Encoding` that is being used.
205
+
206
+ """
207
+
208
+ decoder = IncrementalDecoder(fallback_encoding, errors)
209
+ generator = _iter_decode_generator(input, decoder)
210
+ encoding = next(generator)
211
+ return generator, encoding
212
+
213
+
214
+ def _iter_decode_generator(input, decoder):
215
+ """Return a generator that first yields the :obj:`Encoding`,
216
+ then yields output chukns as Unicode strings.
217
+
218
+ """
219
+ decode = decoder.decode
220
+ input = iter(input)
221
+ for chunck in input:
222
+ output = decode(chunck)
223
+ if output:
224
+ assert decoder.encoding is not None
225
+ yield decoder.encoding
226
+ yield output
227
+ break
228
+ else:
229
+ # Input exhausted without determining the encoding
230
+ output = decode(b'', final=True)
231
+ assert decoder.encoding is not None
232
+ yield decoder.encoding
233
+ if output:
234
+ yield output
235
+ return
236
+
237
+ for chunck in input:
238
+ output = decode(chunck)
239
+ if output:
240
+ yield output
241
+ output = decode(b'', final=True)
242
+ if output:
243
+ yield output
244
+
245
+
246
+ def iter_encode(input, encoding=UTF8, errors='strict'):
247
+ """
248
+ “Pull”-based encoder.
249
+
250
+ :param input: An iterable of Unicode strings.
251
+ :param encoding: An :class:`Encoding` object or a label string.
252
+ :param errors: Type of error handling. See :func:`codecs.register`.
253
+ :raises: :exc:`~exceptions.LookupError` for an unknown encoding label.
254
+ :returns: An iterable of byte strings.
255
+
256
+ """
257
+ # Fail early if `encoding` is an invalid label.
258
+ encode = IncrementalEncoder(encoding, errors).encode
259
+ return _iter_encode_generator(input, encode)
260
+
261
+
262
+ def _iter_encode_generator(input, encode):
263
+ for chunck in input:
264
+ output = encode(chunck)
265
+ if output:
266
+ yield output
267
+ output = encode('', final=True)
268
+ if output:
269
+ yield output
270
+
271
+
272
+ class IncrementalDecoder(object):
273
+ """
274
+ “Push”-based decoder.
275
+
276
+ :param fallback_encoding:
277
+ An :class:`Encoding` object or a label string.
278
+ The encoding to use if :obj:`input` does note have a BOM.
279
+ :param errors: Type of error handling. See :func:`codecs.register`.
280
+ :raises: :exc:`~exceptions.LookupError` for an unknown encoding label.
281
+
282
+ """
283
+ def __init__(self, fallback_encoding, errors='replace'):
284
+ # Fail early if `encoding` is an invalid label.
285
+ self._fallback_encoding = _get_encoding(fallback_encoding)
286
+ self._errors = errors
287
+ self._buffer = b''
288
+ self._decoder = None
289
+ #: The actual :class:`Encoding` that is being used,
290
+ #: or :obj:`None` if that is not determined yet.
291
+ #: (Ie. if there is not enough input yet to determine
292
+ #: if there is a BOM.)
293
+ self.encoding = None # Not known yet.
294
+
295
+ def decode(self, input, final=False):
296
+ """Decode one chunk of the input.
297
+
298
+ :param input: A byte string.
299
+ :param final:
300
+ Indicate that no more input is available.
301
+ Must be :obj:`True` if this is the last call.
302
+ :returns: An Unicode string.
303
+
304
+ """
305
+ decoder = self._decoder
306
+ if decoder is not None:
307
+ return decoder(input, final)
308
+
309
+ input = self._buffer + input
310
+ encoding, input = _detect_bom(input)
311
+ if encoding is None:
312
+ if len(input) < 3 and not final: # Not enough data yet.
313
+ self._buffer = input
314
+ return ''
315
+ else: # No BOM
316
+ encoding = self._fallback_encoding
317
+ decoder = encoding.codec_info.incrementaldecoder(self._errors).decode
318
+ self._decoder = decoder
319
+ self.encoding = encoding
320
+ return decoder(input, final)
321
+
322
+
323
+ class IncrementalEncoder(object):
324
+ """
325
+ “Push”-based encoder.
326
+
327
+ :param encoding: An :class:`Encoding` object or a label string.
328
+ :param errors: Type of error handling. See :func:`codecs.register`.
329
+ :raises: :exc:`~exceptions.LookupError` for an unknown encoding label.
330
+
331
+ .. method:: encode(input, final=False)
332
+
333
+ :param input: An Unicode string.
334
+ :param final:
335
+ Indicate that no more input is available.
336
+ Must be :obj:`True` if this is the last call.
337
+ :returns: A byte string.
338
+
339
+ """
340
+ def __init__(self, encoding=UTF8, errors='strict'):
341
+ encoding = _get_encoding(encoding)
342
+ self.encode = encoding.codec_info.incrementalencoder(errors).encode
@@ -0,0 +1,231 @@
1
+ """
2
+
3
+ webencodings.labels
4
+ ~~~~~~~~~~~~~~~~~~~
5
+
6
+ Map encoding labels to their name.
7
+
8
+ :copyright: Copyright 2012 by Simon Sapin
9
+ :license: BSD, see LICENSE for details.
10
+
11
+ """
12
+
13
+ # XXX Do not edit!
14
+ # This file is automatically generated by mklabels.py
15
+
16
+ LABELS = {
17
+ 'unicode-1-1-utf-8': 'utf-8',
18
+ 'utf-8': 'utf-8',
19
+ 'utf8': 'utf-8',
20
+ '866': 'ibm866',
21
+ 'cp866': 'ibm866',
22
+ 'csibm866': 'ibm866',
23
+ 'ibm866': 'ibm866',
24
+ 'csisolatin2': 'iso-8859-2',
25
+ 'iso-8859-2': 'iso-8859-2',
26
+ 'iso-ir-101': 'iso-8859-2',
27
+ 'iso8859-2': 'iso-8859-2',
28
+ 'iso88592': 'iso-8859-2',
29
+ 'iso_8859-2': 'iso-8859-2',
30
+ 'iso_8859-2:1987': 'iso-8859-2',
31
+ 'l2': 'iso-8859-2',
32
+ 'latin2': 'iso-8859-2',
33
+ 'csisolatin3': 'iso-8859-3',
34
+ 'iso-8859-3': 'iso-8859-3',
35
+ 'iso-ir-109': 'iso-8859-3',
36
+ 'iso8859-3': 'iso-8859-3',
37
+ 'iso88593': 'iso-8859-3',
38
+ 'iso_8859-3': 'iso-8859-3',
39
+ 'iso_8859-3:1988': 'iso-8859-3',
40
+ 'l3': 'iso-8859-3',
41
+ 'latin3': 'iso-8859-3',
42
+ 'csisolatin4': 'iso-8859-4',
43
+ 'iso-8859-4': 'iso-8859-4',
44
+ 'iso-ir-110': 'iso-8859-4',
45
+ 'iso8859-4': 'iso-8859-4',
46
+ 'iso88594': 'iso-8859-4',
47
+ 'iso_8859-4': 'iso-8859-4',
48
+ 'iso_8859-4:1988': 'iso-8859-4',
49
+ 'l4': 'iso-8859-4',
50
+ 'latin4': 'iso-8859-4',
51
+ 'csisolatincyrillic': 'iso-8859-5',
52
+ 'cyrillic': 'iso-8859-5',
53
+ 'iso-8859-5': 'iso-8859-5',
54
+ 'iso-ir-144': 'iso-8859-5',
55
+ 'iso8859-5': 'iso-8859-5',
56
+ 'iso88595': 'iso-8859-5',
57
+ 'iso_8859-5': 'iso-8859-5',
58
+ 'iso_8859-5:1988': 'iso-8859-5',
59
+ 'arabic': 'iso-8859-6',
60
+ 'asmo-708': 'iso-8859-6',
61
+ 'csiso88596e': 'iso-8859-6',
62
+ 'csiso88596i': 'iso-8859-6',
63
+ 'csisolatinarabic': 'iso-8859-6',
64
+ 'ecma-114': 'iso-8859-6',
65
+ 'iso-8859-6': 'iso-8859-6',
66
+ 'iso-8859-6-e': 'iso-8859-6',
67
+ 'iso-8859-6-i': 'iso-8859-6',
68
+ 'iso-ir-127': 'iso-8859-6',
69
+ 'iso8859-6': 'iso-8859-6',
70
+ 'iso88596': 'iso-8859-6',
71
+ 'iso_8859-6': 'iso-8859-6',
72
+ 'iso_8859-6:1987': 'iso-8859-6',
73
+ 'csisolatingreek': 'iso-8859-7',
74
+ 'ecma-118': 'iso-8859-7',
75
+ 'elot_928': 'iso-8859-7',
76
+ 'greek': 'iso-8859-7',
77
+ 'greek8': 'iso-8859-7',
78
+ 'iso-8859-7': 'iso-8859-7',
79
+ 'iso-ir-126': 'iso-8859-7',
80
+ 'iso8859-7': 'iso-8859-7',
81
+ 'iso88597': 'iso-8859-7',
82
+ 'iso_8859-7': 'iso-8859-7',
83
+ 'iso_8859-7:1987': 'iso-8859-7',
84
+ 'sun_eu_greek': 'iso-8859-7',
85
+ 'csiso88598e': 'iso-8859-8',
86
+ 'csisolatinhebrew': 'iso-8859-8',
87
+ 'hebrew': 'iso-8859-8',
88
+ 'iso-8859-8': 'iso-8859-8',
89
+ 'iso-8859-8-e': 'iso-8859-8',
90
+ 'iso-ir-138': 'iso-8859-8',
91
+ 'iso8859-8': 'iso-8859-8',
92
+ 'iso88598': 'iso-8859-8',
93
+ 'iso_8859-8': 'iso-8859-8',
94
+ 'iso_8859-8:1988': 'iso-8859-8',
95
+ 'visual': 'iso-8859-8',
96
+ 'csiso88598i': 'iso-8859-8-i',
97
+ 'iso-8859-8-i': 'iso-8859-8-i',
98
+ 'logical': 'iso-8859-8-i',
99
+ 'csisolatin6': 'iso-8859-10',
100
+ 'iso-8859-10': 'iso-8859-10',
101
+ 'iso-ir-157': 'iso-8859-10',
102
+ 'iso8859-10': 'iso-8859-10',
103
+ 'iso885910': 'iso-8859-10',
104
+ 'l6': 'iso-8859-10',
105
+ 'latin6': 'iso-8859-10',
106
+ 'iso-8859-13': 'iso-8859-13',
107
+ 'iso8859-13': 'iso-8859-13',
108
+ 'iso885913': 'iso-8859-13',
109
+ 'iso-8859-14': 'iso-8859-14',
110
+ 'iso8859-14': 'iso-8859-14',
111
+ 'iso885914': 'iso-8859-14',
112
+ 'csisolatin9': 'iso-8859-15',
113
+ 'iso-8859-15': 'iso-8859-15',
114
+ 'iso8859-15': 'iso-8859-15',
115
+ 'iso885915': 'iso-8859-15',
116
+ 'iso_8859-15': 'iso-8859-15',
117
+ 'l9': 'iso-8859-15',
118
+ 'iso-8859-16': 'iso-8859-16',
119
+ 'cskoi8r': 'koi8-r',
120
+ 'koi': 'koi8-r',
121
+ 'koi8': 'koi8-r',
122
+ 'koi8-r': 'koi8-r',
123
+ 'koi8_r': 'koi8-r',
124
+ 'koi8-u': 'koi8-u',
125
+ 'csmacintosh': 'macintosh',
126
+ 'mac': 'macintosh',
127
+ 'macintosh': 'macintosh',
128
+ 'x-mac-roman': 'macintosh',
129
+ 'dos-874': 'windows-874',
130
+ 'iso-8859-11': 'windows-874',
131
+ 'iso8859-11': 'windows-874',
132
+ 'iso885911': 'windows-874',
133
+ 'tis-620': 'windows-874',
134
+ 'windows-874': 'windows-874',
135
+ 'cp1250': 'windows-1250',
136
+ 'windows-1250': 'windows-1250',
137
+ 'x-cp1250': 'windows-1250',
138
+ 'cp1251': 'windows-1251',
139
+ 'windows-1251': 'windows-1251',
140
+ 'x-cp1251': 'windows-1251',
141
+ 'ansi_x3.4-1968': 'windows-1252',
142
+ 'ascii': 'windows-1252',
143
+ 'cp1252': 'windows-1252',
144
+ 'cp819': 'windows-1252',
145
+ 'csisolatin1': 'windows-1252',
146
+ 'ibm819': 'windows-1252',
147
+ 'iso-8859-1': 'windows-1252',
148
+ 'iso-ir-100': 'windows-1252',
149
+ 'iso8859-1': 'windows-1252',
150
+ 'iso88591': 'windows-1252',
151
+ 'iso_8859-1': 'windows-1252',
152
+ 'iso_8859-1:1987': 'windows-1252',
153
+ 'l1': 'windows-1252',
154
+ 'latin1': 'windows-1252',
155
+ 'us-ascii': 'windows-1252',
156
+ 'windows-1252': 'windows-1252',
157
+ 'x-cp1252': 'windows-1252',
158
+ 'cp1253': 'windows-1253',
159
+ 'windows-1253': 'windows-1253',
160
+ 'x-cp1253': 'windows-1253',
161
+ 'cp1254': 'windows-1254',
162
+ 'csisolatin5': 'windows-1254',
163
+ 'iso-8859-9': 'windows-1254',
164
+ 'iso-ir-148': 'windows-1254',
165
+ 'iso8859-9': 'windows-1254',
166
+ 'iso88599': 'windows-1254',
167
+ 'iso_8859-9': 'windows-1254',
168
+ 'iso_8859-9:1989': 'windows-1254',
169
+ 'l5': 'windows-1254',
170
+ 'latin5': 'windows-1254',
171
+ 'windows-1254': 'windows-1254',
172
+ 'x-cp1254': 'windows-1254',
173
+ 'cp1255': 'windows-1255',
174
+ 'windows-1255': 'windows-1255',
175
+ 'x-cp1255': 'windows-1255',
176
+ 'cp1256': 'windows-1256',
177
+ 'windows-1256': 'windows-1256',
178
+ 'x-cp1256': 'windows-1256',
179
+ 'cp1257': 'windows-1257',
180
+ 'windows-1257': 'windows-1257',
181
+ 'x-cp1257': 'windows-1257',
182
+ 'cp1258': 'windows-1258',
183
+ 'windows-1258': 'windows-1258',
184
+ 'x-cp1258': 'windows-1258',
185
+ 'x-mac-cyrillic': 'x-mac-cyrillic',
186
+ 'x-mac-ukrainian': 'x-mac-cyrillic',
187
+ 'chinese': 'gbk',
188
+ 'csgb2312': 'gbk',
189
+ 'csiso58gb231280': 'gbk',
190
+ 'gb2312': 'gbk',
191
+ 'gb_2312': 'gbk',
192
+ 'gb_2312-80': 'gbk',
193
+ 'gbk': 'gbk',
194
+ 'iso-ir-58': 'gbk',
195
+ 'x-gbk': 'gbk',
196
+ 'gb18030': 'gb18030',
197
+ 'hz-gb-2312': 'hz-gb-2312',
198
+ 'big5': 'big5',
199
+ 'big5-hkscs': 'big5',
200
+ 'cn-big5': 'big5',
201
+ 'csbig5': 'big5',
202
+ 'x-x-big5': 'big5',
203
+ 'cseucpkdfmtjapanese': 'euc-jp',
204
+ 'euc-jp': 'euc-jp',
205
+ 'x-euc-jp': 'euc-jp',
206
+ 'csiso2022jp': 'iso-2022-jp',
207
+ 'iso-2022-jp': 'iso-2022-jp',
208
+ 'csshiftjis': 'shift_jis',
209
+ 'ms_kanji': 'shift_jis',
210
+ 'shift-jis': 'shift_jis',
211
+ 'shift_jis': 'shift_jis',
212
+ 'sjis': 'shift_jis',
213
+ 'windows-31j': 'shift_jis',
214
+ 'x-sjis': 'shift_jis',
215
+ 'cseuckr': 'euc-kr',
216
+ 'csksc56011987': 'euc-kr',
217
+ 'euc-kr': 'euc-kr',
218
+ 'iso-ir-149': 'euc-kr',
219
+ 'korean': 'euc-kr',
220
+ 'ks_c_5601-1987': 'euc-kr',
221
+ 'ks_c_5601-1989': 'euc-kr',
222
+ 'ksc5601': 'euc-kr',
223
+ 'ksc_5601': 'euc-kr',
224
+ 'windows-949': 'euc-kr',
225
+ 'csiso2022kr': 'iso-2022-kr',
226
+ 'iso-2022-kr': 'iso-2022-kr',
227
+ 'utf-16be': 'utf-16be',
228
+ 'utf-16': 'utf-16le',
229
+ 'utf-16le': 'utf-16le',
230
+ 'x-user-defined': 'x-user-defined',
231
+ }
@@ -0,0 +1,59 @@
1
+ """
2
+
3
+ webencodings.mklabels
4
+ ~~~~~~~~~~~~~~~~~~~~~
5
+
6
+ Regenarate the webencodings.labels module.
7
+
8
+ :copyright: Copyright 2012 by Simon Sapin
9
+ :license: BSD, see LICENSE for details.
10
+
11
+ """
12
+
13
+ import json
14
+ try:
15
+ from urllib import urlopen
16
+ except ImportError:
17
+ from urllib.request import urlopen
18
+
19
+
20
+ def assert_lower(string):
21
+ assert string == string.lower()
22
+ return string
23
+
24
+
25
+ def generate(url):
26
+ parts = ['''\
27
+ """
28
+
29
+ webencodings.labels
30
+ ~~~~~~~~~~~~~~~~~~~
31
+
32
+ Map encoding labels to their name.
33
+
34
+ :copyright: Copyright 2012 by Simon Sapin
35
+ :license: BSD, see LICENSE for details.
36
+
37
+ """
38
+
39
+ # XXX Do not edit!
40
+ # This file is automatically generated by mklabels.py
41
+
42
+ LABELS = {
43
+ ''']
44
+ labels = [
45
+ (repr(assert_lower(label)).lstrip('u'),
46
+ repr(encoding['name']).lstrip('u'))
47
+ for category in json.loads(urlopen(url).read().decode('ascii'))
48
+ for encoding in category['encodings']
49
+ for label in encoding['labels']]
50
+ max_len = max(len(label) for label, name in labels)
51
+ parts.extend(
52
+ ' %s:%s %s,\n' % (label, ' ' * (max_len - len(label)), name)
53
+ for label, name in labels)
54
+ parts.append('}')
55
+ return ''.join(parts)
56
+
57
+
58
+ if __name__ == '__main__':
59
+ print(generate('http://encoding.spec.whatwg.org/encodings.json'))