wandb 0.18.1__py3-none-macosx_11_0_x86_64.whl

Sign up to get free protection for your applications and to get access to all the features.
Files changed (826) hide show
  1. package_readme.md +89 -0
  2. wandb/__init__.py +245 -0
  3. wandb/__init__.pyi +1084 -0
  4. wandb/__main__.py +3 -0
  5. wandb/_globals.py +19 -0
  6. wandb/agents/__init__.py +0 -0
  7. wandb/agents/pyagent.py +363 -0
  8. wandb/analytics/__init__.py +3 -0
  9. wandb/analytics/sentry.py +266 -0
  10. wandb/apis/__init__.py +48 -0
  11. wandb/apis/attrs.py +40 -0
  12. wandb/apis/importers/__init__.py +1 -0
  13. wandb/apis/importers/internals/internal.py +385 -0
  14. wandb/apis/importers/internals/protocols.py +99 -0
  15. wandb/apis/importers/internals/util.py +78 -0
  16. wandb/apis/importers/mlflow.py +254 -0
  17. wandb/apis/importers/validation.py +108 -0
  18. wandb/apis/importers/wandb.py +1603 -0
  19. wandb/apis/internal.py +229 -0
  20. wandb/apis/normalize.py +89 -0
  21. wandb/apis/paginator.py +81 -0
  22. wandb/apis/public/__init__.py +34 -0
  23. wandb/apis/public/api.py +1179 -0
  24. wandb/apis/public/artifacts.py +1086 -0
  25. wandb/apis/public/const.py +4 -0
  26. wandb/apis/public/files.py +195 -0
  27. wandb/apis/public/history.py +149 -0
  28. wandb/apis/public/jobs.py +651 -0
  29. wandb/apis/public/projects.py +154 -0
  30. wandb/apis/public/query_generator.py +166 -0
  31. wandb/apis/public/reports.py +469 -0
  32. wandb/apis/public/runs.py +903 -0
  33. wandb/apis/public/sweeps.py +240 -0
  34. wandb/apis/public/teams.py +198 -0
  35. wandb/apis/public/users.py +136 -0
  36. wandb/apis/reports/__init__.py +1 -0
  37. wandb/apis/reports/v1/__init__.py +8 -0
  38. wandb/apis/reports/v2/__init__.py +8 -0
  39. wandb/apis/workspaces/__init__.py +8 -0
  40. wandb/beta/workflows.py +288 -0
  41. wandb/bin/wandb-core +0 -0
  42. wandb/cli/__init__.py +0 -0
  43. wandb/cli/cli.py +3007 -0
  44. wandb/data_types.py +63 -0
  45. wandb/docker/__init__.py +342 -0
  46. wandb/docker/auth.py +436 -0
  47. wandb/docker/wandb-entrypoint.sh +33 -0
  48. wandb/docker/www_authenticate.py +94 -0
  49. wandb/env.py +514 -0
  50. wandb/errors/__init__.py +46 -0
  51. wandb/errors/term.py +103 -0
  52. wandb/errors/util.py +57 -0
  53. wandb/filesync/__init__.py +0 -0
  54. wandb/filesync/dir_watcher.py +403 -0
  55. wandb/filesync/stats.py +100 -0
  56. wandb/filesync/step_checksum.py +142 -0
  57. wandb/filesync/step_prepare.py +179 -0
  58. wandb/filesync/step_upload.py +290 -0
  59. wandb/filesync/upload_job.py +142 -0
  60. wandb/integration/__init__.py +0 -0
  61. wandb/integration/catboost/__init__.py +5 -0
  62. wandb/integration/catboost/catboost.py +178 -0
  63. wandb/integration/cohere/__init__.py +3 -0
  64. wandb/integration/cohere/cohere.py +21 -0
  65. wandb/integration/cohere/resolver.py +347 -0
  66. wandb/integration/diffusers/__init__.py +3 -0
  67. wandb/integration/diffusers/autologger.py +76 -0
  68. wandb/integration/diffusers/pipeline_resolver.py +50 -0
  69. wandb/integration/diffusers/resolvers/__init__.py +9 -0
  70. wandb/integration/diffusers/resolvers/multimodal.py +882 -0
  71. wandb/integration/diffusers/resolvers/utils.py +102 -0
  72. wandb/integration/fastai/__init__.py +249 -0
  73. wandb/integration/gym/__init__.py +105 -0
  74. wandb/integration/huggingface/__init__.py +3 -0
  75. wandb/integration/huggingface/huggingface.py +18 -0
  76. wandb/integration/huggingface/resolver.py +213 -0
  77. wandb/integration/keras/__init__.py +11 -0
  78. wandb/integration/keras/callbacks/__init__.py +5 -0
  79. wandb/integration/keras/callbacks/metrics_logger.py +136 -0
  80. wandb/integration/keras/callbacks/model_checkpoint.py +195 -0
  81. wandb/integration/keras/callbacks/tables_builder.py +226 -0
  82. wandb/integration/keras/keras.py +1091 -0
  83. wandb/integration/kfp/__init__.py +6 -0
  84. wandb/integration/kfp/helpers.py +28 -0
  85. wandb/integration/kfp/kfp_patch.py +324 -0
  86. wandb/integration/kfp/wandb_logging.py +182 -0
  87. wandb/integration/langchain/__init__.py +3 -0
  88. wandb/integration/langchain/wandb_tracer.py +48 -0
  89. wandb/integration/lightgbm/__init__.py +239 -0
  90. wandb/integration/lightning/__init__.py +0 -0
  91. wandb/integration/lightning/fabric/__init__.py +3 -0
  92. wandb/integration/lightning/fabric/logger.py +762 -0
  93. wandb/integration/magic.py +556 -0
  94. wandb/integration/metaflow/__init__.py +3 -0
  95. wandb/integration/metaflow/metaflow.py +383 -0
  96. wandb/integration/openai/__init__.py +3 -0
  97. wandb/integration/openai/fine_tuning.py +480 -0
  98. wandb/integration/openai/openai.py +22 -0
  99. wandb/integration/openai/resolver.py +240 -0
  100. wandb/integration/prodigy/__init__.py +3 -0
  101. wandb/integration/prodigy/prodigy.py +299 -0
  102. wandb/integration/sacred/__init__.py +117 -0
  103. wandb/integration/sagemaker/__init__.py +12 -0
  104. wandb/integration/sagemaker/auth.py +28 -0
  105. wandb/integration/sagemaker/config.py +49 -0
  106. wandb/integration/sagemaker/files.py +3 -0
  107. wandb/integration/sagemaker/resources.py +34 -0
  108. wandb/integration/sb3/__init__.py +3 -0
  109. wandb/integration/sb3/sb3.py +153 -0
  110. wandb/integration/sklearn/__init__.py +37 -0
  111. wandb/integration/sklearn/calculate/__init__.py +32 -0
  112. wandb/integration/sklearn/calculate/calibration_curves.py +125 -0
  113. wandb/integration/sklearn/calculate/class_proportions.py +68 -0
  114. wandb/integration/sklearn/calculate/confusion_matrix.py +93 -0
  115. wandb/integration/sklearn/calculate/decision_boundaries.py +40 -0
  116. wandb/integration/sklearn/calculate/elbow_curve.py +55 -0
  117. wandb/integration/sklearn/calculate/feature_importances.py +67 -0
  118. wandb/integration/sklearn/calculate/learning_curve.py +64 -0
  119. wandb/integration/sklearn/calculate/outlier_candidates.py +69 -0
  120. wandb/integration/sklearn/calculate/residuals.py +86 -0
  121. wandb/integration/sklearn/calculate/silhouette.py +118 -0
  122. wandb/integration/sklearn/calculate/summary_metrics.py +62 -0
  123. wandb/integration/sklearn/plot/__init__.py +35 -0
  124. wandb/integration/sklearn/plot/classifier.py +329 -0
  125. wandb/integration/sklearn/plot/clusterer.py +146 -0
  126. wandb/integration/sklearn/plot/regressor.py +121 -0
  127. wandb/integration/sklearn/plot/shared.py +91 -0
  128. wandb/integration/sklearn/utils.py +183 -0
  129. wandb/integration/tensorboard/__init__.py +10 -0
  130. wandb/integration/tensorboard/log.py +355 -0
  131. wandb/integration/tensorboard/monkeypatch.py +185 -0
  132. wandb/integration/tensorflow/__init__.py +5 -0
  133. wandb/integration/tensorflow/estimator_hook.py +54 -0
  134. wandb/integration/torch/__init__.py +0 -0
  135. wandb/integration/torch/wandb_torch.py +554 -0
  136. wandb/integration/ultralytics/__init__.py +11 -0
  137. wandb/integration/ultralytics/bbox_utils.py +208 -0
  138. wandb/integration/ultralytics/callback.py +524 -0
  139. wandb/integration/ultralytics/classification_utils.py +83 -0
  140. wandb/integration/ultralytics/mask_utils.py +202 -0
  141. wandb/integration/ultralytics/pose_utils.py +103 -0
  142. wandb/integration/xgboost/__init__.py +11 -0
  143. wandb/integration/xgboost/xgboost.py +189 -0
  144. wandb/integration/yolov8/__init__.py +0 -0
  145. wandb/integration/yolov8/yolov8.py +284 -0
  146. wandb/jupyter.py +515 -0
  147. wandb/magic.py +3 -0
  148. wandb/mpmain/__init__.py +0 -0
  149. wandb/mpmain/__main__.py +1 -0
  150. wandb/old/__init__.py +0 -0
  151. wandb/old/core.py +131 -0
  152. wandb/old/settings.py +173 -0
  153. wandb/old/summary.py +440 -0
  154. wandb/plot/__init__.py +19 -0
  155. wandb/plot/bar.py +42 -0
  156. wandb/plot/confusion_matrix.py +99 -0
  157. wandb/plot/histogram.py +36 -0
  158. wandb/plot/line.py +40 -0
  159. wandb/plot/line_series.py +88 -0
  160. wandb/plot/pr_curve.py +136 -0
  161. wandb/plot/roc_curve.py +118 -0
  162. wandb/plot/scatter.py +32 -0
  163. wandb/plot/utils.py +183 -0
  164. wandb/proto/__init__.py +0 -0
  165. wandb/proto/v3/__init__.py +0 -0
  166. wandb/proto/v3/wandb_base_pb2.py +55 -0
  167. wandb/proto/v3/wandb_internal_pb2.py +1608 -0
  168. wandb/proto/v3/wandb_server_pb2.py +208 -0
  169. wandb/proto/v3/wandb_settings_pb2.py +112 -0
  170. wandb/proto/v3/wandb_telemetry_pb2.py +106 -0
  171. wandb/proto/v4/__init__.py +0 -0
  172. wandb/proto/v4/wandb_base_pb2.py +30 -0
  173. wandb/proto/v4/wandb_internal_pb2.py +360 -0
  174. wandb/proto/v4/wandb_server_pb2.py +63 -0
  175. wandb/proto/v4/wandb_settings_pb2.py +45 -0
  176. wandb/proto/v4/wandb_telemetry_pb2.py +41 -0
  177. wandb/proto/v5/wandb_base_pb2.py +31 -0
  178. wandb/proto/v5/wandb_internal_pb2.py +361 -0
  179. wandb/proto/v5/wandb_server_pb2.py +64 -0
  180. wandb/proto/v5/wandb_settings_pb2.py +46 -0
  181. wandb/proto/v5/wandb_telemetry_pb2.py +42 -0
  182. wandb/proto/wandb_base_pb2.py +10 -0
  183. wandb/proto/wandb_deprecated.py +53 -0
  184. wandb/proto/wandb_generate_deprecated.py +34 -0
  185. wandb/proto/wandb_generate_proto.py +49 -0
  186. wandb/proto/wandb_internal_pb2.py +16 -0
  187. wandb/proto/wandb_server_pb2.py +10 -0
  188. wandb/proto/wandb_settings_pb2.py +10 -0
  189. wandb/proto/wandb_telemetry_pb2.py +10 -0
  190. wandb/py.typed +0 -0
  191. wandb/sdk/__init__.py +37 -0
  192. wandb/sdk/artifacts/__init__.py +0 -0
  193. wandb/sdk/artifacts/_validators.py +45 -0
  194. wandb/sdk/artifacts/artifact.py +2415 -0
  195. wandb/sdk/artifacts/artifact_download_logger.py +43 -0
  196. wandb/sdk/artifacts/artifact_file_cache.py +251 -0
  197. wandb/sdk/artifacts/artifact_instance_cache.py +15 -0
  198. wandb/sdk/artifacts/artifact_manifest.py +72 -0
  199. wandb/sdk/artifacts/artifact_manifest_entry.py +247 -0
  200. wandb/sdk/artifacts/artifact_manifests/__init__.py +0 -0
  201. wandb/sdk/artifacts/artifact_manifests/artifact_manifest_v1.py +90 -0
  202. wandb/sdk/artifacts/artifact_saver.py +267 -0
  203. wandb/sdk/artifacts/artifact_state.py +11 -0
  204. wandb/sdk/artifacts/artifact_ttl.py +7 -0
  205. wandb/sdk/artifacts/exceptions.py +56 -0
  206. wandb/sdk/artifacts/staging.py +25 -0
  207. wandb/sdk/artifacts/storage_handler.py +60 -0
  208. wandb/sdk/artifacts/storage_handlers/__init__.py +0 -0
  209. wandb/sdk/artifacts/storage_handlers/azure_handler.py +206 -0
  210. wandb/sdk/artifacts/storage_handlers/gcs_handler.py +226 -0
  211. wandb/sdk/artifacts/storage_handlers/http_handler.py +113 -0
  212. wandb/sdk/artifacts/storage_handlers/local_file_handler.py +139 -0
  213. wandb/sdk/artifacts/storage_handlers/multi_handler.py +54 -0
  214. wandb/sdk/artifacts/storage_handlers/s3_handler.py +300 -0
  215. wandb/sdk/artifacts/storage_handlers/tracking_handler.py +70 -0
  216. wandb/sdk/artifacts/storage_handlers/wb_artifact_handler.py +133 -0
  217. wandb/sdk/artifacts/storage_handlers/wb_local_artifact_handler.py +72 -0
  218. wandb/sdk/artifacts/storage_layout.py +6 -0
  219. wandb/sdk/artifacts/storage_policies/__init__.py +4 -0
  220. wandb/sdk/artifacts/storage_policies/register.py +1 -0
  221. wandb/sdk/artifacts/storage_policies/wandb_storage_policy.py +376 -0
  222. wandb/sdk/artifacts/storage_policy.py +72 -0
  223. wandb/sdk/backend/__init__.py +0 -0
  224. wandb/sdk/backend/backend.py +240 -0
  225. wandb/sdk/data_types/__init__.py +0 -0
  226. wandb/sdk/data_types/_dtypes.py +914 -0
  227. wandb/sdk/data_types/_private.py +10 -0
  228. wandb/sdk/data_types/audio.py +165 -0
  229. wandb/sdk/data_types/base_types/__init__.py +0 -0
  230. wandb/sdk/data_types/base_types/json_metadata.py +55 -0
  231. wandb/sdk/data_types/base_types/media.py +315 -0
  232. wandb/sdk/data_types/base_types/wb_value.py +274 -0
  233. wandb/sdk/data_types/bokeh.py +70 -0
  234. wandb/sdk/data_types/graph.py +405 -0
  235. wandb/sdk/data_types/helper_types/__init__.py +0 -0
  236. wandb/sdk/data_types/helper_types/bounding_boxes_2d.py +295 -0
  237. wandb/sdk/data_types/helper_types/classes.py +159 -0
  238. wandb/sdk/data_types/helper_types/image_mask.py +235 -0
  239. wandb/sdk/data_types/histogram.py +96 -0
  240. wandb/sdk/data_types/html.py +115 -0
  241. wandb/sdk/data_types/image.py +845 -0
  242. wandb/sdk/data_types/molecule.py +241 -0
  243. wandb/sdk/data_types/object_3d.py +474 -0
  244. wandb/sdk/data_types/plotly.py +82 -0
  245. wandb/sdk/data_types/saved_model.py +446 -0
  246. wandb/sdk/data_types/table.py +1204 -0
  247. wandb/sdk/data_types/trace_tree.py +438 -0
  248. wandb/sdk/data_types/utils.py +229 -0
  249. wandb/sdk/data_types/video.py +247 -0
  250. wandb/sdk/integration_utils/__init__.py +0 -0
  251. wandb/sdk/integration_utils/auto_logging.py +239 -0
  252. wandb/sdk/integration_utils/data_logging.py +475 -0
  253. wandb/sdk/interface/__init__.py +0 -0
  254. wandb/sdk/interface/constants.py +4 -0
  255. wandb/sdk/interface/interface.py +996 -0
  256. wandb/sdk/interface/interface_queue.py +59 -0
  257. wandb/sdk/interface/interface_relay.py +53 -0
  258. wandb/sdk/interface/interface_shared.py +549 -0
  259. wandb/sdk/interface/interface_sock.py +61 -0
  260. wandb/sdk/interface/message_future.py +27 -0
  261. wandb/sdk/interface/message_future_poll.py +50 -0
  262. wandb/sdk/interface/router.py +118 -0
  263. wandb/sdk/interface/router_queue.py +44 -0
  264. wandb/sdk/interface/router_relay.py +39 -0
  265. wandb/sdk/interface/router_sock.py +36 -0
  266. wandb/sdk/interface/summary_record.py +67 -0
  267. wandb/sdk/internal/__init__.py +0 -0
  268. wandb/sdk/internal/context.py +89 -0
  269. wandb/sdk/internal/datastore.py +297 -0
  270. wandb/sdk/internal/file_pusher.py +181 -0
  271. wandb/sdk/internal/file_stream.py +695 -0
  272. wandb/sdk/internal/flow_control.py +263 -0
  273. wandb/sdk/internal/handler.py +911 -0
  274. wandb/sdk/internal/internal.py +417 -0
  275. wandb/sdk/internal/internal_api.py +4287 -0
  276. wandb/sdk/internal/internal_util.py +100 -0
  277. wandb/sdk/internal/job_builder.py +629 -0
  278. wandb/sdk/internal/profiler.py +78 -0
  279. wandb/sdk/internal/progress.py +83 -0
  280. wandb/sdk/internal/run.py +25 -0
  281. wandb/sdk/internal/sample.py +70 -0
  282. wandb/sdk/internal/sender.py +1729 -0
  283. wandb/sdk/internal/sender_config.py +197 -0
  284. wandb/sdk/internal/settings_static.py +90 -0
  285. wandb/sdk/internal/system/__init__.py +0 -0
  286. wandb/sdk/internal/system/assets/__init__.py +27 -0
  287. wandb/sdk/internal/system/assets/aggregators.py +37 -0
  288. wandb/sdk/internal/system/assets/asset_registry.py +20 -0
  289. wandb/sdk/internal/system/assets/cpu.py +163 -0
  290. wandb/sdk/internal/system/assets/disk.py +210 -0
  291. wandb/sdk/internal/system/assets/gpu.py +416 -0
  292. wandb/sdk/internal/system/assets/gpu_amd.py +239 -0
  293. wandb/sdk/internal/system/assets/gpu_apple.py +177 -0
  294. wandb/sdk/internal/system/assets/interfaces.py +207 -0
  295. wandb/sdk/internal/system/assets/ipu.py +177 -0
  296. wandb/sdk/internal/system/assets/memory.py +166 -0
  297. wandb/sdk/internal/system/assets/network.py +125 -0
  298. wandb/sdk/internal/system/assets/open_metrics.py +299 -0
  299. wandb/sdk/internal/system/assets/tpu.py +154 -0
  300. wandb/sdk/internal/system/assets/trainium.py +399 -0
  301. wandb/sdk/internal/system/env_probe_helpers.py +13 -0
  302. wandb/sdk/internal/system/system_info.py +249 -0
  303. wandb/sdk/internal/system/system_monitor.py +229 -0
  304. wandb/sdk/internal/tb_watcher.py +518 -0
  305. wandb/sdk/internal/thread_local_settings.py +18 -0
  306. wandb/sdk/internal/update.py +113 -0
  307. wandb/sdk/internal/writer.py +206 -0
  308. wandb/sdk/launch/__init__.py +14 -0
  309. wandb/sdk/launch/_launch.py +330 -0
  310. wandb/sdk/launch/_launch_add.py +255 -0
  311. wandb/sdk/launch/_project_spec.py +566 -0
  312. wandb/sdk/launch/agent/__init__.py +5 -0
  313. wandb/sdk/launch/agent/agent.py +924 -0
  314. wandb/sdk/launch/agent/config.py +296 -0
  315. wandb/sdk/launch/agent/job_status_tracker.py +53 -0
  316. wandb/sdk/launch/agent/run_queue_item_file_saver.py +45 -0
  317. wandb/sdk/launch/builder/__init__.py +0 -0
  318. wandb/sdk/launch/builder/abstract.py +156 -0
  319. wandb/sdk/launch/builder/build.py +297 -0
  320. wandb/sdk/launch/builder/context_manager.py +235 -0
  321. wandb/sdk/launch/builder/docker_builder.py +177 -0
  322. wandb/sdk/launch/builder/kaniko_builder.py +595 -0
  323. wandb/sdk/launch/builder/noop.py +58 -0
  324. wandb/sdk/launch/builder/templates/_wandb_bootstrap.py +188 -0
  325. wandb/sdk/launch/builder/templates/dockerfile.py +92 -0
  326. wandb/sdk/launch/create_job.py +528 -0
  327. wandb/sdk/launch/environment/abstract.py +29 -0
  328. wandb/sdk/launch/environment/aws_environment.py +322 -0
  329. wandb/sdk/launch/environment/azure_environment.py +105 -0
  330. wandb/sdk/launch/environment/gcp_environment.py +335 -0
  331. wandb/sdk/launch/environment/local_environment.py +66 -0
  332. wandb/sdk/launch/errors.py +19 -0
  333. wandb/sdk/launch/git_reference.py +109 -0
  334. wandb/sdk/launch/inputs/files.py +148 -0
  335. wandb/sdk/launch/inputs/internal.py +315 -0
  336. wandb/sdk/launch/inputs/manage.py +113 -0
  337. wandb/sdk/launch/inputs/schema.py +39 -0
  338. wandb/sdk/launch/loader.py +249 -0
  339. wandb/sdk/launch/registry/abstract.py +48 -0
  340. wandb/sdk/launch/registry/anon.py +29 -0
  341. wandb/sdk/launch/registry/azure_container_registry.py +124 -0
  342. wandb/sdk/launch/registry/elastic_container_registry.py +192 -0
  343. wandb/sdk/launch/registry/google_artifact_registry.py +219 -0
  344. wandb/sdk/launch/registry/local_registry.py +67 -0
  345. wandb/sdk/launch/runner/__init__.py +0 -0
  346. wandb/sdk/launch/runner/abstract.py +195 -0
  347. wandb/sdk/launch/runner/kubernetes_monitor.py +474 -0
  348. wandb/sdk/launch/runner/kubernetes_runner.py +963 -0
  349. wandb/sdk/launch/runner/local_container.py +301 -0
  350. wandb/sdk/launch/runner/local_process.py +78 -0
  351. wandb/sdk/launch/runner/sagemaker_runner.py +426 -0
  352. wandb/sdk/launch/runner/vertex_runner.py +230 -0
  353. wandb/sdk/launch/sweeps/__init__.py +39 -0
  354. wandb/sdk/launch/sweeps/scheduler.py +742 -0
  355. wandb/sdk/launch/sweeps/scheduler_sweep.py +91 -0
  356. wandb/sdk/launch/sweeps/utils.py +316 -0
  357. wandb/sdk/launch/utils.py +746 -0
  358. wandb/sdk/launch/wandb_reference.py +138 -0
  359. wandb/sdk/lib/__init__.py +5 -0
  360. wandb/sdk/lib/_settings_toposort_generate.py +159 -0
  361. wandb/sdk/lib/_settings_toposort_generated.py +249 -0
  362. wandb/sdk/lib/_wburls_generate.py +25 -0
  363. wandb/sdk/lib/_wburls_generated.py +22 -0
  364. wandb/sdk/lib/apikey.py +273 -0
  365. wandb/sdk/lib/capped_dict.py +26 -0
  366. wandb/sdk/lib/config_util.py +101 -0
  367. wandb/sdk/lib/credentials.py +141 -0
  368. wandb/sdk/lib/deprecate.py +42 -0
  369. wandb/sdk/lib/disabled.py +29 -0
  370. wandb/sdk/lib/exit_hooks.py +54 -0
  371. wandb/sdk/lib/file_stream_utils.py +118 -0
  372. wandb/sdk/lib/filenames.py +64 -0
  373. wandb/sdk/lib/filesystem.py +372 -0
  374. wandb/sdk/lib/fsm.py +174 -0
  375. wandb/sdk/lib/gitlib.py +239 -0
  376. wandb/sdk/lib/gql_request.py +65 -0
  377. wandb/sdk/lib/handler_util.py +21 -0
  378. wandb/sdk/lib/hashutil.py +62 -0
  379. wandb/sdk/lib/import_hooks.py +275 -0
  380. wandb/sdk/lib/ipython.py +146 -0
  381. wandb/sdk/lib/json_util.py +80 -0
  382. wandb/sdk/lib/lazyloader.py +63 -0
  383. wandb/sdk/lib/mailbox.py +460 -0
  384. wandb/sdk/lib/module.py +69 -0
  385. wandb/sdk/lib/paths.py +106 -0
  386. wandb/sdk/lib/preinit.py +42 -0
  387. wandb/sdk/lib/printer.py +313 -0
  388. wandb/sdk/lib/proto_util.py +90 -0
  389. wandb/sdk/lib/redirect.py +845 -0
  390. wandb/sdk/lib/reporting.py +99 -0
  391. wandb/sdk/lib/retry.py +289 -0
  392. wandb/sdk/lib/run_moment.py +78 -0
  393. wandb/sdk/lib/runid.py +12 -0
  394. wandb/sdk/lib/server.py +52 -0
  395. wandb/sdk/lib/sock_client.py +291 -0
  396. wandb/sdk/lib/sparkline.py +45 -0
  397. wandb/sdk/lib/telemetry.py +100 -0
  398. wandb/sdk/lib/timed_input.py +133 -0
  399. wandb/sdk/lib/timer.py +19 -0
  400. wandb/sdk/lib/tracelog.py +255 -0
  401. wandb/sdk/lib/viz.py +123 -0
  402. wandb/sdk/lib/wburls.py +46 -0
  403. wandb/sdk/service/__init__.py +0 -0
  404. wandb/sdk/service/_startup_debug.py +22 -0
  405. wandb/sdk/service/port_file.py +53 -0
  406. wandb/sdk/service/server.py +119 -0
  407. wandb/sdk/service/server_sock.py +276 -0
  408. wandb/sdk/service/service.py +264 -0
  409. wandb/sdk/service/service_base.py +50 -0
  410. wandb/sdk/service/service_sock.py +70 -0
  411. wandb/sdk/service/streams.py +417 -0
  412. wandb/sdk/verify/__init__.py +0 -0
  413. wandb/sdk/verify/verify.py +501 -0
  414. wandb/sdk/wandb_alerts.py +12 -0
  415. wandb/sdk/wandb_config.py +322 -0
  416. wandb/sdk/wandb_helper.py +54 -0
  417. wandb/sdk/wandb_init.py +1256 -0
  418. wandb/sdk/wandb_login.py +349 -0
  419. wandb/sdk/wandb_manager.py +232 -0
  420. wandb/sdk/wandb_metric.py +110 -0
  421. wandb/sdk/wandb_require.py +97 -0
  422. wandb/sdk/wandb_require_helpers.py +44 -0
  423. wandb/sdk/wandb_run.py +4231 -0
  424. wandb/sdk/wandb_settings.py +1999 -0
  425. wandb/sdk/wandb_setup.py +400 -0
  426. wandb/sdk/wandb_summary.py +150 -0
  427. wandb/sdk/wandb_sweep.py +119 -0
  428. wandb/sdk/wandb_sync.py +75 -0
  429. wandb/sdk/wandb_watch.py +128 -0
  430. wandb/sklearn.py +35 -0
  431. wandb/sync/__init__.py +3 -0
  432. wandb/sync/sync.py +443 -0
  433. wandb/trigger.py +29 -0
  434. wandb/util.py +1949 -0
  435. wandb/vendor/__init__.py +0 -0
  436. wandb/vendor/gql-0.2.0/setup.py +40 -0
  437. wandb/vendor/gql-0.2.0/tests/__init__.py +0 -0
  438. wandb/vendor/gql-0.2.0/tests/starwars/__init__.py +0 -0
  439. wandb/vendor/gql-0.2.0/tests/starwars/fixtures.py +96 -0
  440. wandb/vendor/gql-0.2.0/tests/starwars/schema.py +146 -0
  441. wandb/vendor/gql-0.2.0/tests/starwars/test_dsl.py +293 -0
  442. wandb/vendor/gql-0.2.0/tests/starwars/test_query.py +355 -0
  443. wandb/vendor/gql-0.2.0/tests/starwars/test_validation.py +171 -0
  444. wandb/vendor/gql-0.2.0/tests/test_client.py +31 -0
  445. wandb/vendor/gql-0.2.0/tests/test_transport.py +89 -0
  446. wandb/vendor/gql-0.2.0/wandb_gql/__init__.py +4 -0
  447. wandb/vendor/gql-0.2.0/wandb_gql/client.py +75 -0
  448. wandb/vendor/gql-0.2.0/wandb_gql/dsl.py +152 -0
  449. wandb/vendor/gql-0.2.0/wandb_gql/gql.py +10 -0
  450. wandb/vendor/gql-0.2.0/wandb_gql/transport/__init__.py +0 -0
  451. wandb/vendor/gql-0.2.0/wandb_gql/transport/http.py +6 -0
  452. wandb/vendor/gql-0.2.0/wandb_gql/transport/local_schema.py +15 -0
  453. wandb/vendor/gql-0.2.0/wandb_gql/transport/requests.py +46 -0
  454. wandb/vendor/gql-0.2.0/wandb_gql/utils.py +21 -0
  455. wandb/vendor/graphql-core-1.1/setup.py +86 -0
  456. wandb/vendor/graphql-core-1.1/wandb_graphql/__init__.py +287 -0
  457. wandb/vendor/graphql-core-1.1/wandb_graphql/error/__init__.py +6 -0
  458. wandb/vendor/graphql-core-1.1/wandb_graphql/error/base.py +42 -0
  459. wandb/vendor/graphql-core-1.1/wandb_graphql/error/format_error.py +11 -0
  460. wandb/vendor/graphql-core-1.1/wandb_graphql/error/located_error.py +29 -0
  461. wandb/vendor/graphql-core-1.1/wandb_graphql/error/syntax_error.py +36 -0
  462. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/__init__.py +26 -0
  463. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/base.py +311 -0
  464. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/executor.py +398 -0
  465. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/executors/__init__.py +0 -0
  466. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/executors/asyncio.py +53 -0
  467. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/executors/gevent.py +22 -0
  468. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/executors/process.py +32 -0
  469. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/executors/sync.py +7 -0
  470. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/executors/thread.py +35 -0
  471. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/executors/utils.py +6 -0
  472. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/experimental/__init__.py +0 -0
  473. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/experimental/executor.py +66 -0
  474. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/experimental/fragment.py +252 -0
  475. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/experimental/resolver.py +151 -0
  476. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/experimental/utils.py +7 -0
  477. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/middleware.py +57 -0
  478. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/values.py +145 -0
  479. wandb/vendor/graphql-core-1.1/wandb_graphql/graphql.py +60 -0
  480. wandb/vendor/graphql-core-1.1/wandb_graphql/language/__init__.py +0 -0
  481. wandb/vendor/graphql-core-1.1/wandb_graphql/language/ast.py +1349 -0
  482. wandb/vendor/graphql-core-1.1/wandb_graphql/language/base.py +19 -0
  483. wandb/vendor/graphql-core-1.1/wandb_graphql/language/lexer.py +435 -0
  484. wandb/vendor/graphql-core-1.1/wandb_graphql/language/location.py +30 -0
  485. wandb/vendor/graphql-core-1.1/wandb_graphql/language/parser.py +779 -0
  486. wandb/vendor/graphql-core-1.1/wandb_graphql/language/printer.py +193 -0
  487. wandb/vendor/graphql-core-1.1/wandb_graphql/language/source.py +18 -0
  488. wandb/vendor/graphql-core-1.1/wandb_graphql/language/visitor.py +222 -0
  489. wandb/vendor/graphql-core-1.1/wandb_graphql/language/visitor_meta.py +82 -0
  490. wandb/vendor/graphql-core-1.1/wandb_graphql/pyutils/__init__.py +0 -0
  491. wandb/vendor/graphql-core-1.1/wandb_graphql/pyutils/cached_property.py +17 -0
  492. wandb/vendor/graphql-core-1.1/wandb_graphql/pyutils/contain_subset.py +28 -0
  493. wandb/vendor/graphql-core-1.1/wandb_graphql/pyutils/default_ordered_dict.py +40 -0
  494. wandb/vendor/graphql-core-1.1/wandb_graphql/pyutils/ordereddict.py +8 -0
  495. wandb/vendor/graphql-core-1.1/wandb_graphql/pyutils/pair_set.py +43 -0
  496. wandb/vendor/graphql-core-1.1/wandb_graphql/pyutils/version.py +78 -0
  497. wandb/vendor/graphql-core-1.1/wandb_graphql/type/__init__.py +67 -0
  498. wandb/vendor/graphql-core-1.1/wandb_graphql/type/definition.py +619 -0
  499. wandb/vendor/graphql-core-1.1/wandb_graphql/type/directives.py +132 -0
  500. wandb/vendor/graphql-core-1.1/wandb_graphql/type/introspection.py +440 -0
  501. wandb/vendor/graphql-core-1.1/wandb_graphql/type/scalars.py +131 -0
  502. wandb/vendor/graphql-core-1.1/wandb_graphql/type/schema.py +100 -0
  503. wandb/vendor/graphql-core-1.1/wandb_graphql/type/typemap.py +145 -0
  504. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/__init__.py +0 -0
  505. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/assert_valid_name.py +9 -0
  506. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/ast_from_value.py +65 -0
  507. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/ast_to_code.py +49 -0
  508. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/ast_to_dict.py +24 -0
  509. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/base.py +75 -0
  510. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/build_ast_schema.py +291 -0
  511. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/build_client_schema.py +250 -0
  512. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/concat_ast.py +9 -0
  513. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/extend_schema.py +357 -0
  514. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/get_field_def.py +27 -0
  515. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/get_operation_ast.py +21 -0
  516. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/introspection_query.py +90 -0
  517. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/is_valid_literal_value.py +67 -0
  518. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/is_valid_value.py +66 -0
  519. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/quoted_or_list.py +21 -0
  520. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/schema_printer.py +168 -0
  521. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/suggestion_list.py +56 -0
  522. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/type_comparators.py +69 -0
  523. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/type_from_ast.py +21 -0
  524. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/type_info.py +149 -0
  525. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/value_from_ast.py +69 -0
  526. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/__init__.py +4 -0
  527. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/__init__.py +79 -0
  528. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/arguments_of_correct_type.py +24 -0
  529. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/base.py +8 -0
  530. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/default_values_of_correct_type.py +44 -0
  531. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/fields_on_correct_type.py +113 -0
  532. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/fragments_on_composite_types.py +33 -0
  533. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/known_argument_names.py +70 -0
  534. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/known_directives.py +97 -0
  535. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/known_fragment_names.py +19 -0
  536. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/known_type_names.py +43 -0
  537. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/lone_anonymous_operation.py +23 -0
  538. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/no_fragment_cycles.py +59 -0
  539. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/no_undefined_variables.py +36 -0
  540. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/no_unused_fragments.py +38 -0
  541. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/no_unused_variables.py +37 -0
  542. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/overlapping_fields_can_be_merged.py +529 -0
  543. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/possible_fragment_spreads.py +44 -0
  544. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/provided_non_null_arguments.py +46 -0
  545. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/scalar_leafs.py +33 -0
  546. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/unique_argument_names.py +32 -0
  547. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/unique_fragment_names.py +28 -0
  548. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/unique_input_field_names.py +33 -0
  549. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/unique_operation_names.py +31 -0
  550. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/unique_variable_names.py +27 -0
  551. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/variables_are_input_types.py +21 -0
  552. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/variables_in_allowed_position.py +53 -0
  553. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/validation.py +158 -0
  554. wandb/vendor/promise-2.3.0/conftest.py +30 -0
  555. wandb/vendor/promise-2.3.0/setup.py +64 -0
  556. wandb/vendor/promise-2.3.0/tests/__init__.py +0 -0
  557. wandb/vendor/promise-2.3.0/tests/conftest.py +8 -0
  558. wandb/vendor/promise-2.3.0/tests/test_awaitable.py +32 -0
  559. wandb/vendor/promise-2.3.0/tests/test_awaitable_35.py +47 -0
  560. wandb/vendor/promise-2.3.0/tests/test_benchmark.py +116 -0
  561. wandb/vendor/promise-2.3.0/tests/test_complex_threads.py +23 -0
  562. wandb/vendor/promise-2.3.0/tests/test_dataloader.py +452 -0
  563. wandb/vendor/promise-2.3.0/tests/test_dataloader_awaitable_35.py +99 -0
  564. wandb/vendor/promise-2.3.0/tests/test_dataloader_extra.py +65 -0
  565. wandb/vendor/promise-2.3.0/tests/test_extra.py +670 -0
  566. wandb/vendor/promise-2.3.0/tests/test_issues.py +132 -0
  567. wandb/vendor/promise-2.3.0/tests/test_promise_list.py +70 -0
  568. wandb/vendor/promise-2.3.0/tests/test_spec.py +584 -0
  569. wandb/vendor/promise-2.3.0/tests/test_thread_safety.py +115 -0
  570. wandb/vendor/promise-2.3.0/tests/utils.py +3 -0
  571. wandb/vendor/promise-2.3.0/wandb_promise/__init__.py +38 -0
  572. wandb/vendor/promise-2.3.0/wandb_promise/async_.py +135 -0
  573. wandb/vendor/promise-2.3.0/wandb_promise/compat.py +32 -0
  574. wandb/vendor/promise-2.3.0/wandb_promise/dataloader.py +326 -0
  575. wandb/vendor/promise-2.3.0/wandb_promise/iterate_promise.py +12 -0
  576. wandb/vendor/promise-2.3.0/wandb_promise/promise.py +848 -0
  577. wandb/vendor/promise-2.3.0/wandb_promise/promise_list.py +151 -0
  578. wandb/vendor/promise-2.3.0/wandb_promise/pyutils/__init__.py +0 -0
  579. wandb/vendor/promise-2.3.0/wandb_promise/pyutils/version.py +83 -0
  580. wandb/vendor/promise-2.3.0/wandb_promise/schedulers/__init__.py +0 -0
  581. wandb/vendor/promise-2.3.0/wandb_promise/schedulers/asyncio.py +22 -0
  582. wandb/vendor/promise-2.3.0/wandb_promise/schedulers/gevent.py +21 -0
  583. wandb/vendor/promise-2.3.0/wandb_promise/schedulers/immediate.py +27 -0
  584. wandb/vendor/promise-2.3.0/wandb_promise/schedulers/thread.py +18 -0
  585. wandb/vendor/promise-2.3.0/wandb_promise/utils.py +56 -0
  586. wandb/vendor/pygments/__init__.py +90 -0
  587. wandb/vendor/pygments/cmdline.py +568 -0
  588. wandb/vendor/pygments/console.py +74 -0
  589. wandb/vendor/pygments/filter.py +74 -0
  590. wandb/vendor/pygments/filters/__init__.py +350 -0
  591. wandb/vendor/pygments/formatter.py +95 -0
  592. wandb/vendor/pygments/formatters/__init__.py +153 -0
  593. wandb/vendor/pygments/formatters/_mapping.py +85 -0
  594. wandb/vendor/pygments/formatters/bbcode.py +109 -0
  595. wandb/vendor/pygments/formatters/html.py +851 -0
  596. wandb/vendor/pygments/formatters/img.py +600 -0
  597. wandb/vendor/pygments/formatters/irc.py +182 -0
  598. wandb/vendor/pygments/formatters/latex.py +482 -0
  599. wandb/vendor/pygments/formatters/other.py +160 -0
  600. wandb/vendor/pygments/formatters/rtf.py +147 -0
  601. wandb/vendor/pygments/formatters/svg.py +153 -0
  602. wandb/vendor/pygments/formatters/terminal.py +136 -0
  603. wandb/vendor/pygments/formatters/terminal256.py +309 -0
  604. wandb/vendor/pygments/lexer.py +871 -0
  605. wandb/vendor/pygments/lexers/__init__.py +329 -0
  606. wandb/vendor/pygments/lexers/_asy_builtins.py +1645 -0
  607. wandb/vendor/pygments/lexers/_cl_builtins.py +232 -0
  608. wandb/vendor/pygments/lexers/_cocoa_builtins.py +72 -0
  609. wandb/vendor/pygments/lexers/_csound_builtins.py +1346 -0
  610. wandb/vendor/pygments/lexers/_lasso_builtins.py +5327 -0
  611. wandb/vendor/pygments/lexers/_lua_builtins.py +295 -0
  612. wandb/vendor/pygments/lexers/_mapping.py +500 -0
  613. wandb/vendor/pygments/lexers/_mql_builtins.py +1172 -0
  614. wandb/vendor/pygments/lexers/_openedge_builtins.py +2547 -0
  615. wandb/vendor/pygments/lexers/_php_builtins.py +4756 -0
  616. wandb/vendor/pygments/lexers/_postgres_builtins.py +621 -0
  617. wandb/vendor/pygments/lexers/_scilab_builtins.py +3094 -0
  618. wandb/vendor/pygments/lexers/_sourcemod_builtins.py +1163 -0
  619. wandb/vendor/pygments/lexers/_stan_builtins.py +532 -0
  620. wandb/vendor/pygments/lexers/_stata_builtins.py +419 -0
  621. wandb/vendor/pygments/lexers/_tsql_builtins.py +1004 -0
  622. wandb/vendor/pygments/lexers/_vim_builtins.py +1939 -0
  623. wandb/vendor/pygments/lexers/actionscript.py +240 -0
  624. wandb/vendor/pygments/lexers/agile.py +24 -0
  625. wandb/vendor/pygments/lexers/algebra.py +221 -0
  626. wandb/vendor/pygments/lexers/ambient.py +76 -0
  627. wandb/vendor/pygments/lexers/ampl.py +87 -0
  628. wandb/vendor/pygments/lexers/apl.py +101 -0
  629. wandb/vendor/pygments/lexers/archetype.py +318 -0
  630. wandb/vendor/pygments/lexers/asm.py +641 -0
  631. wandb/vendor/pygments/lexers/automation.py +374 -0
  632. wandb/vendor/pygments/lexers/basic.py +500 -0
  633. wandb/vendor/pygments/lexers/bibtex.py +160 -0
  634. wandb/vendor/pygments/lexers/business.py +612 -0
  635. wandb/vendor/pygments/lexers/c_cpp.py +252 -0
  636. wandb/vendor/pygments/lexers/c_like.py +541 -0
  637. wandb/vendor/pygments/lexers/capnproto.py +78 -0
  638. wandb/vendor/pygments/lexers/chapel.py +102 -0
  639. wandb/vendor/pygments/lexers/clean.py +288 -0
  640. wandb/vendor/pygments/lexers/compiled.py +34 -0
  641. wandb/vendor/pygments/lexers/configs.py +833 -0
  642. wandb/vendor/pygments/lexers/console.py +114 -0
  643. wandb/vendor/pygments/lexers/crystal.py +393 -0
  644. wandb/vendor/pygments/lexers/csound.py +366 -0
  645. wandb/vendor/pygments/lexers/css.py +689 -0
  646. wandb/vendor/pygments/lexers/d.py +251 -0
  647. wandb/vendor/pygments/lexers/dalvik.py +125 -0
  648. wandb/vendor/pygments/lexers/data.py +555 -0
  649. wandb/vendor/pygments/lexers/diff.py +165 -0
  650. wandb/vendor/pygments/lexers/dotnet.py +691 -0
  651. wandb/vendor/pygments/lexers/dsls.py +878 -0
  652. wandb/vendor/pygments/lexers/dylan.py +289 -0
  653. wandb/vendor/pygments/lexers/ecl.py +125 -0
  654. wandb/vendor/pygments/lexers/eiffel.py +65 -0
  655. wandb/vendor/pygments/lexers/elm.py +121 -0
  656. wandb/vendor/pygments/lexers/erlang.py +533 -0
  657. wandb/vendor/pygments/lexers/esoteric.py +277 -0
  658. wandb/vendor/pygments/lexers/ezhil.py +69 -0
  659. wandb/vendor/pygments/lexers/factor.py +344 -0
  660. wandb/vendor/pygments/lexers/fantom.py +250 -0
  661. wandb/vendor/pygments/lexers/felix.py +273 -0
  662. wandb/vendor/pygments/lexers/forth.py +177 -0
  663. wandb/vendor/pygments/lexers/fortran.py +205 -0
  664. wandb/vendor/pygments/lexers/foxpro.py +428 -0
  665. wandb/vendor/pygments/lexers/functional.py +21 -0
  666. wandb/vendor/pygments/lexers/go.py +101 -0
  667. wandb/vendor/pygments/lexers/grammar_notation.py +213 -0
  668. wandb/vendor/pygments/lexers/graph.py +80 -0
  669. wandb/vendor/pygments/lexers/graphics.py +553 -0
  670. wandb/vendor/pygments/lexers/haskell.py +843 -0
  671. wandb/vendor/pygments/lexers/haxe.py +936 -0
  672. wandb/vendor/pygments/lexers/hdl.py +382 -0
  673. wandb/vendor/pygments/lexers/hexdump.py +103 -0
  674. wandb/vendor/pygments/lexers/html.py +602 -0
  675. wandb/vendor/pygments/lexers/idl.py +270 -0
  676. wandb/vendor/pygments/lexers/igor.py +288 -0
  677. wandb/vendor/pygments/lexers/inferno.py +96 -0
  678. wandb/vendor/pygments/lexers/installers.py +322 -0
  679. wandb/vendor/pygments/lexers/int_fiction.py +1343 -0
  680. wandb/vendor/pygments/lexers/iolang.py +63 -0
  681. wandb/vendor/pygments/lexers/j.py +146 -0
  682. wandb/vendor/pygments/lexers/javascript.py +1525 -0
  683. wandb/vendor/pygments/lexers/julia.py +333 -0
  684. wandb/vendor/pygments/lexers/jvm.py +1573 -0
  685. wandb/vendor/pygments/lexers/lisp.py +2621 -0
  686. wandb/vendor/pygments/lexers/make.py +202 -0
  687. wandb/vendor/pygments/lexers/markup.py +595 -0
  688. wandb/vendor/pygments/lexers/math.py +21 -0
  689. wandb/vendor/pygments/lexers/matlab.py +663 -0
  690. wandb/vendor/pygments/lexers/ml.py +769 -0
  691. wandb/vendor/pygments/lexers/modeling.py +358 -0
  692. wandb/vendor/pygments/lexers/modula2.py +1561 -0
  693. wandb/vendor/pygments/lexers/monte.py +204 -0
  694. wandb/vendor/pygments/lexers/ncl.py +894 -0
  695. wandb/vendor/pygments/lexers/nimrod.py +159 -0
  696. wandb/vendor/pygments/lexers/nit.py +64 -0
  697. wandb/vendor/pygments/lexers/nix.py +136 -0
  698. wandb/vendor/pygments/lexers/oberon.py +105 -0
  699. wandb/vendor/pygments/lexers/objective.py +504 -0
  700. wandb/vendor/pygments/lexers/ooc.py +85 -0
  701. wandb/vendor/pygments/lexers/other.py +41 -0
  702. wandb/vendor/pygments/lexers/parasail.py +79 -0
  703. wandb/vendor/pygments/lexers/parsers.py +835 -0
  704. wandb/vendor/pygments/lexers/pascal.py +644 -0
  705. wandb/vendor/pygments/lexers/pawn.py +199 -0
  706. wandb/vendor/pygments/lexers/perl.py +620 -0
  707. wandb/vendor/pygments/lexers/php.py +267 -0
  708. wandb/vendor/pygments/lexers/praat.py +294 -0
  709. wandb/vendor/pygments/lexers/prolog.py +306 -0
  710. wandb/vendor/pygments/lexers/python.py +939 -0
  711. wandb/vendor/pygments/lexers/qvt.py +152 -0
  712. wandb/vendor/pygments/lexers/r.py +453 -0
  713. wandb/vendor/pygments/lexers/rdf.py +270 -0
  714. wandb/vendor/pygments/lexers/rebol.py +431 -0
  715. wandb/vendor/pygments/lexers/resource.py +85 -0
  716. wandb/vendor/pygments/lexers/rnc.py +67 -0
  717. wandb/vendor/pygments/lexers/roboconf.py +82 -0
  718. wandb/vendor/pygments/lexers/robotframework.py +560 -0
  719. wandb/vendor/pygments/lexers/ruby.py +519 -0
  720. wandb/vendor/pygments/lexers/rust.py +220 -0
  721. wandb/vendor/pygments/lexers/sas.py +228 -0
  722. wandb/vendor/pygments/lexers/scripting.py +1222 -0
  723. wandb/vendor/pygments/lexers/shell.py +794 -0
  724. wandb/vendor/pygments/lexers/smalltalk.py +195 -0
  725. wandb/vendor/pygments/lexers/smv.py +79 -0
  726. wandb/vendor/pygments/lexers/snobol.py +83 -0
  727. wandb/vendor/pygments/lexers/special.py +103 -0
  728. wandb/vendor/pygments/lexers/sql.py +681 -0
  729. wandb/vendor/pygments/lexers/stata.py +108 -0
  730. wandb/vendor/pygments/lexers/supercollider.py +90 -0
  731. wandb/vendor/pygments/lexers/tcl.py +145 -0
  732. wandb/vendor/pygments/lexers/templates.py +2283 -0
  733. wandb/vendor/pygments/lexers/testing.py +207 -0
  734. wandb/vendor/pygments/lexers/text.py +25 -0
  735. wandb/vendor/pygments/lexers/textedit.py +169 -0
  736. wandb/vendor/pygments/lexers/textfmts.py +297 -0
  737. wandb/vendor/pygments/lexers/theorem.py +458 -0
  738. wandb/vendor/pygments/lexers/trafficscript.py +54 -0
  739. wandb/vendor/pygments/lexers/typoscript.py +226 -0
  740. wandb/vendor/pygments/lexers/urbi.py +133 -0
  741. wandb/vendor/pygments/lexers/varnish.py +190 -0
  742. wandb/vendor/pygments/lexers/verification.py +111 -0
  743. wandb/vendor/pygments/lexers/web.py +24 -0
  744. wandb/vendor/pygments/lexers/webmisc.py +988 -0
  745. wandb/vendor/pygments/lexers/whiley.py +116 -0
  746. wandb/vendor/pygments/lexers/x10.py +69 -0
  747. wandb/vendor/pygments/modeline.py +44 -0
  748. wandb/vendor/pygments/plugin.py +68 -0
  749. wandb/vendor/pygments/regexopt.py +92 -0
  750. wandb/vendor/pygments/scanner.py +105 -0
  751. wandb/vendor/pygments/sphinxext.py +158 -0
  752. wandb/vendor/pygments/style.py +155 -0
  753. wandb/vendor/pygments/styles/__init__.py +80 -0
  754. wandb/vendor/pygments/styles/abap.py +29 -0
  755. wandb/vendor/pygments/styles/algol.py +63 -0
  756. wandb/vendor/pygments/styles/algol_nu.py +63 -0
  757. wandb/vendor/pygments/styles/arduino.py +98 -0
  758. wandb/vendor/pygments/styles/autumn.py +65 -0
  759. wandb/vendor/pygments/styles/borland.py +51 -0
  760. wandb/vendor/pygments/styles/bw.py +49 -0
  761. wandb/vendor/pygments/styles/colorful.py +81 -0
  762. wandb/vendor/pygments/styles/default.py +73 -0
  763. wandb/vendor/pygments/styles/emacs.py +72 -0
  764. wandb/vendor/pygments/styles/friendly.py +72 -0
  765. wandb/vendor/pygments/styles/fruity.py +42 -0
  766. wandb/vendor/pygments/styles/igor.py +29 -0
  767. wandb/vendor/pygments/styles/lovelace.py +97 -0
  768. wandb/vendor/pygments/styles/manni.py +75 -0
  769. wandb/vendor/pygments/styles/monokai.py +106 -0
  770. wandb/vendor/pygments/styles/murphy.py +80 -0
  771. wandb/vendor/pygments/styles/native.py +65 -0
  772. wandb/vendor/pygments/styles/paraiso_dark.py +125 -0
  773. wandb/vendor/pygments/styles/paraiso_light.py +125 -0
  774. wandb/vendor/pygments/styles/pastie.py +75 -0
  775. wandb/vendor/pygments/styles/perldoc.py +69 -0
  776. wandb/vendor/pygments/styles/rainbow_dash.py +89 -0
  777. wandb/vendor/pygments/styles/rrt.py +33 -0
  778. wandb/vendor/pygments/styles/sas.py +44 -0
  779. wandb/vendor/pygments/styles/stata.py +40 -0
  780. wandb/vendor/pygments/styles/tango.py +141 -0
  781. wandb/vendor/pygments/styles/trac.py +63 -0
  782. wandb/vendor/pygments/styles/vim.py +63 -0
  783. wandb/vendor/pygments/styles/vs.py +38 -0
  784. wandb/vendor/pygments/styles/xcode.py +51 -0
  785. wandb/vendor/pygments/token.py +213 -0
  786. wandb/vendor/pygments/unistring.py +217 -0
  787. wandb/vendor/pygments/util.py +388 -0
  788. wandb/vendor/pynvml/__init__.py +0 -0
  789. wandb/vendor/pynvml/pynvml.py +4779 -0
  790. wandb/vendor/watchdog_0_9_0/wandb_watchdog/__init__.py +17 -0
  791. wandb/vendor/watchdog_0_9_0/wandb_watchdog/events.py +615 -0
  792. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/__init__.py +98 -0
  793. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/api.py +369 -0
  794. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/fsevents.py +172 -0
  795. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/fsevents2.py +239 -0
  796. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/inotify.py +218 -0
  797. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/inotify_buffer.py +81 -0
  798. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/inotify_c.py +575 -0
  799. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/kqueue.py +730 -0
  800. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/polling.py +145 -0
  801. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/read_directory_changes.py +133 -0
  802. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/winapi.py +348 -0
  803. wandb/vendor/watchdog_0_9_0/wandb_watchdog/patterns.py +265 -0
  804. wandb/vendor/watchdog_0_9_0/wandb_watchdog/tricks/__init__.py +174 -0
  805. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/__init__.py +151 -0
  806. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/bricks.py +249 -0
  807. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/compat.py +29 -0
  808. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/decorators.py +198 -0
  809. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/delayed_queue.py +88 -0
  810. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/dirsnapshot.py +293 -0
  811. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/echo.py +157 -0
  812. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/event_backport.py +41 -0
  813. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/importlib2.py +40 -0
  814. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/platform.py +57 -0
  815. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/unicode_paths.py +64 -0
  816. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/win32stat.py +123 -0
  817. wandb/vendor/watchdog_0_9_0/wandb_watchdog/version.py +28 -0
  818. wandb/vendor/watchdog_0_9_0/wandb_watchdog/watchmedo.py +577 -0
  819. wandb/wandb_agent.py +588 -0
  820. wandb/wandb_controller.py +721 -0
  821. wandb/wandb_run.py +9 -0
  822. wandb-0.18.1.dist-info/METADATA +212 -0
  823. wandb-0.18.1.dist-info/RECORD +826 -0
  824. wandb-0.18.1.dist-info/WHEEL +4 -0
  825. wandb-0.18.1.dist-info/entry_points.txt +3 -0
  826. wandb-0.18.1.dist-info/licenses/LICENSE +21 -0
@@ -0,0 +1,1729 @@
1
+ """sender."""
2
+
3
+ import contextlib
4
+ import gzip
5
+ import json
6
+ import logging
7
+ import os
8
+ import queue
9
+ import sys
10
+ import threading
11
+ import time
12
+ import traceback
13
+ from collections import defaultdict
14
+ from datetime import datetime
15
+ from queue import Queue
16
+ from typing import (
17
+ TYPE_CHECKING,
18
+ Any,
19
+ Dict,
20
+ Generator,
21
+ List,
22
+ Optional,
23
+ Tuple,
24
+ Type,
25
+ Union,
26
+ )
27
+
28
+ import requests
29
+
30
+ import wandb
31
+ from wandb import util
32
+ from wandb.errors import CommError, UsageError
33
+ from wandb.errors.util import ProtobufErrorHandler
34
+ from wandb.filesync.dir_watcher import DirWatcher
35
+ from wandb.proto import wandb_internal_pb2
36
+ from wandb.sdk.artifacts.artifact_saver import ArtifactSaver
37
+ from wandb.sdk.interface import interface
38
+ from wandb.sdk.interface.interface_queue import InterfaceQueue
39
+ from wandb.sdk.internal import (
40
+ context,
41
+ datastore,
42
+ file_stream,
43
+ internal_api,
44
+ sender_config,
45
+ update,
46
+ )
47
+ from wandb.sdk.internal.file_pusher import FilePusher
48
+ from wandb.sdk.internal.job_builder import JobBuilder
49
+ from wandb.sdk.internal.settings_static import SettingsStatic
50
+ from wandb.sdk.lib import (
51
+ config_util,
52
+ filenames,
53
+ filesystem,
54
+ printer,
55
+ proto_util,
56
+ redirect,
57
+ telemetry,
58
+ tracelog,
59
+ )
60
+ from wandb.sdk.lib.mailbox import ContextCancelledError
61
+ from wandb.sdk.lib.proto_util import message_to_dict
62
+
63
+ if sys.version_info >= (3, 8):
64
+ from typing import Literal
65
+ else:
66
+ from typing_extensions import Literal
67
+
68
+ if TYPE_CHECKING:
69
+ from wandb.proto.wandb_internal_pb2 import (
70
+ ArtifactManifest,
71
+ ArtifactManifestEntry,
72
+ ArtifactRecord,
73
+ HttpResponse,
74
+ LocalInfo,
75
+ Record,
76
+ Result,
77
+ RunExitResult,
78
+ RunRecord,
79
+ SummaryRecord,
80
+ )
81
+
82
+ StreamLiterals = Literal["stdout", "stderr"]
83
+
84
+
85
+ logger = logging.getLogger(__name__)
86
+
87
+
88
+ _OUTPUT_MIN_CALLBACK_INTERVAL = 2 # seconds
89
+
90
+
91
+ def _framework_priority() -> Generator[Tuple[str, str], None, None]:
92
+ yield from [
93
+ ("lightgbm", "lightgbm"),
94
+ ("catboost", "catboost"),
95
+ ("xgboost", "xgboost"),
96
+ ("transformers_huggingface", "huggingface"), # backwards compatibility
97
+ ("transformers", "huggingface"),
98
+ ("pytorch_ignite", "ignite"), # backwards compatibility
99
+ ("ignite", "ignite"),
100
+ ("pytorch_lightning", "lightning"),
101
+ ("fastai", "fastai"),
102
+ ("torch", "torch"),
103
+ ("keras", "keras"),
104
+ ("tensorflow", "tensorflow"),
105
+ ("sklearn", "sklearn"),
106
+ ]
107
+
108
+
109
+ def _manifest_json_from_proto(manifest: "ArtifactManifest") -> Dict:
110
+ if manifest.version == 1:
111
+ if manifest.manifest_file_path:
112
+ contents = {}
113
+ with gzip.open(manifest.manifest_file_path, "rt") as f:
114
+ for line in f:
115
+ entry_json = json.loads(line)
116
+ path = entry_json.pop("path")
117
+ contents[path] = entry_json
118
+ else:
119
+ contents = {
120
+ content.path: _manifest_entry_from_proto(content)
121
+ for content in manifest.contents
122
+ }
123
+ else:
124
+ raise ValueError(f"unknown artifact manifest version: {manifest.version}")
125
+
126
+ return {
127
+ "version": manifest.version,
128
+ "storagePolicy": manifest.storage_policy,
129
+ "storagePolicyConfig": {
130
+ config.key: json.loads(config.value_json)
131
+ for config in manifest.storage_policy_config
132
+ },
133
+ "contents": contents,
134
+ }
135
+
136
+
137
+ def _manifest_entry_from_proto(entry: "ArtifactManifestEntry") -> Dict:
138
+ birth_artifact_id = entry.birth_artifact_id if entry.birth_artifact_id else None
139
+ return {
140
+ "digest": entry.digest,
141
+ "birthArtifactID": birth_artifact_id,
142
+ "ref": entry.ref if entry.ref else None,
143
+ "size": entry.size if entry.size is not None else None,
144
+ "local_path": entry.local_path if entry.local_path else None,
145
+ "skip_cache": entry.skip_cache,
146
+ "extra": {extra.key: json.loads(extra.value_json) for extra in entry.extra},
147
+ }
148
+
149
+
150
class ResumeState:
    """Plain container for the values tracked when a run is resumed.

    Every field starts at a neutral default (``False``, ``0`` or ``None``).
    """

    resumed: bool
    step: int
    history: int
    events: int
    output: int
    runtime: float
    wandb_runtime: Optional[int]
    summary: Optional[Dict[str, Any]]
    config: Optional[Dict[str, Any]]
    tags: Optional[List[str]]

    def __init__(self) -> None:
        # NOTE: assignment order determines the field order shown by __str__.
        self.resumed = False
        self.step = self.history = self.events = self.output = self.runtime = 0
        # wandb_runtime is the canonical runtime (stored in summary._wandb.runtime)
        self.wandb_runtime = self.summary = self.config = self.tags = None

    def __str__(self) -> str:
        """Return ``ResumeState(name=value,...)`` for all instance attributes."""
        fields = ",".join(f"{name}={value}" for name, value in vars(self).items())
        return f"ResumeState({fields})"
178
+
179
+
180
class _OutputRawStream:
    """Per-stream state for raw console output: a queue, an emulator, two threads.

    The writer and reader threads run the owning SendManager's
    ``_output_raw_writer_thread`` / ``_output_raw_reader_thread`` methods,
    each receiving the stream name as the ``stream`` keyword argument.
    """

    _stopped: threading.Event
    _queue: queue.Queue
    _emulator: redirect.TerminalEmulator
    _writer_thr: threading.Thread
    _reader_thr: threading.Thread

    def __init__(self, stream: str, sm: "SendManager"):
        self._stopped = threading.Event()
        self._queue = queue.Queue()
        self._emulator = redirect.TerminalEmulator()
        # Both workers are daemon threads; they are created here but only
        # started by start().
        self._writer_thr = threading.Thread(
            name=f"OutRawWr-{stream}",
            target=sm._output_raw_writer_thread,
            kwargs={"stream": stream},
            daemon=True,
        )
        self._reader_thr = threading.Thread(
            name=f"OutRawRd-{stream}",
            target=sm._output_raw_reader_thread,
            kwargs={"stream": stream},
            daemon=True,
        )

    def start(self) -> None:
        """Start the writer thread, then the reader thread."""
        for worker in (self._writer_thr, self._reader_thr):
            worker.start()
207
+
208
+
209
+ class SendManager:
210
+ UPDATE_CONFIG_TIME: int = 30
211
+ UPDATE_STATUS_TIME: int = 5
212
+
213
+ _settings: SettingsStatic
214
+ _record_q: "Queue[Record]"
215
+ _result_q: "Queue[Result]"
216
+ _interface: InterfaceQueue
217
+ _api_settings: Dict[str, str]
218
+ _partial_output: Dict[str, str]
219
+ _context_keeper: context.ContextKeeper
220
+
221
+ _telemetry_obj: telemetry.TelemetryRecord
222
+ _fs: Optional["file_stream.FileStreamApi"]
223
+ _run: Optional["RunRecord"]
224
+ _entity: Optional[str]
225
+ _project: Optional[str]
226
+ _dir_watcher: Optional["DirWatcher"]
227
+ _pusher: Optional["FilePusher"]
228
+ _record_exit: Optional["Record"]
229
+ _exit_result: Optional["RunExitResult"]
230
+ _resume_state: ResumeState
231
+ _rewind_response: Optional[Dict[str, Any]]
232
+ _cached_server_info: Dict[str, Any]
233
+ _cached_viewer: Dict[str, Any]
234
+ _server_messages: List[Dict[str, Any]]
235
+ _ds: Optional[datastore.DataStore]
236
+ _output_raw_streams: Dict["StreamLiterals", _OutputRawStream]
237
+ _output_raw_file: Optional[filesystem.CRDedupedFile]
238
+ _send_record_num: int
239
+ _send_end_offset: int
240
+ _debounce_config_time: float
241
+ _debounce_status_time: float
242
+
243
def __init__(
    self,
    settings: SettingsStatic,
    record_q: "Queue[Record]",
    result_q: "Queue[Result]",
    interface: InterfaceQueue,
    context_keeper: context.ContextKeeper,
) -> None:
    """Store the collaborators and reset all sender state to its defaults.

    Args:
        settings: static settings; also passed to the internal API and
            the job builder.
        record_q: queue of incoming records.
        result_q: queue that results are put on.
        interface: interface used to publish requests.
        context_keeper: keeper used to look up and release contexts.
    """
    self._settings = settings
    self._record_q = record_q
    self._result_q = result_q
    self._interface = interface
    self._context_keeper = context_keeper

    # transaction-log reading state
    self._ds = None
    self._send_record_num = 0
    self._send_end_offset = 0

    # created later, once they are needed
    self._fs = None
    self._pusher = None
    self._dir_watcher = None

    # State updated by login
    self._entity = None
    self._flags = None

    # State updated by wandb.init
    self._run = None
    self._project = None

    # keep track of config from key/val updates
    self._consolidated_config = sender_config.ConfigState()

    self._start_time: int = 0
    self._telemetry_obj = telemetry.TelemetryRecord()
    self._config_metric_pbdict_list: List[Dict[int, Any]] = []
    self._metadata_summary: Dict[str, Any] = defaultdict()
    self._cached_summary: Dict[str, Any] = {}
    self._config_metric_index_dict: Dict[str, int] = {}
    self._config_metric_dict: Dict[str, wandb_internal_pb2.MetricRecord] = {}
    self._consolidated_summary: Dict[str, Any] = {}

    self._cached_server_info = {}
    self._cached_viewer = {}
    self._server_messages = []

    # State updated by resuming
    self._resume_state = ResumeState()
    self._rewind_response = None

    # State added when run_exit is initiated and complete
    self._record_exit = None
    self._exit_result = None

    self._api = internal_api.Api(
        default_settings=settings,
        retry_callback=self.retry_callback,
    )
    self._api_settings = {}

    # queue filled by retry_callback
    self._retry_q: Queue[HttpResponse] = queue.Queue()

    # do we need to debounce?
    self._config_needs_debounce: bool = False

    # TODO(jhr): do something better, why do we need to send full lines?
    self._partial_output = {}

    self._exit_code = 0

    # internal vars for handling raw console output
    self._output_raw_streams = {}
    self._output_raw_file = None

    # job builder
    self._job_builder = JobBuilder(settings)

    # both debounce timers start from the same monotonic timestamp
    started_at = time.monotonic()
    self._debounce_config_time = started_at
    self._debounce_status_time = started_at
323
+
324
@classmethod
def setup(
    cls,
    root_dir: str,
    resume: Union[None, bool, str],
) -> "SendManager":
    """Set up a standalone SendManager.

    Currently, we're using this primarily for `sync.py`.

    Args:
        root_dir: root directory; the files directory is ``<root_dir>/files``.
        resume: forwarded unchanged as the ``resume`` setting.
    """
    sync_settings = wandb.Settings(
        files_dir=os.path.join(root_dir, "files"),
        root_dir=root_dir,
        resume=resume,
        _sync=True,
        disable_job_creation=False,
        _file_stream_timeout_seconds=0,
    )
    records: "Queue[Record]" = queue.Queue()
    results: "Queue[Result]" = queue.Queue()
    return SendManager(
        settings=SettingsStatic(sync_settings.to_proto()),
        record_q=records,
        result_q=results,
        # the publishing interface shares the record queue with the manager
        interface=InterfaceQueue(record_q=records),
        context_keeper=context.ContextKeeper(),
    )
356
+
357
+ def __len__(self) -> int:
358
+ return self._record_q.qsize()
359
+
360
+ def __enter__(self) -> "SendManager":
361
+ return self
362
+
363
def __exit__(
    self,
    exc_type: Optional[Type[BaseException]],
    exc_value: Optional[BaseException],
    exc_traceback: Optional[traceback.TracebackException],
) -> Literal[False]:
    """Send every remaining record, finish, and never suppress exceptions.

    The loop runs for as long as the manager is truthy and pulls each
    record with ``next(self)``.
    """
    while self:
        self.send(next(self))
    self.finish()
    # False tells the interpreter to propagate any in-flight exception.
    return False
374
+
375
def retry_callback(self, status: int, response_text: str) -> None:
    """Queue an HttpResponse message built from a status code and text.

    This method is handed to the internal API as its ``retry_callback``.
    """
    http_response = wandb_internal_pb2.HttpResponse(
        http_status_code=status,
        http_response_text=response_text,
    )
    self._retry_q.put(http_response)
380
+
381
def send(self, record: "Record") -> None:
    """Dispatch a record to the ``send_<record_type>`` method.

    Updates the record number and end offset first, then runs the handler
    with the API's local context set to the context for this record. A
    ContextCancelledError from the handler is logged and the context is
    released; the local context is cleared in all cases.
    """
    self._update_record_num(record.num)
    self._update_end_offset(record.control.end_offset)

    record_type = record.WhichOneof("record_type")
    assert record_type
    handler_str = "send_" + record_type
    handler = getattr(self, handler_str, None)
    # Don't log output to reduce log noise
    quiet_types = ("output", "request", "output_raw")
    if record_type not in quiet_types:
        logger.debug(f"send: {record_type}")
    assert handler, f"unknown send handler: {handler_str}"

    context_id = context.context_id_from_record(record)
    api_context = self._context_keeper.get(context_id)
    try:
        self._api.set_local_context(api_context)
        handler(record)
    except ContextCancelledError:
        logger.debug(f"Record cancelled: {record_type}")
        self._context_keeper.release(context_id)
    finally:
        self._api.clear_local_context()
404
+
405
+ def send_preempting(self, _: "Record") -> None:
406
+ if self._fs:
407
+ self._fs.enqueue_preempting()
408
+
409
+ def send_request_sender_mark(self, _: "Record") -> None:
410
+ self._maybe_report_status(always=True)
411
+
412
+ def send_request(self, record: "Record") -> None:
413
+ request_type = record.request.WhichOneof("request_type")
414
+ assert request_type
415
+ handler_str = "send_request_" + request_type
416
+ send_handler = getattr(self, handler_str, None)
417
+ if request_type != "network_status":
418
+ logger.debug(f"send_request: {request_type}")
419
+ assert send_handler, f"unknown handle: {handler_str}"
420
+ send_handler(record)
421
+
422
def _respond_result(self, result: "Result") -> None:
    """Trace the result, release its context, and put it on the result queue."""
    out_q = self._result_q
    tracelog.log_message_queue(result, out_q)
    # the context is released before the result is handed to the queue
    self._context_keeper.release(context.context_id_from_result(result))
    out_q.put(result)
427
+
428
+ def _flatten(self, dictionary: Dict) -> None:
429
+ if isinstance(dictionary, dict):
430
+ for k, v in list(dictionary.items()):
431
+ if isinstance(v, dict):
432
+ self._flatten(v)
433
+ dictionary.pop(k)
434
+ for k2, v2 in v.items():
435
+ dictionary[k + "." + k2] = v2
436
+
437
+ def _update_record_num(self, record_num: int) -> None:
438
+ if not record_num:
439
+ return
440
+ # Currently how we handle offline mode and syncing is not
441
+ # compatible with this assertion due to how the exit record
442
+ # is (mis)handled:
443
+ # - using "always_send" in offline mode to trigger defer
444
+ # state machine
445
+ # - skipping the exit record in `wandb sync` mode so that
446
+ # it is always executed as the last record
447
+ if not self._settings._offline and not self._settings._sync:
448
+ assert record_num == self._send_record_num + 1
449
+ self._send_record_num = record_num
450
+
451
+ def _update_end_offset(self, end_offset: int) -> None:
452
+ if not end_offset:
453
+ return
454
+ self._send_end_offset = end_offset
455
+
456
def send_request_sender_read(self, record: "Record") -> None:
    """Replay records from the sync file between two offsets.

    The datastore is opened on first use. Records are scanned starting at
    the request's ``start_offset`` and each one is passed to ``send`` until
    the datastore offset reaches ``final_offset``.
    """
    if self._ds is None:
        self._ds = datastore.DataStore()
        self._ds.open_for_scan(self._settings.sync_file)

    # TODO(cancel_paused): implement cancel_set logic
    # The idea is that there is an active request to cancel a
    # message that is being read from the transaction log below

    read_request = record.request.sender_read
    start_offset = read_request.start_offset
    final_offset = read_request.final_offset
    self._ds.seek(start_offset)

    reached_offset = 0
    while reached_offset < final_offset:
        raw = self._ds.scan_data()
        assert raw
        reached_offset = self._ds.get_offset()

        replayed = wandb_internal_pb2.Record()
        replayed.ParseFromString(raw)
        self._update_end_offset(reached_offset)
        self.send(replayed)

    # make sure we perform deferred operations
    self.debounce()

    # make sure that we always update the writer for every sender_read request
    self._maybe_report_status(always=True)
485
+
486
def send_request_check_version(self, record: "Record") -> None:
    """Respond with any upgrade, yank, or delete messages for a version.

    The version checked is the one given in the request, falling back to
    ``wandb.__version__`` when the request leaves it empty.
    """
    assert record.control.req_resp or record.control.mailbox_slot
    result = proto_util._result_from_record(record)
    requested_version = record.request.check_version.current_version
    current_version = requested_version or wandb.__version__
    messages = update.check_available(current_version)
    if messages:
        # Message keys and response field names are identical; only
        # non-empty messages are copied onto the response.
        for field_name in ("upgrade_message", "yank_message", "delete_message"):
            text = messages.get(field_name)
            if text:
                setattr(result.response.check_version_response, field_name, text)
    self._respond_result(result)
504
+
505
def send_request_stop_status(self, record: "Record") -> None:
    """Respond with whether the API reports a stop request for this run.

    ``run_should_stop`` stays False when entity, project, or run id is not
    known, or when the API call raises (the failure is only logged).
    """
    result = proto_util._result_from_record(record)
    status_resp = result.response.stop_status_response
    status_resp.run_should_stop = False
    run_is_identified = bool(
        self._entity and self._project and self._run and self._run.run_id
    )
    if run_is_identified:
        try:
            should_stop = self._api.check_stop_requested(
                self._project, self._entity, self._run.run_id
            )
            status_resp.run_should_stop = should_stop
        except Exception as e:
            # best effort: a failed check leaves the flag at False
            logger.warning("Failed to check stop requested status: %s", e)
    self._respond_result(result)
517
+
518
+ def _maybe_update_config(self, always: bool = False) -> None:
519
+ time_now = time.monotonic()
520
+ if (
521
+ not always
522
+ and time_now < self._debounce_config_time + self.UPDATE_CONFIG_TIME
523
+ ):
524
+ return
525
+ if self._config_needs_debounce:
526
+ self._debounce_config()
527
+ self._debounce_config_time = time_now
528
+
529
+ def _maybe_report_status(self, always: bool = False) -> None:
530
+ time_now = time.monotonic()
531
+ if (
532
+ not always
533
+ and time_now < self._debounce_status_time + self.UPDATE_STATUS_TIME
534
+ ):
535
+ return
536
+ self._debounce_status_time = time_now
537
+
538
+ status_report = wandb_internal_pb2.StatusReportRequest(
539
+ record_num=self._send_record_num,
540
+ sent_offset=self._send_end_offset,
541
+ )
542
+ status_time = time.time()
543
+ status_report.sync_time.FromMicroseconds(int(status_time * 1e6))
544
+ record = self._interface._make_request(status_report=status_report)
545
+ self._interface._publish(record)
546
+
547
def debounce(self, final: bool = False) -> None:
    """Run the rate-limited status report, then the rate-limited config update.

    Args:
        final: Forwarded as ``always`` so both run regardless of the rate limit.
    """
    for deferred_step in (self._maybe_report_status, self._maybe_update_config):
        deferred_step(always=final)
550
+
551
+ def _debounce_config(self) -> None:
552
+ config_value_dict = self._config_backend_dict()
553
+ # TODO(jhr): check result of upsert_run?
554
+ if self._run:
555
+ self._api.upsert_run(
556
+ name=self._run.run_id,
557
+ config=config_value_dict,
558
+ **self._api_settings, # type: ignore
559
+ )
560
+ self._config_save(config_value_dict)
561
+ self._config_needs_debounce = False
562
+
563
def send_request_network_status(self, record: "Record") -> None:
    """Drain the retry queue into a network-status response and send it."""
    result = proto_util._result_from_record(record)
    status_response = result.response.network_status_response
    draining = True
    while draining:
        try:
            queued = self._retry_q.get_nowait()
            status_response.network_responses.append(queued)
        except queue.Empty:
            draining = False
        except Exception as e:
            # Any other failure is logged and draining continues.
            logger.warning(f"Error emptying retry queue: {e}")
    self._respond_result(result)
574
+
575
def send_request_login(self, record: "Record") -> None:
    """Re-authenticate, record the viewer's entity and reply when asked to.

    A response is only sent when ``record.control.req_resp`` is set; the
    active entity is included when one is known.
    """
    # TODO: do something with api_key or anonymous?
    # TODO: return an error if we aren't logged in?
    self._api.reauth()
    viewer = self.get_viewer_info()
    server_info = self.get_server_info()
    if server_info:
        logger.info(f"Login server info: {server_info}")
    self._entity = viewer.get("entity")

    if not record.control.req_resp:
        return
    result = proto_util._result_from_record(record)
    if self._entity:
        result.response.login_response.active_entity = self._entity
    self._respond_result(result)
591
+
592
def send_exit(self, record: "Record") -> None:
    """Record the run's exit code and runtime, then start the defer sequence."""
    # Remember the originating record so the final result can be routed back.
    self._record_exit = record

    exit_info = record.exit
    self._exit_code = exit_info.exit_code
    logger.info("handling exit code: %s", exit_info.exit_code)
    run_seconds = exit_info.runtime
    logger.info("handling runtime: %s", exit_info.runtime)
    self._metadata_summary["runtime"] = run_seconds
    self._update_summary()

    # The request queue needs a chance to empty between states, so the
    # defer requests are used as a state machine.
    logger.info("send defer")
    self._interface.publish_defer()
608
+
609
def send_final(self, record: "Record") -> None:
    """Accept a final record; nothing is done with it here."""
    return None
611
+
612
+ def _flush_run(self) -> None:
613
+ pass
614
+
615
def send_request_status_report(self, record: "Record") -> None:
    """Ignore status-report requests.

    todo? this is a no-op that exists only to please ``wandb sync``.
    """
    return None
618
+
619
def send_request_defer(self, record: "Record") -> None:  # noqa: C901
    """Handle one state of the defer (shutdown) state machine.

    Every state except ``END`` performs its flush work, if any, and then
    publishes a defer request for the following state. ``END`` builds the
    exit result and, when the exit record has a mailbox slot, responds to it.

    Raises:
        AssertionError: If the state is not one of the known defer states.
    """
    defer = record.request.defer
    state = defer.state
    logger.info(f"handle sender defer: {state}")

    def advance() -> None:
        following = defer.state + 1
        logger.info(f"send defer: {following}")
        self._interface.publish_defer(following)

    # States with no sender-side work. All but BEGIN are handled in
    # handler.py:handle_request_defer().
    passthrough_states = (
        defer.BEGIN,
        defer.FLUSH_STATS,
        defer.FLUSH_PARTIAL_HISTORY,
        defer.FLUSH_TB,
        defer.FLUSH_SUM,
    )

    if state != defer.END:
        if state in passthrough_states:
            advance()
        elif state == defer.FLUSH_RUN:
            self._flush_run()
            advance()
        elif state == defer.FLUSH_DEBOUNCER:
            self.debounce(final=True)
            advance()
        elif state == defer.FLUSH_OUTPUT:
            self._output_raw_finish()
            advance()
        elif state == defer.FLUSH_JOB:
            self._flush_job()
            advance()
        elif state == defer.FLUSH_DIR:
            if self._dir_watcher:
                self._dir_watcher.finish()
                self._dir_watcher = None
            advance()
        elif state == defer.FLUSH_FP:
            if self._pusher:
                # FilePusher generates some events for FileStreamApi, so the
                # pusher must finish before moving on; it is handed the
                # transition as a callback.
                self._pusher.finish(advance)
            else:
                advance()
        elif state == defer.JOIN_FP:
            if self._pusher:
                self._pusher.join()
            advance()
        elif state == defer.FLUSH_FS:
            if self._fs:
                # TODO(jhr): now is a good time to output pending output lines
                self._fs.finish(self._exit_code)
                self._fs = None
            advance()
        elif state == defer.FLUSH_FINAL:
            self._interface.publish_final()
            self._interface.publish_footer()
            advance()
        else:
            raise AssertionError("unknown state")
        return

    exit_result = wandb_internal_pb2.RunExitResult()

    # Mark exit done in case something is polling on exit.
    self._exit_result = exit_result

    # Report the response to the mailbox.
    if self._record_exit and self._record_exit.control.mailbox_slot:
        result = proto_util._result_from_record(self._record_exit)
        result.exit_result.CopyFrom(exit_result)
        self._respond_result(result)
702
+
703
def send_request_poll_exit(self, record: "Record") -> None:
    """Reply with upload progress and, once available, the exit result.

    Nothing is sent when the record asks for neither a response nor a
    mailbox delivery.
    """
    control = record.control
    if not (control.req_resp or control.mailbox_slot):
        return

    result = proto_util._result_from_record(record)

    if self._pusher:
        _alive, status = self._pusher.get_status()
        counts = self._pusher.file_counts_by_category()
        poll_response = result.response.poll_exit_response

        stats = poll_response.pusher_stats
        stats.uploaded_bytes = status.uploaded_bytes
        stats.total_bytes = status.total_bytes
        stats.deduped_bytes = status.deduped_bytes

        by_category = poll_response.file_counts
        by_category.wandb_count = counts.wandb
        by_category.media_count = counts.media
        by_category.artifact_count = counts.artifact
        by_category.other_count = counts.other

    if self._exit_result:
        result.response.poll_exit_response.done = True
        result.response.poll_exit_response.exit_result.CopyFrom(self._exit_result)

    self._respond_result(result)
726
+
727
def send_request_server_info(self, record: "Record") -> None:
    """Reply with local server info and the stored server messages."""
    assert record.control.req_resp or record.control.mailbox_slot
    result = proto_util._result_from_record(record)

    result.response.server_info_response.local_info.CopyFrom(self.get_local_info())
    for message in self._server_messages:
        # Guard against a malformed level from the server: anything that is
        # not a plain digit string falls back to printer.INFO.
        raw_level = str(message.get("messageLevel"))
        if raw_level.isdigit():
            level = int(raw_level)
        else:
            level = int(printer.INFO)
        server_message = wandb_internal_pb2.ServerMessage(
            utf_text=message.get("utfText", ""),
            plain_text=message.get("plainText", ""),
            html_text=message.get("htmlText", ""),
            type=message.get("messageType", ""),
            level=level,
        )
        result.response.server_info_response.server_messages.item.append(
            server_message
        )
    self._respond_result(result)
748
+
749
def _setup_resume(
    self, run: "RunRecord"
) -> Optional["wandb_internal_pb2.ErrorInfo"]:
    """Queries the backend for a run; fail if the settings are incompatible.

    When the run exists and has been initialized, the resume state (step,
    runtime, line counts, config, summary, tags) is filled in from the
    backend's answer.

    Args:
        run: The run record being initialized.

    Returns:
        ``None`` when resuming is not requested or was set up, otherwise a
        USAGE ``ErrorInfo`` describing why the ``resume`` setting cannot be
        honoured.
    """
    if not self._settings.resume:
        return None

    def usage_error(message: str) -> "wandb_internal_pb2.ErrorInfo":
        error = wandb_internal_pb2.ErrorInfo()
        error.code = wandb_internal_pb2.ErrorInfo.ErrorCode.USAGE
        error.message = message
        return error

    # TODO: This causes a race, we need to make the upsert atomically
    # only create or update depending on the resume config
    # we use the runs entity if set, otherwise fallback to users entity
    # todo: ensure entity is not None as self._entity is Optional[str]
    entity = run.entity or self._entity
    logger.info(
        "checking resume status for %s/%s/%s", entity, run.project, run.run_id
    )
    resume_status = self._api.run_resume_status(
        entity=entity,  # type: ignore
        project_name=run.project,
        name=run.run_id,
    )
    # No resume status = run does not exist; No t key in wandbConfig = run exists but hasn't been inited
    if not resume_status or '"t":' not in resume_status.get("wandbConfig", ""):
        if self._settings.resume == "must":
            return usage_error(
                "You provided an invalid value for the `resume` argument."
                f" The value 'must' is not a valid option for resuming a run ({run.run_id}) that has not been initialized."
                " Please check your inputs and try again with a valid run ID."
                " If you are trying to start a new run, please omit the `resume` argument or use `resume='allow'`."
            )
        return None

    #
    # handle cases where we have resume_status
    #
    if self._settings.resume == "never":
        return usage_error(
            "You provided an invalid value for the `resume` argument."
            f" The value 'never' is not a valid option for resuming a run ({run.run_id}) that already exists."
            " Please check your inputs and try again with a valid value for the `resume` argument."
        )

    # Every value read after the try block gets a default here, so a parse
    # failure part-way through cannot leave a name unbound (previously
    # `tags` was only assigned on the success path).
    history: Dict[str, Any] = {}
    config: Dict[str, Any] = {}
    summary: Dict[str, Any] = {}
    tags: list = []
    events_rt = 0
    history_rt = 0
    try:
        # The tails are JSON lists of JSON-encoded rows; only the last row
        # matters. `history` is rebound only to that decoded row, so an empty
        # tail keeps the `{}` default instead of becoming a list.
        history_tail = json.loads(resume_status["historyTail"])
        if history_tail:
            history = json.loads(history_tail[-1])
            history_rt = history.get("_runtime", 0)
        events_tail = json.loads(resume_status["eventsTail"])
        if events_tail:
            last_event = json.loads(events_tail[-1])
            events_rt = last_event.get("_runtime", 0)
        config = json.loads(resume_status["config"] or "{}")
        summary = json.loads(resume_status["summaryMetrics"] or "{}")
        new_runtime = summary.get("_wandb", {}).get("runtime", None)
        if new_runtime is not None:
            self._resume_state.wandb_runtime = new_runtime
        tags = resume_status.get("tags") or []

    except (IndexError, ValueError) as e:
        logger.error("unable to load resume tails", exc_info=e)
        if self._settings.resume == "must":
            return usage_error(
                f"resume='must' but could not resume ({run.run_id}) "
            )

    # TODO: Do we need to restore config / summary?
    # System metrics runtime is usually greater than history
    self._resume_state.runtime = max(events_rt, history_rt)
    last_step = history.get("_step", 0)
    history_line_count = resume_status["historyLineCount"]
    self._resume_state.step = last_step + 1 if history_line_count > 0 else last_step
    self._resume_state.history = history_line_count
    self._resume_state.events = resume_status["eventsLineCount"]
    self._resume_state.output = resume_status["logLineCount"]
    self._resume_state.config = config
    self._resume_state.summary = summary
    self._resume_state.tags = tags
    self._resume_state.resumed = True
    logger.info("configured resuming with: {}".format(self._resume_state))
    return None
843
+
844
+ def _telemetry_get_framework(self) -> str:
845
+ """Get telemetry data for internal config structure."""
846
+ # detect framework by checking what is loaded
847
+ imports: telemetry.TelemetryImports
848
+ if self._telemetry_obj.HasField("imports_finish"):
849
+ imports = self._telemetry_obj.imports_finish
850
+ elif self._telemetry_obj.HasField("imports_init"):
851
+ imports = self._telemetry_obj.imports_init
852
+ else:
853
+ return ""
854
+ framework = next(
855
+ (n for f, n in _framework_priority() if getattr(imports, f, False)), ""
856
+ )
857
+ return framework
858
+
859
def _config_backend_dict(self) -> sender_config.BackendConfigDict:
    """Build the config dict sent to the backend from the current state.

    A fresh ``ConfigState`` is used when the consolidated config is falsy.
    """
    config_state = self._consolidated_config
    if not config_state:
        config_state = sender_config.ConfigState()

    framework = self._telemetry_get_framework()
    return config_state.to_backend_dict(
        telemetry_record=self._telemetry_obj,
        framework=framework,
        start_time_millis=self._start_time,
        metric_pbdicts=self._config_metric_pbdict_list,
    )
868
+
869
def _config_save(
    self,
    config_value_dict: sender_config.BackendConfigDict,
) -> None:
    """Write the given config dict to ``config.yaml`` in the run's files dir."""
    config_util.save_config_file_from_dict(
        os.path.join(self._settings.files_dir, "config.yaml"),
        config_value_dict,
    )
875
+
876
+ def _sync_spell(self) -> None:
877
+ """Sync this run with spell."""
878
+ if not self._run:
879
+ return
880
+ try:
881
+ env = os.environ
882
+ self._interface.publish_config(
883
+ key=("_wandb", "spell_url"), val=env.get("SPELL_RUN_URL")
884
+ )
885
+ url = "{}/{}/{}/runs/{}".format(
886
+ self._api.app_url, self._run.entity, self._run.project, self._run.run_id
887
+ )
888
+ requests.put(
889
+ env.get("SPELL_API_URL", "https://api.spell.run") + "/wandb_url",
890
+ json={"access_token": env.get("WANDB_ACCESS_TOKEN"), "url": url},
891
+ timeout=2,
892
+ )
893
+ except requests.RequestException:
894
+ pass
895
+ # TODO: do something if sync spell is not successful?
896
+
897
+ def _setup_fork(self, server_run: dict):
898
+ assert self._settings.fork_from
899
+ assert self._settings.fork_from.metric == "_step"
900
+ assert self._run
901
+ first_step = int(self._settings.fork_from.value) + 1
902
+ self._resume_state.step = first_step
903
+ self._resume_state.history = server_run.get("historyLineCount", 0)
904
+ self._run.forked = True
905
+ self._run.starting_step = first_step
906
+
907
+ def _load_rewind_state(self, run: "RunRecord"):
908
+ assert self._settings.resume_from
909
+ self._rewind_response = self._api.rewind_run(
910
+ run_name=run.run_id,
911
+ entity=run.entity or None,
912
+ project=run.project or None,
913
+ metric_name=self._settings.resume_from.metric,
914
+ metric_value=self._settings.resume_from.value,
915
+ program_path=self._settings.program or None,
916
+ )
917
+ self._resume_state.history = self._rewind_response.get("historyLineCount", 0)
918
+ self._resume_state.config = json.loads(
919
+ self._rewind_response.get("config", "{}")
920
+ )
921
+
922
+ def _install_rewind_state(self):
923
+ assert self._settings.resume_from
924
+ assert self._settings.resume_from.metric == "_step"
925
+ assert self._run
926
+ assert self._rewind_response
927
+
928
+ first_step = int(self._settings.resume_from.value) + 1
929
+ self._resume_state.step = first_step
930
+
931
+ # We set the fork flag here because rewind uses the forking
932
+ # infrastructure under the hood. Setting `forked` here
933
+ # ensures that run._step is properly set in the user process.
934
+ self._run.forked = True
935
+ self._run.starting_step = first_step
936
+
937
def _handle_error(
    self,
    record: "Record",
    error: "wandb_internal_pb2.ErrorInfo",
    run: "RunRecord",
) -> None:
    """Report a run-initialization error to the requester, or log it.

    When the record expects a reply (``req_resp`` or ``mailbox_slot``), the
    run and the error are returned in a run result; otherwise the error
    message is only logged.
    """
    expects_reply = record.control.req_resp or record.control.mailbox_slot
    if not expects_reply:
        logger.error("Got error in async mode: %s", error.message)
        return

    result = proto_util._result_from_record(record)
    result.run_result.run.CopyFrom(run)
    result.run_result.error.CopyFrom(error)
    self._respond_result(result)
950
+
951
def send_run(self, record: "Record", file_dir: Optional[str] = None) -> None:
    """Handle a run record: initialize the run on first use, update it after.

    The first run record (``self._run`` still unset) is treated as
    ``wandb.init``: resume / rewind / fork options are resolved, the run is
    upserted and the run threads are started. Later run records only upsert
    the run again.

    Args:
        record: Record whose ``run`` field describes the run.
        file_dir: Forwarded to ``_start_run_threads`` on the first run record.
    """
    run = record.run
    error = None
    is_wandb_init = self._run is None

    # save start time of a run
    self._start_time = int(run.start_time.ToMicroseconds() // 1e6)

    # update telemetry
    if run.telemetry:
        self._telemetry_obj.MergeFrom(run.telemetry)
    if self._settings._sync:
        self._telemetry_obj.feature.sync = True

    # build config dict
    config_value_dict: Optional[sender_config.BackendConfigDict] = None
    if run.config:
        self._consolidated_config.update_from_proto(run.config)
        config_value_dict = self._config_backend_dict()
        self._config_save(config_value_dict)

    do_fork = self._settings.fork_from is not None and is_wandb_init
    do_rewind = self._settings.resume_from is not None and is_wandb_init
    do_resume = bool(self._settings.resume)

    num_resume_options_set = sum([do_fork, do_rewind, do_resume])
    if num_resume_options_set > 1:
        error = wandb_internal_pb2.ErrorInfo()
        error.code = wandb_internal_pb2.ErrorInfo.ErrorCode.USAGE
        error.message = (
            "Multiple resume options specified. "
            "Please specify only one of `fork_from`, `resume`, or `resume_from`."
        )
        self._handle_error(record, error, run)
        # Stop here: the error has been reported. Falling through would
        # overwrite `error` in the resume/rewind step below and could still
        # upsert the run and send a second result for the same record.
        return

    if is_wandb_init:
        # Ensure we have a project to query for status
        if run.project == "":
            run.project = util.auto_project_name(self._settings.program)

        # Only check resume status on `wandb.init`
        if do_resume:
            error = self._setup_resume(run)
        elif do_rewind:
            error = self._load_rewind_state(run)

    if error is not None:
        self._handle_error(record, error, run)
        return

    # Save the resumed config
    if self._resume_state.config is not None:
        self._consolidated_config.merge_resumed_config(
            config_util.dict_strip_value_dict(self._resume_state.config)
        )

        config_value_dict = self._config_backend_dict()
        self._config_save(config_value_dict)

    # handle empty config
    # TODO(jhr): consolidate the 4 ways config is built:
    #            (passed config, empty config, resume config, send_config)
    if not config_value_dict:
        config_value_dict = self._config_backend_dict()
        self._config_save(config_value_dict)

    try:
        server_run = self._init_run(run, config_value_dict)
    except (CommError, UsageError) as e:
        logger.error(e, exc_info=True)
        error = ProtobufErrorHandler.from_exception(e)
        self._handle_error(record, error, run)
        return

    assert self._run  # self._run is configured in _init_run()

    if do_fork:
        error = self._setup_fork(server_run)

    if error is not None:
        self._handle_error(record, error, run)
        return

    if record.control.req_resp or record.control.mailbox_slot:
        result = proto_util._result_from_record(record)
        # TODO: we could do self._interface.publish_defer(resp) to notify
        # the handler not to actually perform server updates for this uuid
        # because the user process will send a summary update when we resume
        result.run_result.run.CopyFrom(self._run)
        self._respond_result(result)

    # Only spin up our threads on the first run message
    if is_wandb_init:
        self._start_run_threads(file_dir)
    else:
        logger.info("updated run: %s", self._run.run_id)
1048
+
1049
+ def _update_resume_state(self, is_rewinding: bool, inserted: bool):
1050
+ assert self._run
1051
+ if self._resume_state.resumed:
1052
+ self._run.resumed = True
1053
+ if self._resume_state.wandb_runtime is not None:
1054
+ self._run.runtime = self._resume_state.wandb_runtime
1055
+ elif is_rewinding:
1056
+ # because is_rewinding is mutually exclusive with self._resume_state.resumed,
1057
+ # this block will always execute if is_rewinding is set
1058
+ self._install_rewind_state()
1059
+ else:
1060
+ # If the user is not resuming, and we didn't insert on upsert_run then
1061
+ # it is likely that we are overwriting the run which we might want to
1062
+ # prevent in the future. This could be a false signal since an upsert_run
1063
+ # message which gets retried in the network could also show up as not
1064
+ # inserted.
1065
+ if not inserted:
1066
+ # no need to flush this, it will get updated eventually
1067
+ self._telemetry_obj.feature.maybe_run_overwrite = True
1068
+
1069
def _init_run(
    self,
    run: "RunRecord",
    config_dict: Optional[sender_config.BackendConfigDict],
) -> dict:
    """Upsert the run (or reuse the rewind response) and adopt server values.

    Stores ``run`` as ``self._run`` and copies the storage id, display name,
    project, entity and sweep id returned by the server onto it.

    Args:
        run: The run record to register.
        config_dict: Backend config sent with the upsert and copied onto the
            run record.

    Returns:
        The server's run data.

    Raises:
        ValueError: If the run is marked both resumed and rewinding.
    """
    # We subtract the previous runs runtime when resuming
    start_time = (
        run.start_time.ToMicroseconds() / 1e6
    ) - self._resume_state.runtime
    # TODO: we don't check inserted currently, ultimately we should make
    # the upsert know the resume state and fail transactionally

    if self._resume_state and self._resume_state.tags and not run.tags:
        run.tags.extend(self._resume_state.tags)

    is_rewinding = bool(self._settings.resume_from)
    if not is_rewinding:
        server_run, inserted, server_messages = self._api.upsert_run(
            name=run.run_id,
            entity=run.entity or None,
            project=run.project or None,
            group=run.run_group or None,
            job_type=run.job_type or None,
            display_name=run.display_name or None,
            notes=run.notes or None,
            tags=run.tags[:] or None,
            config=config_dict or None,
            sweep_name=run.sweep_id or None,
            host=run.host or None,
            program_path=self._settings.program or None,
            repo=run.git.remote_url or None,
            commit=run.git.commit or None,
        )
    else:
        # The rewind request already returned the run data; no upsert needed.
        assert self._rewind_response
        server_run = self._rewind_response
        server_messages = None
        inserted = True

    # TODO: we don't want to create jobs in sweeps, since the
    # executable doesn't appear to be consistent
    if run.sweep_id:
        self._job_builder.disable = True

    self._server_messages = server_messages or []
    self._run = run

    if self._resume_state.resumed and is_rewinding:
        # this should not ever be possible to hit, since we check for
        # resumption above and raise an error if resumption is specified
        # twice.
        raise ValueError(
            "Cannot attempt to rewind and resume a run - only one of "
            "`resume` or `resume_from` can be specified."
        )

    self._update_resume_state(is_rewinding, inserted)
    self._run.starting_step = self._resume_state.step
    self._run.start_time.FromMicroseconds(int(start_time * 1e6))
    self._run.config.CopyFrom(self._interface._make_config(config_dict))
    if self._resume_state.summary is not None:
        resumed_summary = self._interface._make_summary_from_dict(
            self._resume_state.summary
        )
        self._run.summary.CopyFrom(resumed_summary)

    storage_id = server_run.get("id")
    if storage_id:
        self._run.storage_id = storage_id

    server_run_name = server_run.get("name")
    if server_run_name:
        self._api.set_current_run_id(server_run_name)

    display_name = server_run.get("displayName")
    if display_name:
        self._run.display_name = display_name

    project = server_run.get("project")
    # TODO: remove self._api.set_settings, and make self._project a property?
    if project:
        project_name = project.get("name")
        if project_name:
            self._run.project = project_name
            self._project = project_name
            self._api_settings["project"] = project_name
            self._api.set_setting("project", project_name)

        entity = project.get("entity")
        entity_name = entity.get("name") if entity else None
        if entity_name:
            self._run.entity = entity_name
            self._entity = entity_name
            self._api_settings["entity"] = entity_name
            self._api.set_setting("entity", entity_name)

    sweep_id = server_run.get("sweepName")
    if sweep_id:
        self._run.sweep_id = sweep_id

    if os.getenv("SPELL_RUN_URL"):
        self._sync_spell()
    return server_run
1165
+
1166
def _start_run_threads(self, file_dir: Optional[str] = None) -> None:
    """Create and start the file stream, file pusher and directory watcher.

    Args:
        file_dir: Passed through to ``DirWatcher``.
    """
    assert self._run  # self._run is configured by caller
    run_start_seconds = self._run.start_time.ToMicroseconds() / 1e6
    self._fs = file_stream.FileStreamApi(
        self._api,
        self._run.run_id,
        run_start_seconds,
        timeout=self._settings._file_stream_timeout_seconds,
        settings=self._api_settings,
    )

    # Ensure the streaming policies have the proper offsets
    resume_state = self._resume_state
    file_policies = (
        ("wandb-summary.json", file_stream.SummaryFilePolicy()),
        (
            "wandb-history.jsonl",
            file_stream.JsonlFilePolicy(start_chunk_id=resume_state.history),
        ),
        (
            "wandb-events.jsonl",
            file_stream.JsonlFilePolicy(start_chunk_id=resume_state.events),
        ),
        (
            "output.log",
            file_stream.CRDedupeFilePolicy(start_chunk_id=resume_state.output),
        ),
    )
    for file_name, policy in file_policies:
        self._fs.set_file_policy(file_name, policy)

    # hack to merge run_settings and self._settings object together
    # so that fields like entity or project are available to be attached to Sentry events.
    run_settings = message_to_dict(self._run)
    sentry_tags = dict(self._settings)
    sentry_tags.update(run_settings)
    wandb._sentry.configure_scope(tags=sentry_tags, process_context="internal")

    self._fs.start()
    self._pusher = FilePusher(self._api, self._fs, settings=self._settings)
    self._dir_watcher = DirWatcher(self._settings, self._pusher, file_dir)
    logger.info(
        "run started: %s with start time %s",
        self._run.run_id,
        self._run.start_time.ToMicroseconds() / 1e6,
    )
1205
+
1206
+ def _save_history(self, history_dict: Dict[str, Any]) -> None:
1207
+ if self._fs:
1208
+ self._fs.push(filenames.HISTORY_FNAME, json.dumps(history_dict))
1209
+
1210
def send_history(self, record: "Record") -> None:
    """Convert a history record's items to a dict and save it."""
    row = proto_util.dict_from_proto_list(record.history.item)
    self._save_history(row)
1214
+
1215
def _update_summary_record(self, summary: "SummaryRecord") -> None:
    """Replace the cached summary with this record's updates and re-publish."""
    self._cached_summary = proto_util.dict_from_proto_list(summary.update)
    self._update_summary()
1219
+
1220
def send_summary(self, record: "Record") -> None:
    """Apply the summary carried directly on the record."""
    summary = record.summary
    self._update_summary_record(summary)
1222
+
1223
def send_request_summary_record(self, record: "Record") -> None:
    """Apply the summary carried inside a summary-record request."""
    summary = record.request.summary_record.summary
    self._update_summary_record(summary)
1225
+
1226
def _update_summary(self) -> None:
    """Merge the cached summary into the consolidated one and publish it.

    The result is pushed to the file stream when one is active, written to
    the summary file in the run's files dir, and that file is saved.
    """
    latest = self._cached_summary.copy()
    # Any "_wandb" entry in the cached summary is replaced by our metadata.
    latest.pop("_wandb", None)
    if self._metadata_summary:
        latest["_wandb"] = self._metadata_summary

    # merge with consolidated summary
    self._consolidated_summary.update(latest)
    serialized = json.dumps(self._consolidated_summary)

    if self._fs:
        self._fs.push(filenames.SUMMARY_FNAME, serialized)

    # TODO(jhr): we should only write this at the end of the script
    local_path = os.path.join(self._settings.files_dir, filenames.SUMMARY_FNAME)
    with open(local_path, "w") as summary_file:
        summary_file.write(serialized)
    self._save_file(interface.GlobStr(filenames.SUMMARY_FNAME))
1241
+
1242
def send_stats(self, record: "Record") -> None:
    """Push a system-stats record to the events file as one JSON row.

    Only stats of type SYSTEM are handled, and only while both the file
    stream and the run are set.
    """
    stats = record.stats
    if stats.stats_type != wandb_internal_pb2.StatsRecord.StatsType.SYSTEM:
        return
    if not self._fs or not self._run:
        return

    now_us = stats.timestamp.ToMicroseconds()
    start_us = self._run.start_time.ToMicroseconds()
    system_values = {item.key: json.loads(item.value_json) for item in stats.item}

    row: Dict[str, Any] = {"system": system_values}
    self._flatten(row)
    row["_wandb"] = True
    row["_timestamp"] = now_us / 1e6
    row["_runtime"] = (now_us - start_us) / 1e6
    # TODO(jhr): check fs.push results?
    self._fs.push(filenames.EVENTS_FNAME, json.dumps(row))
1262
+
1263
+ def _output_raw_finish(self) -> None:
1264
+ for stream, output_raw in self._output_raw_streams.items():
1265
+ output_raw._stopped.set()
1266
+
1267
+ # shut down threads
1268
+ output_raw._writer_thr.join(timeout=5)
1269
+ if output_raw._writer_thr.is_alive():
1270
+ logger.info("processing output...")
1271
+ output_raw._writer_thr.join()
1272
+ output_raw._reader_thr.join()
1273
+
1274
+ # flush output buffers and files
1275
+ self._output_raw_flush(stream)
1276
+ self._output_raw_streams = {}
1277
+ if self._output_raw_file:
1278
+ self._output_raw_file.close()
1279
+ self._output_raw_file = None
1280
+
1281
+ def _output_raw_writer_thread(self, stream: "StreamLiterals") -> None:
1282
+ while True:
1283
+ output_raw = self._output_raw_streams[stream]
1284
+ if output_raw._queue.empty():
1285
+ if output_raw._stopped.is_set():
1286
+ return
1287
+ time.sleep(0.5)
1288
+ continue
1289
+ data = []
1290
+ while not output_raw._queue.empty():
1291
+ data.append(output_raw._queue.get())
1292
+ if output_raw._stopped.is_set() and sum(map(len, data)) > 100000:
1293
+ logger.warning("Terminal output too large. Logging without processing.")
1294
+ self._output_raw_flush(stream)
1295
+ for line in data:
1296
+ self._output_raw_flush(stream, line)
1297
+ # TODO: lets mark that this happened in telemetry
1298
+ return
1299
+ try:
1300
+ output_raw._emulator.write("".join(data))
1301
+ except Exception as e:
1302
+ logger.warning(f"problem writing to output_raw emulator: {e}")
1303
+
1304
+ def _output_raw_reader_thread(self, stream: "StreamLiterals") -> None:
1305
+ output_raw = self._output_raw_streams[stream]
1306
+ while not (output_raw._stopped.is_set() and output_raw._queue.empty()):
1307
+ self._output_raw_flush(stream)
1308
+ time.sleep(_OUTPUT_MIN_CALLBACK_INTERVAL)
1309
+
1310
+ def _output_raw_flush(
1311
+ self, stream: "StreamLiterals", data: Optional[str] = None
1312
+ ) -> None:
1313
+ if data is None:
1314
+ output_raw = self._output_raw_streams[stream]
1315
+ try:
1316
+ data = output_raw._emulator.read()
1317
+ except Exception as e:
1318
+ logger.warning(f"problem reading from output_raw emulator: {e}")
1319
+ if data:
1320
+ self._send_output_line(stream, data)
1321
+ if self._output_raw_file:
1322
+ self._output_raw_file.write(data.encode("utf-8"))
1323
+
1324
def send_request_python_packages(self, record: "Record") -> None:
    """Write the reported packages as sorted ``name==version`` lines.

    The lines go to the requirements file in the run's files dir.
    """
    import os

    from wandb.sdk.lib.filenames import REQUIREMENTS_FNAME

    packages = record.request.python_packages.package
    requirement_lines = sorted(f"{pkg.name}=={pkg.version}" for pkg in packages)
    requirements_path = os.path.join(self._settings.files_dir, REQUIREMENTS_FNAME)
    with open(requirements_path, "w") as requirements_file:
        requirements_file.write("\n".join(requirement_lines))
1334
+
1335
def send_output(self, record: "Record") -> None:
    """Forward one console output line, tagged as stdout or stderr.

    Nothing is sent while no file stream is active.
    """
    if not self._fs:
        return
    output = record.output
    is_stderr = (
        output.output_type == wandb_internal_pb2.OutputRecord.OutputType.STDERR
    )
    stream: StreamLiterals = "stderr" if is_stderr else "stdout"
    self._send_output_line(stream, output.line)
1344
+
1345
def send_output_raw(self, record: "Record") -> None:
    """Queue raw console output on its per-stream raw output handler.

    The handler for a stream is created and started the first time that
    stream is seen; the output file is opened at that point if it is not
    open already. Nothing happens while no file stream is active.
    """
    if not self._fs:
        return
    raw_output = record.output_raw
    is_stderr = (
        raw_output.output_type
        == wandb_internal_pb2.OutputRawRecord.OutputType.STDERR
    )
    stream: StreamLiterals = "stderr" if is_stderr else "stdout"
    line = raw_output.line

    raw_stream = self._output_raw_streams.get(stream)
    if not raw_stream:
        raw_stream = _OutputRawStream(stream=stream, sm=self)
        self._output_raw_streams[stream] = raw_stream

        # open the console output file shared between both streams
        if not self._output_raw_file:
            log_path = os.path.join(self._settings.files_dir, filenames.OUTPUT_FNAME)
            opened_file = None
            try:
                opened_file = filesystem.CRDedupedFile(open(log_path, "wb"))
            except OSError as e:
                logger.warning(f"could not open output_raw_file: {e}")
            if opened_file:
                self._output_raw_file = opened_file
        raw_stream.start()

    raw_stream._queue.put(line)
1376
+
1377
def _send_output_line(self, stream: "StreamLiterals", line: str) -> None:
    """Combined writer for raw and non raw output lines.

    This is combined because they are both post emulator.

    A line that does not end in a newline is buffered in
    ``self._partial_output[stream]``; if it starts with a carriage return,
    the text buffered so far is discarded first. A newline-terminated line is
    prefixed with ``"ERROR "`` (stderr only), a UTC ISO-8601 timestamp and
    any buffered partial text, pushed to ``self._fs`` when that is set, and
    the buffer for the stream is then cleared.

    Args:
        stream: ``"stdout"`` or ``"stderr"``.
        line: The text to buffer or emit.
    """
    # Local import: only ``datetime`` (the class) is known to be in scope here.
    from datetime import timezone

    prepend = "ERROR " if stream == "stderr" else ""

    if not line.endswith("\n"):
        self._partial_output.setdefault(stream, "")
        if line.startswith("\r"):
            # TODO: maybe we shouldn't just drop this; what if there were some
            # "\n"s in the partial? That should probably be the check instead
            # of `not line.endswith("\n")`.
            self._partial_output[stream] = ""
        self._partial_output[stream] += line
        # TODO(jhr): how do we make sure this gets flushed?
        # we might need this for other stuff like telemetry
        return

    # TODO(jhr): use time from timestamp proto
    # TODO(jhr): do we need to make sure we write full lines?
    # seems to be some issues with line breaks
    cur_time = time.time()
    # `datetime.utcfromtimestamp` is deprecated since Python 3.12. Convert via
    # an aware UTC datetime and drop the tzinfo so the rendered text is the
    # same naive ISO string as before (no "+00:00" suffix).
    utc_now = datetime.fromtimestamp(cur_time, tz=timezone.utc).replace(tzinfo=None)
    timestamp = utc_now.isoformat() + " "
    prev_str = self._partial_output.get(stream, "")
    line = f"{prepend}{timestamp}{prev_str}{line}"
    if self._fs:
        self._fs.push(filenames.OUTPUT_FNAME, line)
    self._partial_output[stream] = ""
1406
+
1407
def _update_config(self) -> None:
    """Flag the config as changed by setting ``_config_needs_debounce``."""
    self._config_needs_debounce = True
1409
+
1410
def send_config(self, record: "Record") -> None:
    """Merge ``record.config`` into the consolidated config and flag the change."""
    incoming_config = record.config
    self._consolidated_config.update_from_proto(incoming_config)
    self._update_config()
1413
+
1414
def send_metric(self, record: "Record") -> None:
    """Record a metric definition in the config-side metric tables.

    Metrics carrying a ``glob_name`` are logged and ignored. Otherwise the
    incoming metric is copied over (when ``_control.overwrite`` is set) or
    merged into the stored definition for that name. If the metric names a
    ``step_metric`` that already has an index, a copy is encoded with
    ``step_metric`` cleared and ``step_metric_index`` set to that index plus
    one. The encoded dict replaces the existing list entry for the metric or
    is appended as a new one, and the config is flagged as changed.
    """
    incoming = record.metric
    if incoming.glob_name:
        logger.warning("Seen metric with glob (shouldn't happen)")
        return

    # merge or overwrite
    stored = self._config_metric_dict.get(
        incoming.name, wandb_internal_pb2.MetricRecord()
    )
    if incoming._control.overwrite:
        stored.CopyFrom(incoming)
    else:
        stored.MergeFrom(incoming)
    self._config_metric_dict[incoming.name] = stored

    # convert step_metric to index
    to_encode = stored
    if stored.step_metric:
        step_idx = self._config_metric_index_dict.get(stored.step_metric)
        if step_idx is not None:
            # work on a copy so the stored definition keeps its step_metric
            scratch = wandb_internal_pb2.Record()
            scratch.metric.CopyFrom(stored)
            to_encode = scratch.metric

            to_encode.ClearField("step_metric")
            to_encode.step_metric_index = step_idx + 1

    md: Dict[int, Any] = proto_util.proto_encode_to_dict(to_encode)
    existing_idx = self._config_metric_index_dict.get(to_encode.name)
    if existing_idx is None:
        new_idx = len(self._config_metric_pbdict_list)
        self._config_metric_pbdict_list.append(md)
        self._config_metric_index_dict[to_encode.name] = new_idx
    else:
        self._config_metric_pbdict_list[existing_idx] = md
    self._update_config()
1452
+
1453
def _update_telemetry_record(self, telemetry: telemetry.TelemetryRecord) -> None:
    """Merge ``telemetry`` into the accumulated telemetry object and flag the config."""
    accumulated = self._telemetry_obj
    accumulated.MergeFrom(telemetry)
    self._update_config()
1456
+
1457
def send_telemetry(self, record: "Record") -> None:
    """Merge the telemetry carried directly on ``record``."""
    payload = record.telemetry
    self._update_telemetry_record(payload)
1459
+
1460
def send_request_telemetry_record(self, record: "Record") -> None:
    """Merge the telemetry carried in a ``telemetry_record`` request."""
    payload = record.request.telemetry_record.telemetry
    self._update_telemetry_record(payload)
1462
+
1463
def _save_file(
    self, fname: interface.GlobStr, policy: "interface.PolicyName" = "end"
) -> None:
    """Log the request and pass the policy for ``fname`` to the directory watcher.

    The watcher is only updated when ``self._dir_watcher`` is set.
    """
    logger.info("saving file %s with policy %s", fname, policy)
    if not self._dir_watcher:
        return
    self._dir_watcher.update_policy(fname, policy)
1469
+
1470
def send_files(self, record: "Record") -> None:
    """Apply the save policy of every entry in ``record.files.files``."""
    for entry in record.files.files:
        # TODO(jhr): fix paths with directories
        glob = interface.GlobStr(entry.path)
        policy = interface.file_enum_to_policy(entry.policy)
        self._save_file(glob, policy)
1477
+
1478
def send_header(self, record: "Record") -> None:
    """Accept a header record; intentionally a no-op."""
    return None
1480
+
1481
def send_footer(self, record: "Record") -> None:
    """Accept a footer record; intentionally a no-op."""
    return None
1483
+
1484
def send_tbrecord(self, record: "Record") -> None:
    """Accept a tbrecord; intentionally a no-op here.

    tbrecord watching threads are handled by handler.py.
    """
    return None
1487
+
1488
def send_request_link_artifact(self, record: "Record") -> None:
    """Link an artifact to a portfolio and respond with the outcome.

    The link is attempted only when an artifact id (client or server) and
    the portfolio name, entity and project are all present. A failed link is
    logged and its message is stored on the result; the result is always
    sent back via ``_respond_result``.

    Raises:
        ValueError: If the record's control has neither ``req_resp`` nor
            ``mailbox_slot`` set.
    """
    if not record.control.req_resp and not record.control.mailbox_slot:
        raise ValueError(
            f"Expected either `req_resp` or `mailbox_slot`, got: {record.control!r}"
        )

    result = proto_util._result_from_record(record)
    link = record.request.link_artifact
    client_id, server_id = link.client_id, link.server_id
    portfolio_name = link.portfolio_name
    entity, project = link.portfolio_entity, link.portfolio_project
    aliases = link.portfolio_aliases
    logger.debug(
        f"link_artifact params - client_id={client_id}, server_id={server_id}, pfolio={portfolio_name}, entity={entity}, project={project}"
    )

    has_artifact_id = client_id or server_id
    if has_artifact_id and portfolio_name and entity and project:
        try:
            self._api.link_artifact(
                client_id, server_id, portfolio_name, entity, project, aliases
            )
        except Exception as e:
            # NOTE(review): the error is stored on `log_artifact_response`
            # although this is a link request -- confirm whether a
            # link-specific response field was intended.
            result.response.log_artifact_response.error_message = f'error linking artifact to "{entity}/{project}/{portfolio_name}"; error: {e}'
            logger.warning("Failed to link artifact to portfolio: %s", e)

    self._respond_result(result)
1513
+
1514
def send_use_artifact(self, record: "Record") -> None:
    """Pretend to send a used artifact.

    This function doesn't actually send anything, it is just used internally
    to update the job builder: a partial job (one with ``partial.job_name``)
    sets the partial source id, while a non-partial artifact of type
    ``"job"`` disables the job builder.
    """
    use = record.use_artifact

    if use.partial.job_name:
        # job is partial, let job builder rebuild job, set job source dict
        self._job_builder.set_partial_source_id(use.id)
    elif use.type == "job":
        self._job_builder.disable = True
1526
+
1527
def send_request_log_artifact(self, record: "Record") -> None:
    """Send an artifact for a log-artifact request and respond with the outcome.

    On success the response carries the new artifact's id. On any failure,
    including an empty result from ``_send_artifact``, the response carries an
    error message instead. The result is always sent via ``_respond_result``.
    """
    assert record.control.req_resp
    result = proto_util._result_from_record(record)
    request = record.request.log_artifact
    artifact = request.artifact
    history_step = request.history_step

    try:
        res = self._send_artifact(artifact, history_step)
        # Explicit check rather than `assert`: asserts are stripped under
        # `python -O`, which would turn this into an opaque TypeError on the
        # subscript below. The message text is unchanged.
        if not res:
            raise RuntimeError("Unable to send artifact")
        result.response.log_artifact_response.artifact_id = res["id"]
        logger.info(f"logged artifact {artifact.name} - {res}")
    except Exception as e:
        result.response.log_artifact_response.error_message = (
            f'error logging artifact "{artifact.type}/{artifact.name}": {e}'
        )
        # Also log locally, as the sibling artifact handlers do.
        logger.warning("Failed to log artifact %s: %s", artifact.name, e)

    self._respond_result(result)
1544
+
1545
def send_artifact(self, record: "Record") -> None:
    """Send ``record.artifact``, logging the outcome instead of raising."""
    artifact = record.artifact
    try:
        outcome = self._send_artifact(artifact)
        logger.info(f"sent artifact {artifact.name} - {outcome}")
    except Exception as e:
        failure_msg = 'send_artifact: failed for artifact "{}/{}": {}'.format(
            artifact.type, artifact.name, e
        )
        logger.error(failure_msg)
1556
+
1557
def _send_artifact(
    self, artifact: "ArtifactRecord", history_step: Optional[int] = None
) -> Optional[Dict]:
    """Save an artifact through ``ArtifactSaver`` and return the saver's result.

    Args:
        artifact: The artifact proto to save.
        history_step: Passed through to the saver.

    Returns:
        Whatever ``ArtifactSaver.save`` returns, or ``None`` when the artifact
        is distributed and the server's max CLI version is unknown or older
        than 0.10.16.
    """
    from wandb.util import parse_version

    assert self._pusher
    saver = ArtifactSaver(
        api=self._api,
        digest=artifact.digest,
        manifest_json=_manifest_json_from_proto(artifact.manifest),
        file_pusher=self._pusher,
        is_user_created=artifact.user_created,
    )

    if artifact.distributed_id:
        max_cli_version = self._max_cli_version()
        server_too_old = max_cli_version is None or (
            parse_version(max_cli_version) < parse_version("0.10.16")
        )
        if server_too_old:
            logger.warning(
                "This W&B Server doesn't support distributed artifacts, "
                "have your administrator install wandb/local >= 0.9.37"
            )
            return None

    metadata = None
    if artifact.metadata:
        metadata = json.loads(artifact.metadata)

    res = saver.save(
        type=artifact.type,
        name=artifact.name,
        client_id=artifact.client_id,
        sequence_client_id=artifact.sequence_client_id,
        metadata=metadata,
        ttl_duration_seconds=artifact.ttl_duration_seconds or None,
        description=artifact.description or None,
        aliases=artifact.aliases,
        tags=artifact.tags,
        use_after_commit=artifact.use_after_commit,
        distributed_id=artifact.distributed_id,
        finalize=artifact.finalize,
        incremental=artifact.incremental_beta1,
        history_step=history_step,
        base_id=artifact.base_id or None,
    )

    self._job_builder._handle_server_artifact(res, artifact)

    # Remove the on-disk manifest file, if one was used; a file that is
    # already gone is ignored.
    manifest_path = artifact.manifest.manifest_file_path
    if manifest_path:
        with contextlib.suppress(FileNotFoundError):
            os.remove(artifact.manifest.manifest_file_path)
    return res
1607
+
1608
def send_alert(self, record: "Record") -> None:
    """Send a run alert to the server when the server supports alerts.

    A warning is logged and nothing is sent when the server's max CLI version
    is unknown or older than 0.10.9. Errors from the API call are logged
    rather than raised.
    """
    from wandb.util import parse_version

    alert = record.alert
    max_cli_version = self._max_cli_version()
    alerts_unsupported = max_cli_version is None or (
        parse_version(max_cli_version) < parse_version("0.10.9")
    )
    if alerts_unsupported:
        logger.warning(
            "This W&B server doesn't support alerts, "
            "have your administrator install wandb/local >= 0.9.31"
        )
        return

    try:
        self._api.notify_scriptable_run_alert(
            title=alert.title,
            text=alert.text,
            level=alert.level,
            wait_duration=alert.wait_duration,
        )
    except Exception as e:
        logger.error(f"send_alert: failed for alert {alert.title!r}: {e}")
1630
+
1631
def finish(self) -> None:
    """Shut down the sender's helpers in order and end the Sentry session.

    Finishes raw output handling, then the directory watcher, the file
    pusher (finish then join) and the file stream (finished with
    ``self._exit_code``). Each helper that was set is cleared to ``None``.
    """
    logger.info("shutting down sender")
    # if self._tb_watcher:
    #     self._tb_watcher.finish()
    self._output_raw_finish()

    watcher = self._dir_watcher
    if watcher:
        watcher.finish()
        self._dir_watcher = None

    pusher = self._pusher
    if pusher:
        pusher.finish()
        pusher.join()
        self._pusher = None

    file_stream = self._fs
    if file_stream:
        file_stream.finish(self._exit_code)
        self._fs = None

    wandb._sentry.end_session()
1647
+
1648
def _max_cli_version(self) -> Optional[str]:
    """Return the ``max_cli_version`` string from the server info, if any.

    Reads ``cliVersionInfo.max_cli_version`` from ``self.get_server_info()``.

    Returns:
        The version string, or ``None`` when ``cliVersionInfo`` is missing or
        null, or when ``max_cli_version`` is missing or not a string.
    """
    server_info = self.get_server_info()
    # `.get(key, {})` only covers a missing key. A key that is present with
    # a null value would return None and make the chained lookup raise
    # AttributeError, so fall back to an empty mapping for any falsy value.
    cli_version_info = server_info.get("cliVersionInfo") or {}
    max_cli_version = cli_version_info.get("max_cli_version", None)
    if not isinstance(max_cli_version, str):
        return None
    return max_cli_version
1656
+
1657
def get_viewer_server_info(self) -> None:
    """Fetch and cache viewer and server info unless both are already cached."""
    if not self._cached_server_info or not self._cached_viewer:
        viewer, server_info = self._api.viewer_server_info()
        self._cached_viewer = viewer
        self._cached_server_info = server_info
1661
+
1662
def get_viewer_info(self) -> Dict[str, Any]:
    """Return the cached viewer info, fetching it first when the cache is empty."""
    if self._cached_viewer:
        return self._cached_viewer
    self.get_viewer_server_info()
    return self._cached_viewer
1666
+
1667
def get_server_info(self) -> Dict[str, Any]:
    """Return the cached server info, fetching it first when the cache is empty."""
    if self._cached_server_info:
        return self._cached_server_info
    self.get_viewer_server_info()
    return self._cached_server_info
1671
+
1672
def get_local_info(self) -> "LocalInfo":
    """Queries the server to get the local version information.

    In offline mode the result is marked as not out-of-date without
    contacting the server. Otherwise the ``latestLocalVersionInfo`` entry of
    the server info is inspected: a null entry means not out-of-date; an
    absent entry falls back to an empty mapping and is therefore reported as
    out-of-date with version ``"latest"``.
    """
    info = wandb_internal_pb2.LocalInfo()
    if self._settings._offline:
        info.out_of_date = False
        return info

    fallback_version = "latest"

    # Assuming the query is successful if the result is empty it indicates that
    # the backend is out of date since it doesn't have the desired field
    server_info = self.get_server_info()
    version_info = server_info.get("latestLocalVersionInfo", {})
    if version_info is None:
        info.out_of_date = False
        return info

    info.out_of_date = version_info.get("outOfDate", True)
    info.version = version_info.get("latestVersionString", fallback_version)
    return info
1698
+
1699
def _flush_job(self) -> None:
    """Build the job artifact from current config/summary and publish it.

    Skipped entirely when the job builder is disabled or the run is offline.
    The summary handed to the job builder is a copy of the cached summary
    without its ``"_wandb"`` key. Nothing is published when the builder
    returns no artifact or when there is no run.
    """
    if self._job_builder.disable or self._settings._offline:
        return

    self._job_builder.set_config(self._consolidated_config.non_internal_config())
    summary = self._cached_summary.copy()
    summary.pop("_wandb", None)
    self._job_builder.set_summary(summary)

    built = self._job_builder.build(api=self._api)
    if built is None or self._run is None:
        return

    proto_artifact = self._interface._make_artifact(built)
    proto_artifact.run_id = self._run.run_id
    proto_artifact.project = self._run.project
    proto_artifact.entity = self._run.entity
    # TODO: this should be removed when the latest tag is handled
    # by the backend (WB-12116)
    proto_artifact.aliases.append("latest")
    # add docker image tag
    proto_artifact.aliases.extend(self._job_builder._aliases)

    proto_artifact.user_created = True
    proto_artifact.use_after_commit = True
    proto_artifact.finalize = True

    self._interface._publish_artifact(proto_artifact)
1725
+
1726
def __next__(self) -> "Record":
    """Block until a record is available on the record queue and return it."""
    record = self._record_q.get(block=True)
    return record

# Alias so the method is also reachable as ``next``.
next = __next__