wandb 0.17.0__py3-none-macosx_11_0_arm64.whl

Sign up to get free protection for your applications and to get access to all the features.
Files changed (833) hide show
  1. package_readme.md +95 -0
  2. wandb/__init__.py +252 -0
  3. wandb/__main__.py +3 -0
  4. wandb/_globals.py +19 -0
  5. wandb/agents/__init__.py +0 -0
  6. wandb/agents/pyagent.py +364 -0
  7. wandb/analytics/__init__.py +3 -0
  8. wandb/analytics/sentry.py +266 -0
  9. wandb/apis/__init__.py +48 -0
  10. wandb/apis/attrs.py +40 -0
  11. wandb/apis/importers/__init__.py +1 -0
  12. wandb/apis/importers/internals/internal.py +385 -0
  13. wandb/apis/importers/internals/protocols.py +99 -0
  14. wandb/apis/importers/internals/util.py +78 -0
  15. wandb/apis/importers/mlflow.py +254 -0
  16. wandb/apis/importers/validation.py +108 -0
  17. wandb/apis/importers/wandb.py +1598 -0
  18. wandb/apis/internal.py +225 -0
  19. wandb/apis/normalize.py +89 -0
  20. wandb/apis/paginator.py +81 -0
  21. wandb/apis/public/__init__.py +34 -0
  22. wandb/apis/public/api.py +1096 -0
  23. wandb/apis/public/artifacts.py +851 -0
  24. wandb/apis/public/const.py +4 -0
  25. wandb/apis/public/files.py +195 -0
  26. wandb/apis/public/history.py +149 -0
  27. wandb/apis/public/jobs.py +646 -0
  28. wandb/apis/public/projects.py +162 -0
  29. wandb/apis/public/query_generator.py +166 -0
  30. wandb/apis/public/reports.py +469 -0
  31. wandb/apis/public/runs.py +800 -0
  32. wandb/apis/public/sweeps.py +240 -0
  33. wandb/apis/public/teams.py +198 -0
  34. wandb/apis/public/users.py +136 -0
  35. wandb/apis/reports/__init__.py +7 -0
  36. wandb/apis/reports/v1/__init__.py +30 -0
  37. wandb/apis/reports/v1/_blocks.py +1406 -0
  38. wandb/apis/reports/v1/_helpers.py +70 -0
  39. wandb/apis/reports/v1/_panels.py +1282 -0
  40. wandb/apis/reports/v1/_templates.py +478 -0
  41. wandb/apis/reports/v1/blocks.py +27 -0
  42. wandb/apis/reports/v1/helpers.py +2 -0
  43. wandb/apis/reports/v1/mutations.py +66 -0
  44. wandb/apis/reports/v1/panels.py +17 -0
  45. wandb/apis/reports/v1/report.py +268 -0
  46. wandb/apis/reports/v1/runset.py +144 -0
  47. wandb/apis/reports/v1/templates.py +7 -0
  48. wandb/apis/reports/v1/util.py +406 -0
  49. wandb/apis/reports/v1/validators.py +131 -0
  50. wandb/apis/reports/v2/__init__.py +20 -0
  51. wandb/apis/reports/v2/blocks.py +25 -0
  52. wandb/apis/reports/v2/expr_parsing.py +257 -0
  53. wandb/apis/reports/v2/gql.py +68 -0
  54. wandb/apis/reports/v2/interface.py +1911 -0
  55. wandb/apis/reports/v2/internal.py +867 -0
  56. wandb/apis/reports/v2/metrics.py +6 -0
  57. wandb/apis/reports/v2/panels.py +15 -0
  58. wandb/beta/workflows.py +283 -0
  59. wandb/bin/apple_gpu_stats +0 -0
  60. wandb/bin/wandb-core +0 -0
  61. wandb/cli/__init__.py +0 -0
  62. wandb/cli/cli.py +2960 -0
  63. wandb/data_types.py +2071 -0
  64. wandb/docker/__init__.py +342 -0
  65. wandb/docker/auth.py +436 -0
  66. wandb/docker/wandb-entrypoint.sh +33 -0
  67. wandb/docker/www_authenticate.py +94 -0
  68. wandb/env.py +496 -0
  69. wandb/errors/__init__.py +46 -0
  70. wandb/errors/term.py +103 -0
  71. wandb/errors/util.py +57 -0
  72. wandb/filesync/__init__.py +0 -0
  73. wandb/filesync/dir_watcher.py +403 -0
  74. wandb/filesync/stats.py +100 -0
  75. wandb/filesync/step_checksum.py +142 -0
  76. wandb/filesync/step_prepare.py +179 -0
  77. wandb/filesync/step_upload.py +290 -0
  78. wandb/filesync/upload_job.py +142 -0
  79. wandb/integration/__init__.py +0 -0
  80. wandb/integration/catboost/__init__.py +5 -0
  81. wandb/integration/catboost/catboost.py +178 -0
  82. wandb/integration/cohere/__init__.py +3 -0
  83. wandb/integration/cohere/cohere.py +21 -0
  84. wandb/integration/cohere/resolver.py +347 -0
  85. wandb/integration/diffusers/__init__.py +3 -0
  86. wandb/integration/diffusers/autologger.py +76 -0
  87. wandb/integration/diffusers/pipeline_resolver.py +50 -0
  88. wandb/integration/diffusers/resolvers/__init__.py +9 -0
  89. wandb/integration/diffusers/resolvers/multimodal.py +882 -0
  90. wandb/integration/diffusers/resolvers/utils.py +102 -0
  91. wandb/integration/fastai/__init__.py +249 -0
  92. wandb/integration/gym/__init__.py +85 -0
  93. wandb/integration/huggingface/__init__.py +3 -0
  94. wandb/integration/huggingface/huggingface.py +18 -0
  95. wandb/integration/huggingface/resolver.py +213 -0
  96. wandb/integration/keras/__init__.py +14 -0
  97. wandb/integration/keras/callbacks/__init__.py +5 -0
  98. wandb/integration/keras/callbacks/metrics_logger.py +130 -0
  99. wandb/integration/keras/callbacks/model_checkpoint.py +200 -0
  100. wandb/integration/keras/callbacks/tables_builder.py +226 -0
  101. wandb/integration/keras/keras.py +1080 -0
  102. wandb/integration/kfp/__init__.py +6 -0
  103. wandb/integration/kfp/helpers.py +28 -0
  104. wandb/integration/kfp/kfp_patch.py +324 -0
  105. wandb/integration/kfp/wandb_logging.py +182 -0
  106. wandb/integration/langchain/__init__.py +3 -0
  107. wandb/integration/langchain/wandb_tracer.py +48 -0
  108. wandb/integration/lightgbm/__init__.py +239 -0
  109. wandb/integration/lightning/__init__.py +0 -0
  110. wandb/integration/lightning/fabric/__init__.py +3 -0
  111. wandb/integration/lightning/fabric/logger.py +762 -0
  112. wandb/integration/magic.py +556 -0
  113. wandb/integration/metaflow/__init__.py +3 -0
  114. wandb/integration/metaflow/metaflow.py +383 -0
  115. wandb/integration/openai/__init__.py +3 -0
  116. wandb/integration/openai/fine_tuning.py +454 -0
  117. wandb/integration/openai/openai.py +22 -0
  118. wandb/integration/openai/resolver.py +240 -0
  119. wandb/integration/prodigy/__init__.py +3 -0
  120. wandb/integration/prodigy/prodigy.py +299 -0
  121. wandb/integration/sacred/__init__.py +117 -0
  122. wandb/integration/sagemaker/__init__.py +12 -0
  123. wandb/integration/sagemaker/auth.py +28 -0
  124. wandb/integration/sagemaker/config.py +49 -0
  125. wandb/integration/sagemaker/files.py +3 -0
  126. wandb/integration/sagemaker/resources.py +34 -0
  127. wandb/integration/sb3/__init__.py +3 -0
  128. wandb/integration/sb3/sb3.py +153 -0
  129. wandb/integration/tensorboard/__init__.py +10 -0
  130. wandb/integration/tensorboard/log.py +358 -0
  131. wandb/integration/tensorboard/monkeypatch.py +185 -0
  132. wandb/integration/tensorflow/__init__.py +5 -0
  133. wandb/integration/tensorflow/estimator_hook.py +54 -0
  134. wandb/integration/torch/__init__.py +0 -0
  135. wandb/integration/ultralytics/__init__.py +11 -0
  136. wandb/integration/ultralytics/bbox_utils.py +208 -0
  137. wandb/integration/ultralytics/callback.py +524 -0
  138. wandb/integration/ultralytics/classification_utils.py +83 -0
  139. wandb/integration/ultralytics/mask_utils.py +202 -0
  140. wandb/integration/ultralytics/pose_utils.py +104 -0
  141. wandb/integration/xgboost/__init__.py +11 -0
  142. wandb/integration/xgboost/xgboost.py +189 -0
  143. wandb/integration/yolov8/__init__.py +0 -0
  144. wandb/integration/yolov8/yolov8.py +284 -0
  145. wandb/jupyter.py +501 -0
  146. wandb/magic.py +3 -0
  147. wandb/mpmain/__init__.py +0 -0
  148. wandb/mpmain/__main__.py +1 -0
  149. wandb/old/__init__.py +0 -0
  150. wandb/old/core.py +131 -0
  151. wandb/old/settings.py +173 -0
  152. wandb/old/summary.py +435 -0
  153. wandb/plot/__init__.py +19 -0
  154. wandb/plot/bar.py +42 -0
  155. wandb/plot/confusion_matrix.py +99 -0
  156. wandb/plot/histogram.py +36 -0
  157. wandb/plot/line.py +40 -0
  158. wandb/plot/line_series.py +88 -0
  159. wandb/plot/pr_curve.py +136 -0
  160. wandb/plot/roc_curve.py +118 -0
  161. wandb/plot/scatter.py +32 -0
  162. wandb/plot/utils.py +183 -0
  163. wandb/proto/__init__.py +0 -0
  164. wandb/proto/v3/__init__.py +0 -0
  165. wandb/proto/v3/wandb_base_pb2.py +54 -0
  166. wandb/proto/v3/wandb_internal_pb2.py +1586 -0
  167. wandb/proto/v3/wandb_server_pb2.py +207 -0
  168. wandb/proto/v3/wandb_settings_pb2.py +111 -0
  169. wandb/proto/v3/wandb_telemetry_pb2.py +105 -0
  170. wandb/proto/v4/__init__.py +0 -0
  171. wandb/proto/v4/wandb_base_pb2.py +29 -0
  172. wandb/proto/v4/wandb_internal_pb2.py +354 -0
  173. wandb/proto/v4/wandb_server_pb2.py +62 -0
  174. wandb/proto/v4/wandb_settings_pb2.py +44 -0
  175. wandb/proto/v4/wandb_telemetry_pb2.py +40 -0
  176. wandb/proto/wandb_base_pb2.py +8 -0
  177. wandb/proto/wandb_deprecated.py +43 -0
  178. wandb/proto/wandb_internal_codegen.py +82 -0
  179. wandb/proto/wandb_internal_pb2.py +8 -0
  180. wandb/proto/wandb_server_pb2.py +8 -0
  181. wandb/proto/wandb_settings_pb2.py +8 -0
  182. wandb/proto/wandb_telemetry_pb2.py +8 -0
  183. wandb/py.typed +0 -0
  184. wandb/sdk/__init__.py +37 -0
  185. wandb/sdk/artifacts/__init__.py +0 -0
  186. wandb/sdk/artifacts/artifact.py +2320 -0
  187. wandb/sdk/artifacts/artifact_download_logger.py +43 -0
  188. wandb/sdk/artifacts/artifact_file_cache.py +229 -0
  189. wandb/sdk/artifacts/artifact_instance_cache.py +15 -0
  190. wandb/sdk/artifacts/artifact_manifest.py +72 -0
  191. wandb/sdk/artifacts/artifact_manifest_entry.py +208 -0
  192. wandb/sdk/artifacts/artifact_manifests/__init__.py +0 -0
  193. wandb/sdk/artifacts/artifact_manifests/artifact_manifest_v1.py +90 -0
  194. wandb/sdk/artifacts/artifact_saver.py +261 -0
  195. wandb/sdk/artifacts/artifact_state.py +11 -0
  196. wandb/sdk/artifacts/artifact_ttl.py +7 -0
  197. wandb/sdk/artifacts/exceptions.py +56 -0
  198. wandb/sdk/artifacts/staging.py +25 -0
  199. wandb/sdk/artifacts/storage_handler.py +60 -0
  200. wandb/sdk/artifacts/storage_handlers/__init__.py +0 -0
  201. wandb/sdk/artifacts/storage_handlers/azure_handler.py +194 -0
  202. wandb/sdk/artifacts/storage_handlers/gcs_handler.py +195 -0
  203. wandb/sdk/artifacts/storage_handlers/http_handler.py +113 -0
  204. wandb/sdk/artifacts/storage_handlers/local_file_handler.py +135 -0
  205. wandb/sdk/artifacts/storage_handlers/multi_handler.py +54 -0
  206. wandb/sdk/artifacts/storage_handlers/s3_handler.py +300 -0
  207. wandb/sdk/artifacts/storage_handlers/tracking_handler.py +68 -0
  208. wandb/sdk/artifacts/storage_handlers/wb_artifact_handler.py +133 -0
  209. wandb/sdk/artifacts/storage_handlers/wb_local_artifact_handler.py +72 -0
  210. wandb/sdk/artifacts/storage_layout.py +6 -0
  211. wandb/sdk/artifacts/storage_policies/__init__.py +4 -0
  212. wandb/sdk/artifacts/storage_policies/register.py +1 -0
  213. wandb/sdk/artifacts/storage_policies/wandb_storage_policy.py +371 -0
  214. wandb/sdk/artifacts/storage_policy.py +72 -0
  215. wandb/sdk/backend/__init__.py +0 -0
  216. wandb/sdk/backend/backend.py +240 -0
  217. wandb/sdk/data_types/__init__.py +0 -0
  218. wandb/sdk/data_types/_dtypes.py +911 -0
  219. wandb/sdk/data_types/_private.py +10 -0
  220. wandb/sdk/data_types/base_types/__init__.py +0 -0
  221. wandb/sdk/data_types/base_types/json_metadata.py +55 -0
  222. wandb/sdk/data_types/base_types/media.py +313 -0
  223. wandb/sdk/data_types/base_types/wb_value.py +274 -0
  224. wandb/sdk/data_types/helper_types/__init__.py +0 -0
  225. wandb/sdk/data_types/helper_types/bounding_boxes_2d.py +293 -0
  226. wandb/sdk/data_types/helper_types/classes.py +159 -0
  227. wandb/sdk/data_types/helper_types/image_mask.py +233 -0
  228. wandb/sdk/data_types/histogram.py +96 -0
  229. wandb/sdk/data_types/html.py +115 -0
  230. wandb/sdk/data_types/image.py +687 -0
  231. wandb/sdk/data_types/molecule.py +241 -0
  232. wandb/sdk/data_types/object_3d.py +363 -0
  233. wandb/sdk/data_types/plotly.py +82 -0
  234. wandb/sdk/data_types/saved_model.py +444 -0
  235. wandb/sdk/data_types/trace_tree.py +438 -0
  236. wandb/sdk/data_types/utils.py +180 -0
  237. wandb/sdk/data_types/video.py +245 -0
  238. wandb/sdk/integration_utils/__init__.py +0 -0
  239. wandb/sdk/integration_utils/auto_logging.py +239 -0
  240. wandb/sdk/integration_utils/data_logging.py +475 -0
  241. wandb/sdk/interface/__init__.py +0 -0
  242. wandb/sdk/interface/constants.py +4 -0
  243. wandb/sdk/interface/interface.py +962 -0
  244. wandb/sdk/interface/interface_queue.py +59 -0
  245. wandb/sdk/interface/interface_relay.py +53 -0
  246. wandb/sdk/interface/interface_shared.py +550 -0
  247. wandb/sdk/interface/interface_sock.py +61 -0
  248. wandb/sdk/interface/message_future.py +27 -0
  249. wandb/sdk/interface/message_future_poll.py +50 -0
  250. wandb/sdk/interface/router.py +118 -0
  251. wandb/sdk/interface/router_queue.py +44 -0
  252. wandb/sdk/interface/router_relay.py +39 -0
  253. wandb/sdk/interface/router_sock.py +36 -0
  254. wandb/sdk/interface/summary_record.py +67 -0
  255. wandb/sdk/internal/__init__.py +0 -0
  256. wandb/sdk/internal/context.py +89 -0
  257. wandb/sdk/internal/datastore.py +297 -0
  258. wandb/sdk/internal/file_pusher.py +181 -0
  259. wandb/sdk/internal/file_stream.py +695 -0
  260. wandb/sdk/internal/flow_control.py +263 -0
  261. wandb/sdk/internal/handler.py +909 -0
  262. wandb/sdk/internal/internal.py +417 -0
  263. wandb/sdk/internal/internal_api.py +4074 -0
  264. wandb/sdk/internal/internal_util.py +100 -0
  265. wandb/sdk/internal/job_builder.py +667 -0
  266. wandb/sdk/internal/profiler.py +78 -0
  267. wandb/sdk/internal/progress.py +83 -0
  268. wandb/sdk/internal/run.py +25 -0
  269. wandb/sdk/internal/sample.py +70 -0
  270. wandb/sdk/internal/sender.py +1641 -0
  271. wandb/sdk/internal/sender_config.py +197 -0
  272. wandb/sdk/internal/settings_static.py +83 -0
  273. wandb/sdk/internal/system/__init__.py +0 -0
  274. wandb/sdk/internal/system/assets/__init__.py +27 -0
  275. wandb/sdk/internal/system/assets/aggregators.py +37 -0
  276. wandb/sdk/internal/system/assets/asset_registry.py +20 -0
  277. wandb/sdk/internal/system/assets/cpu.py +163 -0
  278. wandb/sdk/internal/system/assets/disk.py +210 -0
  279. wandb/sdk/internal/system/assets/gpu.py +414 -0
  280. wandb/sdk/internal/system/assets/gpu_amd.py +230 -0
  281. wandb/sdk/internal/system/assets/gpu_apple.py +177 -0
  282. wandb/sdk/internal/system/assets/interfaces.py +207 -0
  283. wandb/sdk/internal/system/assets/ipu.py +177 -0
  284. wandb/sdk/internal/system/assets/memory.py +166 -0
  285. wandb/sdk/internal/system/assets/network.py +125 -0
  286. wandb/sdk/internal/system/assets/open_metrics.py +299 -0
  287. wandb/sdk/internal/system/assets/tpu.py +154 -0
  288. wandb/sdk/internal/system/assets/trainium.py +398 -0
  289. wandb/sdk/internal/system/env_probe_helpers.py +13 -0
  290. wandb/sdk/internal/system/system_info.py +247 -0
  291. wandb/sdk/internal/system/system_monitor.py +229 -0
  292. wandb/sdk/internal/tb_watcher.py +518 -0
  293. wandb/sdk/internal/thread_local_settings.py +18 -0
  294. wandb/sdk/internal/update.py +113 -0
  295. wandb/sdk/internal/writer.py +206 -0
  296. wandb/sdk/launch/__init__.py +14 -0
  297. wandb/sdk/launch/_launch.py +328 -0
  298. wandb/sdk/launch/_launch_add.py +255 -0
  299. wandb/sdk/launch/_project_spec.py +538 -0
  300. wandb/sdk/launch/agent/__init__.py +5 -0
  301. wandb/sdk/launch/agent/agent.py +901 -0
  302. wandb/sdk/launch/agent/config.py +296 -0
  303. wandb/sdk/launch/agent/job_status_tracker.py +53 -0
  304. wandb/sdk/launch/agent/run_queue_item_file_saver.py +47 -0
  305. wandb/sdk/launch/builder/__init__.py +0 -0
  306. wandb/sdk/launch/builder/abstract.py +156 -0
  307. wandb/sdk/launch/builder/build.py +280 -0
  308. wandb/sdk/launch/builder/context_manager.py +235 -0
  309. wandb/sdk/launch/builder/docker_builder.py +177 -0
  310. wandb/sdk/launch/builder/kaniko_builder.py +566 -0
  311. wandb/sdk/launch/builder/noop.py +58 -0
  312. wandb/sdk/launch/builder/templates/_wandb_bootstrap.py +187 -0
  313. wandb/sdk/launch/builder/templates/dockerfile.py +92 -0
  314. wandb/sdk/launch/create_job.py +512 -0
  315. wandb/sdk/launch/environment/abstract.py +29 -0
  316. wandb/sdk/launch/environment/aws_environment.py +297 -0
  317. wandb/sdk/launch/environment/azure_environment.py +105 -0
  318. wandb/sdk/launch/environment/gcp_environment.py +335 -0
  319. wandb/sdk/launch/environment/local_environment.py +66 -0
  320. wandb/sdk/launch/errors.py +19 -0
  321. wandb/sdk/launch/git_reference.py +109 -0
  322. wandb/sdk/launch/inputs/files.py +148 -0
  323. wandb/sdk/launch/inputs/internal.py +217 -0
  324. wandb/sdk/launch/inputs/manage.py +95 -0
  325. wandb/sdk/launch/loader.py +249 -0
  326. wandb/sdk/launch/registry/abstract.py +48 -0
  327. wandb/sdk/launch/registry/anon.py +29 -0
  328. wandb/sdk/launch/registry/azure_container_registry.py +124 -0
  329. wandb/sdk/launch/registry/elastic_container_registry.py +192 -0
  330. wandb/sdk/launch/registry/google_artifact_registry.py +219 -0
  331. wandb/sdk/launch/registry/local_registry.py +67 -0
  332. wandb/sdk/launch/runner/__init__.py +0 -0
  333. wandb/sdk/launch/runner/abstract.py +195 -0
  334. wandb/sdk/launch/runner/kubernetes_monitor.py +441 -0
  335. wandb/sdk/launch/runner/kubernetes_runner.py +891 -0
  336. wandb/sdk/launch/runner/local_container.py +298 -0
  337. wandb/sdk/launch/runner/local_process.py +78 -0
  338. wandb/sdk/launch/runner/sagemaker_runner.py +422 -0
  339. wandb/sdk/launch/runner/vertex_runner.py +230 -0
  340. wandb/sdk/launch/sweeps/__init__.py +39 -0
  341. wandb/sdk/launch/sweeps/scheduler.py +738 -0
  342. wandb/sdk/launch/sweeps/scheduler_sweep.py +91 -0
  343. wandb/sdk/launch/sweeps/utils.py +316 -0
  344. wandb/sdk/launch/utils.py +741 -0
  345. wandb/sdk/launch/wandb_reference.py +138 -0
  346. wandb/sdk/lib/__init__.py +5 -0
  347. wandb/sdk/lib/_settings_toposort_generate.py +159 -0
  348. wandb/sdk/lib/_settings_toposort_generated.py +239 -0
  349. wandb/sdk/lib/_wburls_generate.py +25 -0
  350. wandb/sdk/lib/_wburls_generated.py +22 -0
  351. wandb/sdk/lib/apikey.py +258 -0
  352. wandb/sdk/lib/capped_dict.py +26 -0
  353. wandb/sdk/lib/config_util.py +101 -0
  354. wandb/sdk/lib/console.py +39 -0
  355. wandb/sdk/lib/deprecate.py +42 -0
  356. wandb/sdk/lib/disabled.py +190 -0
  357. wandb/sdk/lib/exit_hooks.py +54 -0
  358. wandb/sdk/lib/file_stream_utils.py +118 -0
  359. wandb/sdk/lib/filenames.py +64 -0
  360. wandb/sdk/lib/filesystem.py +372 -0
  361. wandb/sdk/lib/fsm.py +174 -0
  362. wandb/sdk/lib/gitlib.py +239 -0
  363. wandb/sdk/lib/gql_request.py +65 -0
  364. wandb/sdk/lib/handler_util.py +21 -0
  365. wandb/sdk/lib/hashutil.py +62 -0
  366. wandb/sdk/lib/import_hooks.py +275 -0
  367. wandb/sdk/lib/ipython.py +146 -0
  368. wandb/sdk/lib/json_util.py +80 -0
  369. wandb/sdk/lib/lazyloader.py +63 -0
  370. wandb/sdk/lib/mailbox.py +460 -0
  371. wandb/sdk/lib/module.py +69 -0
  372. wandb/sdk/lib/paths.py +106 -0
  373. wandb/sdk/lib/preinit.py +42 -0
  374. wandb/sdk/lib/printer.py +313 -0
  375. wandb/sdk/lib/proto_util.py +90 -0
  376. wandb/sdk/lib/redirect.py +845 -0
  377. wandb/sdk/lib/reporting.py +99 -0
  378. wandb/sdk/lib/retry.py +289 -0
  379. wandb/sdk/lib/run_moment.py +78 -0
  380. wandb/sdk/lib/runid.py +12 -0
  381. wandb/sdk/lib/server.py +52 -0
  382. wandb/sdk/lib/sock_client.py +291 -0
  383. wandb/sdk/lib/sparkline.py +45 -0
  384. wandb/sdk/lib/telemetry.py +100 -0
  385. wandb/sdk/lib/timed_input.py +133 -0
  386. wandb/sdk/lib/timer.py +19 -0
  387. wandb/sdk/lib/tracelog.py +255 -0
  388. wandb/sdk/lib/wburls.py +46 -0
  389. wandb/sdk/service/__init__.py +0 -0
  390. wandb/sdk/service/_startup_debug.py +22 -0
  391. wandb/sdk/service/port_file.py +53 -0
  392. wandb/sdk/service/server.py +119 -0
  393. wandb/sdk/service/server_sock.py +276 -0
  394. wandb/sdk/service/service.py +267 -0
  395. wandb/sdk/service/service_base.py +50 -0
  396. wandb/sdk/service/service_sock.py +70 -0
  397. wandb/sdk/service/streams.py +426 -0
  398. wandb/sdk/verify/__init__.py +0 -0
  399. wandb/sdk/verify/verify.py +501 -0
  400. wandb/sdk/wandb_alerts.py +12 -0
  401. wandb/sdk/wandb_config.py +319 -0
  402. wandb/sdk/wandb_helper.py +54 -0
  403. wandb/sdk/wandb_init.py +1179 -0
  404. wandb/sdk/wandb_login.py +339 -0
  405. wandb/sdk/wandb_manager.py +222 -0
  406. wandb/sdk/wandb_metric.py +110 -0
  407. wandb/sdk/wandb_require.py +92 -0
  408. wandb/sdk/wandb_require_helpers.py +44 -0
  409. wandb/sdk/wandb_run.py +4247 -0
  410. wandb/sdk/wandb_settings.py +1926 -0
  411. wandb/sdk/wandb_setup.py +335 -0
  412. wandb/sdk/wandb_summary.py +150 -0
  413. wandb/sdk/wandb_sweep.py +114 -0
  414. wandb/sdk/wandb_sync.py +75 -0
  415. wandb/sdk/wandb_watch.py +128 -0
  416. wandb/sklearn/__init__.py +37 -0
  417. wandb/sklearn/calculate/__init__.py +32 -0
  418. wandb/sklearn/calculate/calibration_curves.py +125 -0
  419. wandb/sklearn/calculate/class_proportions.py +68 -0
  420. wandb/sklearn/calculate/confusion_matrix.py +92 -0
  421. wandb/sklearn/calculate/decision_boundaries.py +40 -0
  422. wandb/sklearn/calculate/elbow_curve.py +55 -0
  423. wandb/sklearn/calculate/feature_importances.py +67 -0
  424. wandb/sklearn/calculate/learning_curve.py +64 -0
  425. wandb/sklearn/calculate/outlier_candidates.py +69 -0
  426. wandb/sklearn/calculate/residuals.py +86 -0
  427. wandb/sklearn/calculate/silhouette.py +118 -0
  428. wandb/sklearn/calculate/summary_metrics.py +62 -0
  429. wandb/sklearn/plot/__init__.py +35 -0
  430. wandb/sklearn/plot/classifier.py +329 -0
  431. wandb/sklearn/plot/clusterer.py +142 -0
  432. wandb/sklearn/plot/regressor.py +121 -0
  433. wandb/sklearn/plot/shared.py +91 -0
  434. wandb/sklearn/utils.py +183 -0
  435. wandb/sync/__init__.py +3 -0
  436. wandb/sync/sync.py +443 -0
  437. wandb/testing/relay.py +859 -0
  438. wandb/trigger.py +29 -0
  439. wandb/util.py +1915 -0
  440. wandb/vendor/__init__.py +0 -0
  441. wandb/vendor/gql-0.2.0/setup.py +40 -0
  442. wandb/vendor/gql-0.2.0/tests/__init__.py +0 -0
  443. wandb/vendor/gql-0.2.0/tests/starwars/__init__.py +0 -0
  444. wandb/vendor/gql-0.2.0/tests/starwars/fixtures.py +96 -0
  445. wandb/vendor/gql-0.2.0/tests/starwars/schema.py +146 -0
  446. wandb/vendor/gql-0.2.0/tests/starwars/test_dsl.py +293 -0
  447. wandb/vendor/gql-0.2.0/tests/starwars/test_query.py +355 -0
  448. wandb/vendor/gql-0.2.0/tests/starwars/test_validation.py +171 -0
  449. wandb/vendor/gql-0.2.0/tests/test_client.py +31 -0
  450. wandb/vendor/gql-0.2.0/tests/test_transport.py +89 -0
  451. wandb/vendor/gql-0.2.0/wandb_gql/__init__.py +4 -0
  452. wandb/vendor/gql-0.2.0/wandb_gql/client.py +75 -0
  453. wandb/vendor/gql-0.2.0/wandb_gql/dsl.py +152 -0
  454. wandb/vendor/gql-0.2.0/wandb_gql/gql.py +10 -0
  455. wandb/vendor/gql-0.2.0/wandb_gql/transport/__init__.py +0 -0
  456. wandb/vendor/gql-0.2.0/wandb_gql/transport/http.py +6 -0
  457. wandb/vendor/gql-0.2.0/wandb_gql/transport/local_schema.py +15 -0
  458. wandb/vendor/gql-0.2.0/wandb_gql/transport/requests.py +46 -0
  459. wandb/vendor/gql-0.2.0/wandb_gql/utils.py +21 -0
  460. wandb/vendor/graphql-core-1.1/setup.py +86 -0
  461. wandb/vendor/graphql-core-1.1/wandb_graphql/__init__.py +287 -0
  462. wandb/vendor/graphql-core-1.1/wandb_graphql/error/__init__.py +6 -0
  463. wandb/vendor/graphql-core-1.1/wandb_graphql/error/base.py +42 -0
  464. wandb/vendor/graphql-core-1.1/wandb_graphql/error/format_error.py +11 -0
  465. wandb/vendor/graphql-core-1.1/wandb_graphql/error/located_error.py +29 -0
  466. wandb/vendor/graphql-core-1.1/wandb_graphql/error/syntax_error.py +36 -0
  467. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/__init__.py +26 -0
  468. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/base.py +311 -0
  469. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/executor.py +398 -0
  470. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/executors/__init__.py +0 -0
  471. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/executors/asyncio.py +53 -0
  472. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/executors/gevent.py +22 -0
  473. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/executors/process.py +32 -0
  474. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/executors/sync.py +7 -0
  475. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/executors/thread.py +35 -0
  476. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/executors/utils.py +6 -0
  477. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/experimental/__init__.py +0 -0
  478. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/experimental/executor.py +66 -0
  479. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/experimental/fragment.py +252 -0
  480. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/experimental/resolver.py +151 -0
  481. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/experimental/utils.py +7 -0
  482. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/middleware.py +57 -0
  483. wandb/vendor/graphql-core-1.1/wandb_graphql/execution/values.py +145 -0
  484. wandb/vendor/graphql-core-1.1/wandb_graphql/graphql.py +60 -0
  485. wandb/vendor/graphql-core-1.1/wandb_graphql/language/__init__.py +0 -0
  486. wandb/vendor/graphql-core-1.1/wandb_graphql/language/ast.py +1349 -0
  487. wandb/vendor/graphql-core-1.1/wandb_graphql/language/base.py +19 -0
  488. wandb/vendor/graphql-core-1.1/wandb_graphql/language/lexer.py +435 -0
  489. wandb/vendor/graphql-core-1.1/wandb_graphql/language/location.py +30 -0
  490. wandb/vendor/graphql-core-1.1/wandb_graphql/language/parser.py +779 -0
  491. wandb/vendor/graphql-core-1.1/wandb_graphql/language/printer.py +193 -0
  492. wandb/vendor/graphql-core-1.1/wandb_graphql/language/source.py +18 -0
  493. wandb/vendor/graphql-core-1.1/wandb_graphql/language/visitor.py +222 -0
  494. wandb/vendor/graphql-core-1.1/wandb_graphql/language/visitor_meta.py +82 -0
  495. wandb/vendor/graphql-core-1.1/wandb_graphql/pyutils/__init__.py +0 -0
  496. wandb/vendor/graphql-core-1.1/wandb_graphql/pyutils/cached_property.py +17 -0
  497. wandb/vendor/graphql-core-1.1/wandb_graphql/pyutils/contain_subset.py +28 -0
  498. wandb/vendor/graphql-core-1.1/wandb_graphql/pyutils/default_ordered_dict.py +40 -0
  499. wandb/vendor/graphql-core-1.1/wandb_graphql/pyutils/ordereddict.py +8 -0
  500. wandb/vendor/graphql-core-1.1/wandb_graphql/pyutils/pair_set.py +43 -0
  501. wandb/vendor/graphql-core-1.1/wandb_graphql/pyutils/version.py +78 -0
  502. wandb/vendor/graphql-core-1.1/wandb_graphql/type/__init__.py +67 -0
  503. wandb/vendor/graphql-core-1.1/wandb_graphql/type/definition.py +619 -0
  504. wandb/vendor/graphql-core-1.1/wandb_graphql/type/directives.py +132 -0
  505. wandb/vendor/graphql-core-1.1/wandb_graphql/type/introspection.py +440 -0
  506. wandb/vendor/graphql-core-1.1/wandb_graphql/type/scalars.py +131 -0
  507. wandb/vendor/graphql-core-1.1/wandb_graphql/type/schema.py +100 -0
  508. wandb/vendor/graphql-core-1.1/wandb_graphql/type/typemap.py +145 -0
  509. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/__init__.py +0 -0
  510. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/assert_valid_name.py +9 -0
  511. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/ast_from_value.py +65 -0
  512. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/ast_to_code.py +49 -0
  513. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/ast_to_dict.py +24 -0
  514. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/base.py +75 -0
  515. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/build_ast_schema.py +291 -0
  516. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/build_client_schema.py +250 -0
  517. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/concat_ast.py +9 -0
  518. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/extend_schema.py +357 -0
  519. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/get_field_def.py +27 -0
  520. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/get_operation_ast.py +21 -0
  521. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/introspection_query.py +90 -0
  522. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/is_valid_literal_value.py +67 -0
  523. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/is_valid_value.py +66 -0
  524. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/quoted_or_list.py +21 -0
  525. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/schema_printer.py +168 -0
  526. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/suggestion_list.py +56 -0
  527. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/type_comparators.py +69 -0
  528. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/type_from_ast.py +21 -0
  529. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/type_info.py +149 -0
  530. wandb/vendor/graphql-core-1.1/wandb_graphql/utils/value_from_ast.py +69 -0
  531. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/__init__.py +4 -0
  532. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/__init__.py +79 -0
  533. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/arguments_of_correct_type.py +24 -0
  534. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/base.py +8 -0
  535. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/default_values_of_correct_type.py +44 -0
  536. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/fields_on_correct_type.py +113 -0
  537. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/fragments_on_composite_types.py +33 -0
  538. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/known_argument_names.py +70 -0
  539. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/known_directives.py +97 -0
  540. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/known_fragment_names.py +19 -0
  541. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/known_type_names.py +43 -0
  542. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/lone_anonymous_operation.py +23 -0
  543. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/no_fragment_cycles.py +59 -0
  544. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/no_undefined_variables.py +36 -0
  545. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/no_unused_fragments.py +38 -0
  546. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/no_unused_variables.py +37 -0
  547. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/overlapping_fields_can_be_merged.py +529 -0
  548. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/possible_fragment_spreads.py +44 -0
  549. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/provided_non_null_arguments.py +46 -0
  550. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/scalar_leafs.py +33 -0
  551. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/unique_argument_names.py +32 -0
  552. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/unique_fragment_names.py +28 -0
  553. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/unique_input_field_names.py +33 -0
  554. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/unique_operation_names.py +31 -0
  555. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/unique_variable_names.py +27 -0
  556. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/variables_are_input_types.py +21 -0
  557. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/rules/variables_in_allowed_position.py +53 -0
  558. wandb/vendor/graphql-core-1.1/wandb_graphql/validation/validation.py +158 -0
  559. wandb/vendor/promise-2.3.0/conftest.py +30 -0
  560. wandb/vendor/promise-2.3.0/setup.py +64 -0
  561. wandb/vendor/promise-2.3.0/tests/__init__.py +0 -0
  562. wandb/vendor/promise-2.3.0/tests/conftest.py +8 -0
  563. wandb/vendor/promise-2.3.0/tests/test_awaitable.py +32 -0
  564. wandb/vendor/promise-2.3.0/tests/test_awaitable_35.py +47 -0
  565. wandb/vendor/promise-2.3.0/tests/test_benchmark.py +116 -0
  566. wandb/vendor/promise-2.3.0/tests/test_complex_threads.py +23 -0
  567. wandb/vendor/promise-2.3.0/tests/test_dataloader.py +452 -0
  568. wandb/vendor/promise-2.3.0/tests/test_dataloader_awaitable_35.py +99 -0
  569. wandb/vendor/promise-2.3.0/tests/test_dataloader_extra.py +65 -0
  570. wandb/vendor/promise-2.3.0/tests/test_extra.py +670 -0
  571. wandb/vendor/promise-2.3.0/tests/test_issues.py +132 -0
  572. wandb/vendor/promise-2.3.0/tests/test_promise_list.py +70 -0
  573. wandb/vendor/promise-2.3.0/tests/test_spec.py +584 -0
  574. wandb/vendor/promise-2.3.0/tests/test_thread_safety.py +115 -0
  575. wandb/vendor/promise-2.3.0/tests/utils.py +3 -0
  576. wandb/vendor/promise-2.3.0/wandb_promise/__init__.py +38 -0
  577. wandb/vendor/promise-2.3.0/wandb_promise/async_.py +135 -0
  578. wandb/vendor/promise-2.3.0/wandb_promise/compat.py +32 -0
  579. wandb/vendor/promise-2.3.0/wandb_promise/dataloader.py +326 -0
  580. wandb/vendor/promise-2.3.0/wandb_promise/iterate_promise.py +12 -0
  581. wandb/vendor/promise-2.3.0/wandb_promise/promise.py +848 -0
  582. wandb/vendor/promise-2.3.0/wandb_promise/promise_list.py +151 -0
  583. wandb/vendor/promise-2.3.0/wandb_promise/pyutils/__init__.py +0 -0
  584. wandb/vendor/promise-2.3.0/wandb_promise/pyutils/version.py +83 -0
  585. wandb/vendor/promise-2.3.0/wandb_promise/schedulers/__init__.py +0 -0
  586. wandb/vendor/promise-2.3.0/wandb_promise/schedulers/asyncio.py +22 -0
  587. wandb/vendor/promise-2.3.0/wandb_promise/schedulers/gevent.py +21 -0
  588. wandb/vendor/promise-2.3.0/wandb_promise/schedulers/immediate.py +27 -0
  589. wandb/vendor/promise-2.3.0/wandb_promise/schedulers/thread.py +18 -0
  590. wandb/vendor/promise-2.3.0/wandb_promise/utils.py +56 -0
  591. wandb/vendor/pygments/__init__.py +90 -0
  592. wandb/vendor/pygments/cmdline.py +568 -0
  593. wandb/vendor/pygments/console.py +74 -0
  594. wandb/vendor/pygments/filter.py +74 -0
  595. wandb/vendor/pygments/filters/__init__.py +350 -0
  596. wandb/vendor/pygments/formatter.py +95 -0
  597. wandb/vendor/pygments/formatters/__init__.py +153 -0
  598. wandb/vendor/pygments/formatters/_mapping.py +85 -0
  599. wandb/vendor/pygments/formatters/bbcode.py +109 -0
  600. wandb/vendor/pygments/formatters/html.py +851 -0
  601. wandb/vendor/pygments/formatters/img.py +600 -0
  602. wandb/vendor/pygments/formatters/irc.py +182 -0
  603. wandb/vendor/pygments/formatters/latex.py +482 -0
  604. wandb/vendor/pygments/formatters/other.py +160 -0
  605. wandb/vendor/pygments/formatters/rtf.py +147 -0
  606. wandb/vendor/pygments/formatters/svg.py +153 -0
  607. wandb/vendor/pygments/formatters/terminal.py +136 -0
  608. wandb/vendor/pygments/formatters/terminal256.py +309 -0
  609. wandb/vendor/pygments/lexer.py +871 -0
  610. wandb/vendor/pygments/lexers/__init__.py +329 -0
  611. wandb/vendor/pygments/lexers/_asy_builtins.py +1645 -0
  612. wandb/vendor/pygments/lexers/_cl_builtins.py +232 -0
  613. wandb/vendor/pygments/lexers/_cocoa_builtins.py +72 -0
  614. wandb/vendor/pygments/lexers/_csound_builtins.py +1346 -0
  615. wandb/vendor/pygments/lexers/_lasso_builtins.py +5327 -0
  616. wandb/vendor/pygments/lexers/_lua_builtins.py +295 -0
  617. wandb/vendor/pygments/lexers/_mapping.py +500 -0
  618. wandb/vendor/pygments/lexers/_mql_builtins.py +1172 -0
  619. wandb/vendor/pygments/lexers/_openedge_builtins.py +2547 -0
  620. wandb/vendor/pygments/lexers/_php_builtins.py +4756 -0
  621. wandb/vendor/pygments/lexers/_postgres_builtins.py +621 -0
  622. wandb/vendor/pygments/lexers/_scilab_builtins.py +3094 -0
  623. wandb/vendor/pygments/lexers/_sourcemod_builtins.py +1163 -0
  624. wandb/vendor/pygments/lexers/_stan_builtins.py +532 -0
  625. wandb/vendor/pygments/lexers/_stata_builtins.py +419 -0
  626. wandb/vendor/pygments/lexers/_tsql_builtins.py +1004 -0
  627. wandb/vendor/pygments/lexers/_vim_builtins.py +1939 -0
  628. wandb/vendor/pygments/lexers/actionscript.py +240 -0
  629. wandb/vendor/pygments/lexers/agile.py +24 -0
  630. wandb/vendor/pygments/lexers/algebra.py +221 -0
  631. wandb/vendor/pygments/lexers/ambient.py +76 -0
  632. wandb/vendor/pygments/lexers/ampl.py +87 -0
  633. wandb/vendor/pygments/lexers/apl.py +101 -0
  634. wandb/vendor/pygments/lexers/archetype.py +318 -0
  635. wandb/vendor/pygments/lexers/asm.py +641 -0
  636. wandb/vendor/pygments/lexers/automation.py +374 -0
  637. wandb/vendor/pygments/lexers/basic.py +500 -0
  638. wandb/vendor/pygments/lexers/bibtex.py +160 -0
  639. wandb/vendor/pygments/lexers/business.py +612 -0
  640. wandb/vendor/pygments/lexers/c_cpp.py +252 -0
  641. wandb/vendor/pygments/lexers/c_like.py +541 -0
  642. wandb/vendor/pygments/lexers/capnproto.py +78 -0
  643. wandb/vendor/pygments/lexers/chapel.py +102 -0
  644. wandb/vendor/pygments/lexers/clean.py +288 -0
  645. wandb/vendor/pygments/lexers/compiled.py +34 -0
  646. wandb/vendor/pygments/lexers/configs.py +833 -0
  647. wandb/vendor/pygments/lexers/console.py +114 -0
  648. wandb/vendor/pygments/lexers/crystal.py +393 -0
  649. wandb/vendor/pygments/lexers/csound.py +366 -0
  650. wandb/vendor/pygments/lexers/css.py +689 -0
  651. wandb/vendor/pygments/lexers/d.py +251 -0
  652. wandb/vendor/pygments/lexers/dalvik.py +125 -0
  653. wandb/vendor/pygments/lexers/data.py +555 -0
  654. wandb/vendor/pygments/lexers/diff.py +165 -0
  655. wandb/vendor/pygments/lexers/dotnet.py +691 -0
  656. wandb/vendor/pygments/lexers/dsls.py +878 -0
  657. wandb/vendor/pygments/lexers/dylan.py +289 -0
  658. wandb/vendor/pygments/lexers/ecl.py +125 -0
  659. wandb/vendor/pygments/lexers/eiffel.py +65 -0
  660. wandb/vendor/pygments/lexers/elm.py +121 -0
  661. wandb/vendor/pygments/lexers/erlang.py +533 -0
  662. wandb/vendor/pygments/lexers/esoteric.py +277 -0
  663. wandb/vendor/pygments/lexers/ezhil.py +69 -0
  664. wandb/vendor/pygments/lexers/factor.py +344 -0
  665. wandb/vendor/pygments/lexers/fantom.py +250 -0
  666. wandb/vendor/pygments/lexers/felix.py +273 -0
  667. wandb/vendor/pygments/lexers/forth.py +177 -0
  668. wandb/vendor/pygments/lexers/fortran.py +205 -0
  669. wandb/vendor/pygments/lexers/foxpro.py +428 -0
  670. wandb/vendor/pygments/lexers/functional.py +21 -0
  671. wandb/vendor/pygments/lexers/go.py +101 -0
  672. wandb/vendor/pygments/lexers/grammar_notation.py +213 -0
  673. wandb/vendor/pygments/lexers/graph.py +80 -0
  674. wandb/vendor/pygments/lexers/graphics.py +553 -0
  675. wandb/vendor/pygments/lexers/haskell.py +843 -0
  676. wandb/vendor/pygments/lexers/haxe.py +936 -0
  677. wandb/vendor/pygments/lexers/hdl.py +382 -0
  678. wandb/vendor/pygments/lexers/hexdump.py +103 -0
  679. wandb/vendor/pygments/lexers/html.py +602 -0
  680. wandb/vendor/pygments/lexers/idl.py +270 -0
  681. wandb/vendor/pygments/lexers/igor.py +288 -0
  682. wandb/vendor/pygments/lexers/inferno.py +96 -0
  683. wandb/vendor/pygments/lexers/installers.py +322 -0
  684. wandb/vendor/pygments/lexers/int_fiction.py +1343 -0
  685. wandb/vendor/pygments/lexers/iolang.py +63 -0
  686. wandb/vendor/pygments/lexers/j.py +146 -0
  687. wandb/vendor/pygments/lexers/javascript.py +1525 -0
  688. wandb/vendor/pygments/lexers/julia.py +333 -0
  689. wandb/vendor/pygments/lexers/jvm.py +1573 -0
  690. wandb/vendor/pygments/lexers/lisp.py +2621 -0
  691. wandb/vendor/pygments/lexers/make.py +202 -0
  692. wandb/vendor/pygments/lexers/markup.py +595 -0
  693. wandb/vendor/pygments/lexers/math.py +21 -0
  694. wandb/vendor/pygments/lexers/matlab.py +663 -0
  695. wandb/vendor/pygments/lexers/ml.py +769 -0
  696. wandb/vendor/pygments/lexers/modeling.py +358 -0
  697. wandb/vendor/pygments/lexers/modula2.py +1561 -0
  698. wandb/vendor/pygments/lexers/monte.py +204 -0
  699. wandb/vendor/pygments/lexers/ncl.py +894 -0
  700. wandb/vendor/pygments/lexers/nimrod.py +159 -0
  701. wandb/vendor/pygments/lexers/nit.py +64 -0
  702. wandb/vendor/pygments/lexers/nix.py +136 -0
  703. wandb/vendor/pygments/lexers/oberon.py +105 -0
  704. wandb/vendor/pygments/lexers/objective.py +504 -0
  705. wandb/vendor/pygments/lexers/ooc.py +85 -0
  706. wandb/vendor/pygments/lexers/other.py +41 -0
  707. wandb/vendor/pygments/lexers/parasail.py +79 -0
  708. wandb/vendor/pygments/lexers/parsers.py +835 -0
  709. wandb/vendor/pygments/lexers/pascal.py +644 -0
  710. wandb/vendor/pygments/lexers/pawn.py +199 -0
  711. wandb/vendor/pygments/lexers/perl.py +620 -0
  712. wandb/vendor/pygments/lexers/php.py +267 -0
  713. wandb/vendor/pygments/lexers/praat.py +294 -0
  714. wandb/vendor/pygments/lexers/prolog.py +306 -0
  715. wandb/vendor/pygments/lexers/python.py +939 -0
  716. wandb/vendor/pygments/lexers/qvt.py +152 -0
  717. wandb/vendor/pygments/lexers/r.py +453 -0
  718. wandb/vendor/pygments/lexers/rdf.py +270 -0
  719. wandb/vendor/pygments/lexers/rebol.py +431 -0
  720. wandb/vendor/pygments/lexers/resource.py +85 -0
  721. wandb/vendor/pygments/lexers/rnc.py +67 -0
  722. wandb/vendor/pygments/lexers/roboconf.py +82 -0
  723. wandb/vendor/pygments/lexers/robotframework.py +560 -0
  724. wandb/vendor/pygments/lexers/ruby.py +519 -0
  725. wandb/vendor/pygments/lexers/rust.py +220 -0
  726. wandb/vendor/pygments/lexers/sas.py +228 -0
  727. wandb/vendor/pygments/lexers/scripting.py +1222 -0
  728. wandb/vendor/pygments/lexers/shell.py +794 -0
  729. wandb/vendor/pygments/lexers/smalltalk.py +195 -0
  730. wandb/vendor/pygments/lexers/smv.py +79 -0
  731. wandb/vendor/pygments/lexers/snobol.py +83 -0
  732. wandb/vendor/pygments/lexers/special.py +103 -0
  733. wandb/vendor/pygments/lexers/sql.py +681 -0
  734. wandb/vendor/pygments/lexers/stata.py +108 -0
  735. wandb/vendor/pygments/lexers/supercollider.py +90 -0
  736. wandb/vendor/pygments/lexers/tcl.py +145 -0
  737. wandb/vendor/pygments/lexers/templates.py +2283 -0
  738. wandb/vendor/pygments/lexers/testing.py +207 -0
  739. wandb/vendor/pygments/lexers/text.py +25 -0
  740. wandb/vendor/pygments/lexers/textedit.py +169 -0
  741. wandb/vendor/pygments/lexers/textfmts.py +297 -0
  742. wandb/vendor/pygments/lexers/theorem.py +458 -0
  743. wandb/vendor/pygments/lexers/trafficscript.py +54 -0
  744. wandb/vendor/pygments/lexers/typoscript.py +226 -0
  745. wandb/vendor/pygments/lexers/urbi.py +133 -0
  746. wandb/vendor/pygments/lexers/varnish.py +190 -0
  747. wandb/vendor/pygments/lexers/verification.py +111 -0
  748. wandb/vendor/pygments/lexers/web.py +24 -0
  749. wandb/vendor/pygments/lexers/webmisc.py +988 -0
  750. wandb/vendor/pygments/lexers/whiley.py +116 -0
  751. wandb/vendor/pygments/lexers/x10.py +69 -0
  752. wandb/vendor/pygments/modeline.py +44 -0
  753. wandb/vendor/pygments/plugin.py +68 -0
  754. wandb/vendor/pygments/regexopt.py +92 -0
  755. wandb/vendor/pygments/scanner.py +105 -0
  756. wandb/vendor/pygments/sphinxext.py +158 -0
  757. wandb/vendor/pygments/style.py +155 -0
  758. wandb/vendor/pygments/styles/__init__.py +80 -0
  759. wandb/vendor/pygments/styles/abap.py +29 -0
  760. wandb/vendor/pygments/styles/algol.py +63 -0
  761. wandb/vendor/pygments/styles/algol_nu.py +63 -0
  762. wandb/vendor/pygments/styles/arduino.py +98 -0
  763. wandb/vendor/pygments/styles/autumn.py +65 -0
  764. wandb/vendor/pygments/styles/borland.py +51 -0
  765. wandb/vendor/pygments/styles/bw.py +49 -0
  766. wandb/vendor/pygments/styles/colorful.py +81 -0
  767. wandb/vendor/pygments/styles/default.py +73 -0
  768. wandb/vendor/pygments/styles/emacs.py +72 -0
  769. wandb/vendor/pygments/styles/friendly.py +72 -0
  770. wandb/vendor/pygments/styles/fruity.py +42 -0
  771. wandb/vendor/pygments/styles/igor.py +29 -0
  772. wandb/vendor/pygments/styles/lovelace.py +97 -0
  773. wandb/vendor/pygments/styles/manni.py +75 -0
  774. wandb/vendor/pygments/styles/monokai.py +106 -0
  775. wandb/vendor/pygments/styles/murphy.py +80 -0
  776. wandb/vendor/pygments/styles/native.py +65 -0
  777. wandb/vendor/pygments/styles/paraiso_dark.py +125 -0
  778. wandb/vendor/pygments/styles/paraiso_light.py +125 -0
  779. wandb/vendor/pygments/styles/pastie.py +75 -0
  780. wandb/vendor/pygments/styles/perldoc.py +69 -0
  781. wandb/vendor/pygments/styles/rainbow_dash.py +89 -0
  782. wandb/vendor/pygments/styles/rrt.py +33 -0
  783. wandb/vendor/pygments/styles/sas.py +44 -0
  784. wandb/vendor/pygments/styles/stata.py +40 -0
  785. wandb/vendor/pygments/styles/tango.py +141 -0
  786. wandb/vendor/pygments/styles/trac.py +63 -0
  787. wandb/vendor/pygments/styles/vim.py +63 -0
  788. wandb/vendor/pygments/styles/vs.py +38 -0
  789. wandb/vendor/pygments/styles/xcode.py +51 -0
  790. wandb/vendor/pygments/token.py +213 -0
  791. wandb/vendor/pygments/unistring.py +217 -0
  792. wandb/vendor/pygments/util.py +388 -0
  793. wandb/vendor/pynvml/__init__.py +0 -0
  794. wandb/vendor/pynvml/pynvml.py +4779 -0
  795. wandb/vendor/watchdog_0_9_0/wandb_watchdog/__init__.py +17 -0
  796. wandb/vendor/watchdog_0_9_0/wandb_watchdog/events.py +615 -0
  797. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/__init__.py +98 -0
  798. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/api.py +369 -0
  799. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/fsevents.py +172 -0
  800. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/fsevents2.py +239 -0
  801. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/inotify.py +218 -0
  802. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/inotify_buffer.py +81 -0
  803. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/inotify_c.py +575 -0
  804. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/kqueue.py +730 -0
  805. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/polling.py +145 -0
  806. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/read_directory_changes.py +133 -0
  807. wandb/vendor/watchdog_0_9_0/wandb_watchdog/observers/winapi.py +348 -0
  808. wandb/vendor/watchdog_0_9_0/wandb_watchdog/patterns.py +265 -0
  809. wandb/vendor/watchdog_0_9_0/wandb_watchdog/tricks/__init__.py +174 -0
  810. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/__init__.py +151 -0
  811. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/bricks.py +249 -0
  812. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/compat.py +29 -0
  813. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/decorators.py +198 -0
  814. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/delayed_queue.py +88 -0
  815. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/dirsnapshot.py +293 -0
  816. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/echo.py +157 -0
  817. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/event_backport.py +41 -0
  818. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/importlib2.py +40 -0
  819. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/platform.py +57 -0
  820. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/unicode_paths.py +64 -0
  821. wandb/vendor/watchdog_0_9_0/wandb_watchdog/utils/win32stat.py +123 -0
  822. wandb/vendor/watchdog_0_9_0/wandb_watchdog/version.py +28 -0
  823. wandb/vendor/watchdog_0_9_0/wandb_watchdog/watchmedo.py +577 -0
  824. wandb/viz.py +123 -0
  825. wandb/wandb_agent.py +586 -0
  826. wandb/wandb_controller.py +720 -0
  827. wandb/wandb_run.py +9 -0
  828. wandb/wandb_torch.py +550 -0
  829. wandb-0.17.0.dist-info/METADATA +217 -0
  830. wandb-0.17.0.dist-info/RECORD +833 -0
  831. wandb-0.17.0.dist-info/WHEEL +4 -0
  832. wandb-0.17.0.dist-info/entry_points.txt +3 -0
  833. wandb-0.17.0.dist-info/licenses/LICENSE +21 -0
@@ -0,0 +1,891 @@
1
+ """Implementation of KubernetesRunner class for wandb launch."""
2
+
3
+ import asyncio
4
+ import base64
5
+ import datetime
6
+ import json
7
+ import logging
8
+ import os
9
+ from typing import Any, Dict, Iterator, List, Optional, Tuple, Union
10
+
11
+ import yaml
12
+
13
+ import wandb
14
+ from wandb.apis.internal import Api
15
+ from wandb.sdk.launch.agent.agent import LaunchAgent
16
+ from wandb.sdk.launch.environment.abstract import AbstractEnvironment
17
+ from wandb.sdk.launch.registry.abstract import AbstractRegistry
18
+ from wandb.sdk.launch.registry.azure_container_registry import AzureContainerRegistry
19
+ from wandb.sdk.launch.registry.local_registry import LocalRegistry
20
+ from wandb.sdk.launch.runner.abstract import Status
21
+ from wandb.sdk.launch.runner.kubernetes_monitor import (
22
+ WANDB_K8S_LABEL_AGENT,
23
+ WANDB_K8S_LABEL_MONITOR,
24
+ WANDB_K8S_RUN_ID,
25
+ CustomResource,
26
+ LaunchKubernetesMonitor,
27
+ )
28
+ from wandb.sdk.lib.retry import ExponentialBackoff, retry_async
29
+ from wandb.util import get_module
30
+
31
+ from .._project_spec import EntryPoint, LaunchProject
32
+ from ..errors import LaunchError
33
+ from ..utils import (
34
+ LOG_PREFIX,
35
+ MAX_ENV_LENGTHS,
36
+ PROJECT_SYNCHRONOUS,
37
+ get_kube_context_and_api_client,
38
+ make_name_dns_safe,
39
+ )
40
+ from .abstract import AbstractRun, AbstractRunner
41
+
42
+ get_module(
43
+ "kubernetes_asyncio",
44
+ required="Kubernetes runner requires the kubernetes package. Please install it with `pip install wandb[launch]`.",
45
+ )
46
+
47
+ import kubernetes_asyncio # type: ignore # noqa: E402
48
+ from kubernetes_asyncio import client # noqa: E402
49
+ from kubernetes_asyncio.client.api.batch_v1_api import ( # type: ignore # noqa: E402
50
+ BatchV1Api,
51
+ )
52
+ from kubernetes_asyncio.client.api.core_v1_api import ( # type: ignore # noqa: E402
53
+ CoreV1Api,
54
+ )
55
+ from kubernetes_asyncio.client.api.custom_objects_api import ( # type: ignore # noqa: E402
56
+ CustomObjectsApi,
57
+ )
58
+ from kubernetes_asyncio.client.models.v1_secret import ( # type: ignore # noqa: E402
59
+ V1Secret,
60
+ )
61
+ from kubernetes_asyncio.client.rest import ApiException # type: ignore # noqa: E402
62
+
63
+ TIMEOUT = 5
64
+ API_KEY_SECRET_MAX_RETRIES = 5
65
+
66
+ _logger = logging.getLogger(__name__)
67
+
68
+
69
class KubernetesSubmittedRun(AbstractRun):
    """Wrapper for a launched run on Kubernetes.

    Tracks one Kubernetes Job by name and namespace, plus the optional secret
    that was created alongside it. The secret is removed once the job is
    observed in a terminal state or the run is cancelled.
    """

    def __init__(
        self,
        batch_api: "BatchV1Api",
        core_api: "CoreV1Api",
        name: str,
        namespace: Optional[str] = "default",
        secret: Optional["V1Secret"] = None,
    ) -> None:
        """Initialize a KubernetesSubmittedRun.

        This class does not query the Kubernetes API for job state itself:
        `get_status` asks `LaunchKubernetesMonitor` for the status recorded
        under the job name.

        Arguments:
            batch_api: Kubernetes BatchV1Api object, used to delete the job.
            core_api: Kubernetes CoreV1Api object, used for pods, logs and
                secret cleanup.
            name: Name of the job.
            namespace: Kubernetes namespace.
            secret: Kubernetes secret to clean up with the run, if any.

        Returns:
            None.
        """
        self.batch_api = batch_api
        self.core_api = core_api
        self.name = name
        self.namespace = namespace
        self._fail_count = 0
        self.secret = secret

    @property
    def id(self) -> str:
        """Return the run id."""
        return self.name

    async def get_logs(self) -> Optional[str]:
        """Return the logs of the first pod belonging to this job.

        Pods are looked up with the `job-name=<name>` label selector. Any
        failure is reported with `wandb.termerror` and swallowed, so log
        retrieval is best-effort.

        Returns:
            The pod logs as a string, or None if there are no pods, no logs,
            or the lookup failed.
        """
        try:
            pods = await self.core_api.list_namespaced_pod(
                label_selector=f"job-name={self.name}", namespace=self.namespace
            )
            pod_names = [pi.metadata.name for pi in pods.items]
            if not pod_names:
                wandb.termwarn(f"Found no pods for kubernetes job: {self.name}")
                return None
            # Only the first pod is read, even if the job has several.
            logs = await self.core_api.read_namespaced_pod_log(
                name=pod_names[0], namespace=self.namespace
            )
            if logs:
                return str(logs)
            else:
                wandb.termwarn(f"No logs for kubernetes pod(s): {pod_names}")
                return None
        except Exception as e:
            wandb.termerror(f"{LOG_PREFIX}Failed to get pod logs: {e}")
            return None

    async def wait(self) -> bool:
        """Wait for the run to finish.

        Polls `get_status` every 5 seconds until the state is "finished",
        "failed" or "preempted", then removes the secret.

        Returns:
            True if the run finished successfully, False otherwise.
        """
        while True:
            status = await self.get_status()
            wandb.termlog(f"{LOG_PREFIX}Job {self.name} status: {status.state}")
            if status.state in ["finished", "failed", "preempted"]:
                break
            await asyncio.sleep(5)

        await self._delete_secret()
        # TODO: not sure if this (copied from aws runner) is the right
        # approach? should we return false on failure
        return status.state == "finished"

    async def get_status(self) -> Status:
        """Return the monitor's status for this job, cleaning up when done.

        The secret is deleted as soon as a terminal state is observed.
        """
        status = LaunchKubernetesMonitor.get_status(self.name)
        # Compare the state string explicitly, as `wait` does, rather than
        # relying on Status comparing equal to plain strings.
        if status.state in ["stopped", "failed", "finished", "preempted"]:
            await self._delete_secret()
        return status

    async def cancel(self) -> None:
        """Cancel the run by deleting its job, then remove the secret.

        Raises:
            LaunchError: If the Kubernetes API rejects the deletion.
        """
        try:
            await self.batch_api.delete_namespaced_job(
                namespace=self.namespace,
                name=self.name,
            )
            await self._delete_secret()
        except ApiException as e:
            raise LaunchError(
                f"Failed to delete Kubernetes Job {self.name} in namespace {self.namespace}: {str(e)}"
            ) from e

    async def _delete_secret(self) -> None:
        """Delete the tracked secret once; later calls are no-ops."""
        # Cleanup secret if not running in a helm-managed context
        # (i.e. WANDB_RELEASE_NAME is unset).
        if not os.environ.get("WANDB_RELEASE_NAME") and self.secret:
            await self.core_api.delete_namespaced_secret(
                name=self.secret.metadata.name,
                namespace=self.secret.metadata.namespace,
            )
            # Forget the secret so repeated cleanup does not hit the API again.
            self.secret = None
178
+
179
+
180
class CrdSubmittedRun(AbstractRun):
    """Run submitted to a CRD backend, e.g. Volcano."""

    def __init__(
        self,
        group: str,
        version: str,
        plural: str,
        name: str,
        namespace: str,
        core_api: CoreV1Api,
        custom_api: CustomObjectsApi,
    ) -> None:
        """Record what is needed to track and delete a custom object.

        Arguments:
            group: The API group of the CRD.
            version: The API version of the CRD.
            plural: The plural name of the CRD.
            name: The name of the CRD instance.
            namespace: The namespace of the CRD instance.
            core_api: The Kubernetes core API client (pods and logs).
            custom_api: The Kubernetes custom object API client (deletion).
        """
        # Kubernetes API clients.
        self.core_api = core_api
        self.custom_api = custom_api
        # Coordinates of the custom object.
        self.group = group
        self.version = version
        self.plural = plural
        self.namespace = namespace
        self.name = name
        self._fail_count = 0

    @property
    def id(self) -> str:
        """Get the name of the custom object."""
        return self.name

    async def get_logs(self) -> Optional[str]:
        """Collect logs from every pod labelled with this run's id.

        Returns:
            One "Pod <name>:" section per pod joined by newlines, or None when
            no pods matched or the Kubernetes API raised an ApiException.
        """
        # TODO: test more carefully once we release multi-node support
        logs_by_pod: Dict[str, Optional[str]] = {}
        try:
            pod_list = await self.core_api.list_namespaced_pod(
                label_selector=f"wandb/run-id={self.name}", namespace=self.namespace
            )
            # Resolve all names before fetching any log.
            names = [pod.metadata.name for pod in pod_list.items]
            for current in names:
                logs_by_pod[current] = await self.core_api.read_namespaced_pod_log(
                    name=current, namespace=self.namespace
                )
        except ApiException as exc:
            wandb.termwarn(f"Failed to get logs for {self.name}: {str(exc)}")
            return None

        if len(logs_by_pod) == 0:
            return None
        sections = []
        for pod_name, text in logs_by_pod.items():
            sections.append(f"Pod {pod_name}:\n{text}")
        return "\n".join(sections)

    async def get_status(self) -> Status:
        """Get status of custom object."""
        current = LaunchKubernetesMonitor.get_status(self.name)
        return current

    async def cancel(self) -> None:
        """Cancel the custom object by deleting it.

        Raises:
            LaunchError: If the Kubernetes API rejects the deletion.
        """
        target = {
            "group": self.group,
            "version": self.version,
            "namespace": self.namespace,
            "plural": self.plural,
            "name": self.name,
        }
        try:
            await self.custom_api.delete_namespaced_custom_object(**target)
        except ApiException as exc:
            raise LaunchError(
                f"Failed to delete CRD {self.name} in namespace {self.namespace}: {str(exc)}"
            ) from exc

    async def wait(self) -> bool:
        """Wait for this custom object to finish running.

        Returns:
            True if the final state is "finished", False for "failed" or
            "preempted".
        """
        terminal_states = ["finished", "failed", "preempted"]
        status = await self.get_status()
        wandb.termlog(f"{LOG_PREFIX}Job {self.name} status: {status}")
        while status.state not in terminal_states:
            # Poll again after a short pause.
            await asyncio.sleep(5)
            status = await self.get_status()
            wandb.termlog(f"{LOG_PREFIX}Job {self.name} status: {status}")
        return status.state == "finished"
269
+
270
+
271
+ class KubernetesRunner(AbstractRunner):
272
+ """Launches runs onto kubernetes."""
273
+
274
def __init__(
    self,
    api: Api,
    backend_config: Dict[str, Any],
    environment: AbstractEnvironment,
    registry: AbstractRegistry,
) -> None:
    """Create a Kubernetes runner.

    Arguments:
        api: The API client object, forwarded to the base runner.
        backend_config: The backend configuration, forwarded to the base
            runner.
        environment: The environment to launch runs into.
        registry: The registry kept on the runner; it is passed along when
            an image pull secret may need to be created.
    """
    super().__init__(api, backend_config)
    self.environment, self.registry = environment, registry
294
+
295
def get_namespace(
    self, resource_args: Dict[str, Any], context: Dict[str, Any]
) -> str:
    """Pick the namespace a run should be launched into.

    Candidates are tried in order and the first truthy one wins:
    `metadata.namespace` in the resource args, a top-level `namespace` in
    the resource args, `runner.namespace` in the backend config, and
    finally the kube context's namespace (or "default").

    Arguments:
        resource_args: The resource args to launch.
        context: The k8s config context; may be empty or None.

    Returns:
        The namespace to launch into.
    """
    # Resolved up front so a malformed context fails regardless of which
    # candidate ends up being chosen.
    if context:
        fallback = context["context"].get("namespace", "default")
    else:
        fallback = "default"

    from_metadata = resource_args.get("metadata", {}).get("namespace")
    if from_metadata:
        return from_metadata  # type: ignore[no-any-return]

    # continue support for malformed namespace
    from_top_level = resource_args.get("namespace")
    if from_top_level:
        return from_top_level  # type: ignore[no-any-return]

    from_backend = self.backend_config.get("runner", {}).get("namespace")
    if from_backend:
        return from_backend  # type: ignore[no-any-return]

    return fallback  # type: ignore[no-any-return]
318
+
319
async def _inject_defaults(
    self,
    resource_args: Dict[str, Any],
    launch_project: LaunchProject,
    image_uri: str,
    namespace: str,
    core_api: "CoreV1Api",
) -> Tuple[Dict[str, Any], Optional["V1Secret"]]:
    """Apply our default values, return job dict and api key secret.

    Starting from `resource_args`, this fills in a `batch/v1` Job with:
    job spec defaults (`backoffLimit: 0`, `ttlSecondsAfterFinished: 60`),
    pod `restartPolicy: Never`, wandb labels on the job and its pods, a
    generated name when none is given, per-container names and a
    restrictive `securityContext` where missing, the image to run, the
    entrypoint/args overrides, and the wandb environment variables.

    Arguments:
        resource_args (Dict[str, Any]): The resource args to launch.
        launch_project (LaunchProject): The launch project.
        image_uri (str): The image to run; set on the first container when
            the project supplies a docker image or no container names one.
        namespace (str): The namespace secrets are created in.
        core_api (CoreV1Api): The core api.

    Returns:
        Tuple[Dict[str, Any], Optional["V1Secret"]]: The job spec and the
        api key secret (None if the API key was not moved into a secret).
    """

    def handle_exception(e: Exception) -> None:
        # Reported on each failed attempt of the secret creation below.
        wandb.termwarn(
            f"Exception when ensuring Kubernetes API key secret: {e}. Retrying..."
        )

    job: Dict[str, Any] = {
        "apiVersion": "batch/v1",
        "kind": "Job",
    }
    job.update(resource_args)

    job_metadata: Dict[str, Any] = job.get("metadata", {})
    job_spec: Dict[str, Any] = {"backoffLimit": 0, "ttlSecondsAfterFinished": 60}
    job_spec.update(job.get("spec", {}))
    pod_template: Dict[str, Any] = job_spec.get("template", {})
    pod_spec: Dict[str, Any] = {"restartPolicy": "Never"}
    pod_spec.update(pod_template.get("spec", {}))
    # Fall back to a single empty container when the spec has no usable
    # container list (missing, null or empty), since containers[0] is
    # required below.
    containers: List[Dict[str, Any]] = pod_spec.get("containers") or [{}]

    # Add labels to job metadata
    job_metadata.setdefault("labels", {})
    job_metadata["labels"][WANDB_K8S_RUN_ID] = launch_project.run_id
    job_metadata["labels"][WANDB_K8S_LABEL_MONITOR] = "true"
    if LaunchAgent.initialized():
        job_metadata["labels"][WANDB_K8S_LABEL_AGENT] = LaunchAgent.name()
    # name precedence: name in spec > generated name
    if not job_metadata.get("name"):
        job_metadata["generateName"] = make_name_dns_safe(
            f"launch-{launch_project.target_entity}-{launch_project.target_project}-"
        )

    for i, cont in enumerate(containers):
        if "name" not in cont:
            cont["name"] = f"launch{i}"
        if "securityContext" not in cont:
            cont["securityContext"] = {
                "allowPrivilegeEscalation": False,
                "capabilities": {"drop": ["ALL"]},
                "seccompProfile": {"type": "RuntimeDefault"},
            }

    entry_point = (
        launch_project.override_entrypoint or launch_project.get_job_entry_point()
    )
    if launch_project.docker_image:
        # dont specify run id if user provided image, could have multiple runs
        containers[0]["image"] = image_uri
        # TODO: handle secret pulling image from registry
    elif not any("image" in cont for cont in containers):
        assert entry_point is not None
        # in the non instance case we need to make an imagePullSecret
        # so the new job can pull the image
        containers[0]["image"] = image_uri
        secret = await maybe_create_imagepull_secret(
            core_api, self.registry, launch_project.run_id, namespace
        )
        if secret is not None:
            pod_spec["imagePullSecrets"] = [
                {"name": f"regcred-{launch_project.run_id}"}
            ]

    inject_entrypoint_and_args(
        containers,
        entry_point,
        launch_project.override_args,
        launch_project.override_entrypoint is not None,
    )

    env_vars = launch_project.get_env_vars_dict(
        self._api, MAX_ENV_LENGTHS[self.__class__.__name__]
    )
    api_key_secret = None
    for cont in containers:
        # Add our env vars to user supplied env vars
        env = cont.get("env") or []
        for key, value in env_vars.items():
            if (
                key == "WANDB_API_KEY"
                and value
                and (
                    LaunchAgent.initialized()
                    or self.backend_config[PROJECT_SYNCHRONOUS]
                )
            ):
                # Override API key with secret. TODO: Do the same for other runners
                release_name = os.environ.get("WANDB_RELEASE_NAME")
                secret_name = "wandb-api-key"
                # The secret is named per release when WANDB_RELEASE_NAME is
                # set, otherwise per run.
                if release_name:
                    secret_name += f"-{release_name}"
                else:
                    secret_name += f"-{launch_project.run_id}"

                api_key_secret = await retry_async(
                    backoff=ExponentialBackoff(
                        initial_sleep=datetime.timedelta(seconds=1),
                        max_sleep=datetime.timedelta(minutes=1),
                        max_retries=API_KEY_SECRET_MAX_RETRIES,
                    ),
                    fn=ensure_api_key_secret,
                    on_exc=handle_exception,
                    core_api=core_api,
                    secret_name=secret_name,
                    namespace=namespace,
                    api_key=value,
                )
                # Reference the secret instead of inlining the key value.
                env.append(
                    {
                        "name": key,
                        "valueFrom": {
                            "secretKeyRef": {
                                "name": secret_name,
                                "key": "password",
                            }
                        },
                    }
                )
            else:
                env.append({"name": key, "value": value})
        cont["env"] = env

    # Reassemble the nested spec from the pieces modified above.
    pod_spec["containers"] = containers
    pod_template["spec"] = pod_spec
    job_spec["template"] = pod_template
    job["spec"] = job_spec
    job["metadata"] = job_metadata

    add_label_to_pods(
        job,
        WANDB_K8S_LABEL_MONITOR,
        "true",
    )

    # Add wandb.ai/agent: current agent label on all pods
    if LaunchAgent.initialized():
        add_label_to_pods(
            job,
            WANDB_K8S_LABEL_AGENT,
            LaunchAgent.name(),
        )

    return job, api_key_secret
480
+
481
async def run(
    self, launch_project: LaunchProject, image_uri: str
) -> Optional[AbstractRun]:  # noqa: C901
    """Execute a launch project on Kubernetes.

    When the resource args name an ``apiVersion`` other than ``batch/v1`` or
    ``batch/v1beta1`` the run is submitted as a namespaced custom object;
    otherwise a Kubernetes job is built from the resource args and created.

    Arguments:
        launch_project: The launch project to execute.
        image_uri: The image URI used to fill macros in the resource args
            and passed on when building the job spec.

    Returns:
        The submitted run object (CRD-backed or job-backed).

    Raises:
        LaunchError: If the custom object or the job could not be created.
    """
    await LaunchKubernetesMonitor.ensure_initialized()
    resource_args = launch_project.fill_macros(image_uri).get("kubernetes", {})
    if not resource_args:
        wandb.termlog(
            f"{LOG_PREFIX}Note: no resource args specified. Add a "
            "Kubernetes yaml spec or other options in a json file "
            "with --resource-args <json>."
        )
    _logger.info(f"Running Kubernetes job with resource args: {resource_args}")

    context, api_client = await get_kube_context_and_api_client(
        kubernetes_asyncio, resource_args
    )

    # If the user specified an alternate api, we will execute this run by
    # creating a custom object.
    api_version = resource_args.get("apiVersion", "batch/v1")

    if api_version not in ["batch/v1", "batch/v1beta1"]:
        env_vars = launch_project.get_env_vars_dict(
            self._api, MAX_ENV_LENGTHS[self.__class__.__name__]
        )
        # Crawl the resource args and add our env vars to the containers.
        add_wandb_env(resource_args, env_vars)

        # Add our labels to the resource args. This is necessary for the
        # agent to find the custom object later on.
        resource_args["metadata"] = resource_args.get("metadata", {})
        resource_args["metadata"]["labels"] = resource_args["metadata"].get(
            "labels", {}
        )
        resource_args["metadata"]["labels"][WANDB_K8S_LABEL_MONITOR] = "true"

        # Crawl the resource args and add our labels to the pods. This is
        # necessary for the agent to find the pods later on.
        add_label_to_pods(
            resource_args,
            WANDB_K8S_LABEL_MONITOR,
            "true",
        )

        # Add wandb.ai/agent: current agent label on all pods. The agent
        # label key must be used here; writing the agent name under the
        # monitor key would overwrite the "true" value set just above.
        if LaunchAgent.initialized():
            add_label_to_pods(
                resource_args,
                WANDB_K8S_LABEL_AGENT,
                LaunchAgent.name(),
            )
            resource_args["metadata"]["labels"][WANDB_K8S_LABEL_AGENT] = (
                LaunchAgent.name()
            )

        overrides = {}
        if launch_project.override_args:
            overrides["args"] = launch_project.override_args
        if launch_project.override_entrypoint:
            overrides["command"] = launch_project.override_entrypoint.command
        add_entrypoint_args_overrides(
            resource_args,
            overrides,
        )
        api = client.CustomObjectsApi(api_client)
        # Infer the attributes of a custom object from the apiVersion and/or
        # a kind: attribute in the resource args.
        namespace = self.get_namespace(resource_args, context)
        group, version, *_ = api_version.split("/")
        group = resource_args.get("group", group)
        version = resource_args.get("version", version)
        kind = resource_args.get("kind", version)
        plural = f"{kind.lower()}s"
        custom_resource = CustomResource(
            group=group,
            version=version,
            plural=plural,
        )
        LaunchKubernetesMonitor.monitor_namespace(
            namespace, custom_resource=custom_resource
        )

        try:
            response = await api.create_namespaced_custom_object(
                group=group,
                version=version,
                namespace=namespace,
                plural=plural,
                body=resource_args,
            )
        except ApiException as e:
            body = json.loads(e.body)
            body_yaml = yaml.dump(body)
            raise LaunchError(
                f"Error creating CRD of kind {kind}: {e.status} {e.reason}\n{body_yaml}"
            ) from e
        name = response.get("metadata", {}).get("name")
        # Reuse the safely extracted name instead of re-indexing the response.
        _logger.info(f"Created {kind} {name}")
        submitted_run = CrdSubmittedRun(
            name=name,
            group=group,
            version=version,
            namespace=namespace,
            plural=plural,
            core_api=client.CoreV1Api(api_client),
            custom_api=api,
        )
        if self.backend_config[PROJECT_SYNCHRONOUS]:
            await submitted_run.wait()
        return submitted_run

    batch_api = kubernetes_asyncio.client.BatchV1Api(api_client)
    core_api = kubernetes_asyncio.client.CoreV1Api(api_client)
    namespace = self.get_namespace(resource_args, context)
    job, secret = await self._inject_defaults(
        resource_args, launch_project, image_uri, namespace, core_api
    )
    msg = "Creating Kubernetes job"
    if "name" in resource_args:
        msg += f": {resource_args['name']}"
    _logger.info(msg)
    try:
        response = await kubernetes_asyncio.utils.create_from_dict(
            api_client, job, namespace=namespace
        )
    except kubernetes_asyncio.utils.FailToCreateError as e:
        # Report the first underlying API error; it carries the server message.
        for exc in e.api_exceptions:
            resp = json.loads(exc.body)
            msg = resp.get("message")
            code = resp.get("code")
            raise LaunchError(
                f"Failed to create Kubernetes job for run {launch_project.run_id} ({code} {exc.reason}): {msg}"
            ) from e
        # No API exceptions attached: still fail explicitly rather than
        # falling through with `response` unbound.
        raise LaunchError(
            f"Failed to create Kubernetes job for run {launch_project.run_id}: {e}"
        ) from e
    except Exception as e:
        raise LaunchError(
            f"Unexpected exception when creating Kubernetes job: {str(e)}\n"
        ) from e
    job_response = response[0]
    job_name = job_response.metadata.name
    LaunchKubernetesMonitor.monitor_namespace(namespace)
    submitted_job = KubernetesSubmittedRun(
        batch_api, core_api, job_name, namespace, secret
    )
    if self.backend_config[PROJECT_SYNCHRONOUS]:
        await submitted_job.wait()

    return submitted_job
637
+
638
+
639
def inject_entrypoint_and_args(
    containers: List[dict],
    entry_point: Optional["EntryPoint"],
    override_args: List[str],
    should_override_entrypoint: bool,
) -> None:
    """Inject the entrypoint and args into the containers.

    Each container dict is modified in place. ``args`` is replaced whenever
    ``override_args`` is non-empty. ``command`` is set from
    ``entry_point.command`` when an entry point is given and either the
    container has no (truthy) ``command`` yet or
    ``should_override_entrypoint`` is true.

    Arguments:
        containers: The containers to inject the entrypoint and args into.
        entry_point: The entrypoint to inject.
        override_args: The args to inject.
        should_override_entrypoint: Whether to override the entrypoint.

    Returns:
        None
    """
    for container in containers:
        if override_args:
            container["args"] = override_args
        if entry_point and (
            not container.get("command") or should_override_entrypoint
        ):
            container["command"] = entry_point.command
663
+
664
+
665
async def ensure_api_key_secret(
    core_api: "CoreV1Api",
    secret_name: str,
    namespace: str,
    api_key: str,
) -> "V1Secret":
    """Create a secret containing a user's wandb API key.

    If a secret with the same name already exists and holds the same data it
    is returned as is. If its data differs and it carries the
    ``wandb.ai/created-by: launch-agent`` label, it is deleted and recreated.
    A differing secret without that label is treated as an error.

    Arguments:
        core_api: The Kubernetes CoreV1Api object.
        secret_name: The name to use for the secret.
        namespace: The namespace to create the secret in.
        api_key: The user's wandb API key

    Returns:
        The created (or already existing, matching) secret

    Raises:
        LaunchError: If the secret cannot be created, or a conflicting secret
            not owned by the launch agent already exists.
    """
    secret_data = {"password": base64.b64encode(api_key.encode()).decode()}
    labels = {"wandb.ai/created-by": "launch-agent"}
    secret = client.V1Secret(
        data=secret_data,
        metadata=client.V1ObjectMeta(
            name=secret_name, namespace=namespace, labels=labels
        ),
        kind="Secret",
        type="kubernetes.io/basic-auth",
    )

    try:
        try:
            return await core_api.create_namespaced_secret(namespace, secret)
        except ApiException as e:
            # Anything other than 409 (conflict = secret already exists) is
            # passed on to the outer handler.
            if e.status != 409:
                raise
            existing_secret = await core_api.read_namespaced_secret(
                name=secret_name, namespace=namespace
            )
            if existing_secret.data == secret_data:
                return existing_secret
            # A secret without labels reports `labels` as None; treat that
            # as "not created by the launch agent" instead of crashing.
            existing_labels = existing_secret.metadata.labels or {}
            if existing_labels.get("wandb.ai/created-by") != "launch-agent":
                raise LaunchError(
                    f"Kubernetes secret already exists in namespace {namespace} with incorrect data: {secret_name}"
                )
            # It's a previous secret made by launch agent, so clean it up.
            await core_api.delete_namespaced_secret(
                name=secret_name, namespace=namespace
            )
            return await core_api.create_namespaced_secret(namespace, secret)
    except Exception as e:
        raise LaunchError(
            f"Exception when ensuring Kubernetes API key secret: {str(e)}\n"
        ) from e
724
+
725
+
726
async def maybe_create_imagepull_secret(
    core_api: "CoreV1Api",
    registry: AbstractRegistry,
    run_id: str,
    namespace: str,
) -> Optional["V1Secret"]:
    """Create a secret for pulling images from a private registry.

    The secret is named ``regcred-<run_id>`` and holds a docker config JSON
    built from the registry's username and password. If a secret with that
    name already exists, the existing one is read and returned.

    Arguments:
        core_api: The Kubernetes CoreV1Api object.
        registry: The registry to pull from.
        run_id: The run id.
        namespace: The namespace to create the secret in.

    Returns:
        A secret if one was created (or already existed), otherwise None.

    Raises:
        LaunchError: If creating or reading the secret fails.
    """
    if isinstance(registry, (LocalRegistry, AzureContainerRegistry)):
        # Secret not required
        return None
    uname, token = await registry.get_username_password()
    secret_name = f"regcred-{run_id}"
    creds_info = {
        "auths": {
            registry.uri: {
                "auth": base64.b64encode(f"{uname}:{token}".encode()).decode(),
                # need an email but the use is deprecated
                "email": "deprecated@wandblaunch.com",
            }
        }
    }
    secret_data = {
        ".dockerconfigjson": base64.b64encode(json.dumps(creds_info).encode()).decode()
    }
    secret = client.V1Secret(
        data=secret_data,
        metadata=client.V1ObjectMeta(name=secret_name, namespace=namespace),
        kind="Secret",
        type="kubernetes.io/dockerconfigjson",
    )
    try:
        try:
            return await core_api.create_namespaced_secret(namespace, secret)
        except ApiException as e:
            # 409 = conflict = secret already exists
            if e.status == 409:
                return await core_api.read_namespaced_secret(
                    name=secret_name, namespace=namespace
                )
            raise
    except Exception as e:
        raise LaunchError(
            f"Exception when creating Kubernetes secret: {str(e)}\n"
        ) from e
780
+
781
+
782
def yield_containers(root: Any) -> Iterator[dict]:
    """Yield all container specs in a manifest.

    Walks nested dicts and lists depth-first. Whenever a dict key named
    "containers" is found, the elements of its value are yielded if that
    value is a list; the value is not searched any further either way.
    """
    if isinstance(root, list):
        for element in root:
            yield from yield_containers(element)
        return
    if not isinstance(root, dict):
        return
    for key, child in root.items():
        if key == "containers":
            # A "containers" entry ends the descent on this branch, whether
            # or not it turned out to be a list.
            if isinstance(child, list):
                yield from child
            continue
        if isinstance(child, (dict, list)):
            yield from yield_containers(child)
798
+
799
+
800
def add_wandb_env(root: Union[dict, list], env_vars: Dict[str, str]) -> None:
    """Injects wandb environment variables into specs.

    Recursively walks the spec and injects the environment variables into
    every container spec. Containers are identified by the "containers" key.

    Each variable is appended to the container's "env" list as a
    ``{"name": ..., "value": ...}`` entry; entries already present in the
    spec are left in place and not de-duplicated.

    WANDB_RUN_ID is treated specially: if it is provided in env_vars, it is
    only set in the first container modified by this function.

    Arguments:
        root: The spec to modify.
        env_vars: The environment variables to inject. This mapping is not
            modified.

    Returns: None.
    """
    # Work on a private copy so dropping WANDB_RUN_ID after the first
    # container does not leak back into the caller's dict.
    pending = dict(env_vars)
    for cont in yield_containers(root):
        # `env` may be missing or explicitly null in the spec.
        env = cont.get("env") or []
        env.extend({"name": key, "value": value} for key, value in pending.items())
        cont["env"] = env
        # After we have set WANDB_RUN_ID once, we don't want to set it again
        pending.pop("WANDB_RUN_ID", None)
824
+
825
+
826
def yield_pods(manifest: Any) -> Iterator[dict]:
    """Yield all pod specs in a manifest.

    Recursively traverses the manifest and yields all pod specs. Pod specs are
    identified by the presence of a "spec" key whose value is a dict with a
    "containers" key. The dict holding that "spec" key is what gets yielded,
    and traversal continues into its values afterwards.
    """
    if isinstance(manifest, list):
        for item in manifest:
            yield from yield_pods(item)
    elif isinstance(manifest, dict):
        spec = manifest.get("spec")
        # Only a mapping can be a pod spec; a null, numeric or string "spec"
        # must not raise or be matched by substring.
        if isinstance(spec, dict) and "containers" in spec:
            yield manifest
        for value in manifest.values():
            if isinstance(value, (dict, list)):
                yield from yield_pods(value)
842
+
843
+
844
def add_label_to_pods(
    manifest: Union[dict, list], label_key: str, label_value: str
) -> None:
    """Set a label on every pod spec found in a manifest.

    Pod specs are whatever ``yield_pods`` produces for the manifest. For each
    one, the "metadata" and "labels" dicts are created if absent and the
    label is written, replacing any previous value under the same key.

    Arguments:
        manifest: The manifest to modify.
        label_key: The label key to add.
        label_value: The label value to add.

    Returns: None.
    """
    for pod_manifest in yield_pods(manifest):
        if "metadata" not in pod_manifest:
            pod_manifest["metadata"] = {}
        pod_meta = pod_manifest["metadata"]
        if "labels" not in pod_meta:
            pod_meta["labels"] = {}
        pod_meta["labels"][label_key] = label_value
864
+
865
+
866
def add_entrypoint_args_overrides(manifest: Union[dict, list], overrides: dict) -> None:
    """Add entrypoint and args overrides to all containers in a manifest.

    Recursively traverses the manifest and applies the overrides to all
    containers. Containers are identified by the presence of a "spec" key
    whose value is a dict with a "containers" list. The manifest is modified
    in place.

    Arguments:
        manifest: The manifest to modify.
        overrides: Dictionary with optional "command" and "args" keys. Only
            the keys that are present are written to the containers.

    Returns: None.
    """
    if isinstance(manifest, list):
        for item in manifest:
            add_entrypoint_args_overrides(item, overrides)
    elif isinstance(manifest, dict):
        spec = manifest.get("spec")
        # Guard the types so a null/scalar "spec" or "containers" value is
        # skipped rather than raising or being matched by substring.
        containers = spec.get("containers") if isinstance(spec, dict) else None
        if isinstance(containers, list):
            for container in containers:
                if not isinstance(container, dict):
                    continue
                if "command" in overrides:
                    container["command"] = overrides["command"]
                if "args" in overrides:
                    container["args"] = overrides["args"]
        # Non-container values fall through both isinstance checks above.
        for value in manifest.values():
            add_entrypoint_args_overrides(value, overrides)