idc-index-data 22.1.5__tar.gz → 23.0.1__tar.gz

This diff compares the contents of two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.
Files changed (38)
  1. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/PKG-INFO +1 -1
  2. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/assets/clinical_index.sql +1 -1
  3. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/assets/sm_index.sql +4 -2
  4. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/assets/sm_instance_index.sql +2 -2
  5. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/pyproject.toml +1 -1
  6. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/scripts/python/idc_index_data_manager.py +1 -1
  7. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/scripts/sql/analysis_results_index.sql +1 -1
  8. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/scripts/sql/collections_index.sql +1 -1
  9. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/scripts/sql/idc_index.sql +7 -3
  10. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/scripts/sql/prior_versions_index.sql +1 -1
  11. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/tests/test_package.py +1 -1
  12. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/.git_archival.txt +0 -0
  13. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/.gitattributes +0 -0
  14. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/.github/CONTRIBUTING.md +0 -0
  15. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/.github/copilot-instructions.md +0 -0
  16. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/.github/dependabot.yml +0 -0
  17. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/.github/matchers/pylint.json +0 -0
  18. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/.github/workflows/cd.yml +0 -0
  19. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/.github/workflows/ci.yml +0 -0
  20. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/.github/workflows/external-indices.yml +0 -0
  21. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/.gitignore +0 -0
  22. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/.pre-commit-config.yaml +0 -0
  23. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/.readthedocs.yaml +0 -0
  24. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/CMakeLists.txt +0 -0
  25. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/LICENSE +0 -0
  26. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/README.md +0 -0
  27. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/assets/README.md +0 -0
  28. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/docs/conf.py +0 -0
  29. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/docs/index.md +0 -0
  30. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/noxfile.py +0 -0
  31. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/pytest.ini +0 -0
  32. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/scripts/python/generate-indices.py +0 -0
  33. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/scripts/python/update_idc_index_version.py +0 -0
  34. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/src/idc_index_data/__init__.py +0 -0
  35. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/src/idc_index_data/_version.pyi +0 -0
  36. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/src/idc_index_data/py.typed +0 -0
  37. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/tests/test_column_description_parser.py +0 -0
  38. {idc_index_data-22.1.5 → idc_index_data-23.0.1}/tests/test_real_sql_parsing.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: idc-index-data
3
- Version: 22.1.5
3
+ Version: 23.0.1
4
4
  Summary: ImagingDataCommons index to query and download data.
5
5
  Author-Email: Andrey Fedorov <andrey.fedorov@gmail.com>, Vamsi Thiriveedhi <vthiriveedhi@mgh.harvard.edu>, Jean-Christophe Fillion-Robin <jchris.fillionr@kitware.com>
6
6
  License: Copyright 2024 Andrey Fedorov
@@ -25,6 +25,6 @@ SELECT
25
25
  # values encountered in the column
26
26
  `values`
27
27
  FROM
28
- `bigquery-public-data.idc_v22_clinical.column_metadata`
28
+ `bigquery-public-data.idc_v23_clinical.column_metadata`
29
29
  ORDER BY
30
30
  collection_id, table_name
@@ -37,7 +37,7 @@ WITH
37
37
 
38
38
 
39
39
  FROM
40
- `bigquery-public-data.idc_v22.dicom_all` AS dicom_all
40
+ `bigquery-public-data.idc_v23.dicom_all` AS dicom_all
41
41
  GROUP BY
42
42
  SeriesInstanceUID
43
43
  ),
@@ -51,7 +51,7 @@ SpecimenPreparationSequence_unnested AS (
51
51
  concept_code_sequence.CodeMeaning AS ccs_cm,
52
52
  concept_code_sequence.CodingSchemeDesignator AS ccs_csd,
53
53
  concept_code_sequence.CodeValue AS ccs_val,
54
- FROM `bigquery-public-data.idc_v22.dicom_all`,
54
+ FROM `bigquery-public-data.idc_v23.dicom_all`,
55
55
  UNNEST(SpecimenDescriptionSequence[SAFE_OFFSET(0)].SpecimenPreparationSequence) as preparation_unnest_step1,
56
56
  UNNEST(preparation_unnest_step1.SpecimenPreparationStepContentItemSequence) as preparation_unnest_step2,
57
57
  UNNEST(preparation_unnest_step2.ConceptNameCodeSequence) as concept_name_code_sequence,
@@ -86,6 +86,8 @@ SpecimenPreparationSequence_unnested AS (
86
86
  )
87
87
 
88
88
  SELECT
89
+ # description:
90
+ # DICOM SeriesInstanceUID identifier of the series
89
91
  temp_table.SeriesInstanceUID,
90
92
  -- Embedding Medium
91
93
  # description:
@@ -16,7 +16,7 @@ WITH
16
16
  concept_code_sequence.CodingSchemeDesignator AS ccs_csd,
17
17
  concept_code_sequence.CodeValue AS ccs_val,
18
18
  FROM
19
- `bigquery-public-data.idc_v22.dicom_all`,
19
+ `bigquery-public-data.idc_v23.dicom_all`,
20
20
  UNNEST(SpecimenDescriptionSequence[SAFE_OFFSET(0)].SpecimenPreparationSequence) AS preparation_unnest_step1,
21
21
  UNNEST(preparation_unnest_step1.SpecimenPreparationStepContentItemSequence) AS preparation_unnest_step2,
22
22
  UNNEST(preparation_unnest_step2.ConceptNameCodeSequence) AS concept_name_code_sequence,
@@ -144,7 +144,7 @@ SELECT
144
144
  # unique identifier of the instance within the IDC
145
145
  dicom_all.crdc_instance_uuid AS crdc_instance_uuid
146
146
  FROM
147
- `bigquery-public-data.idc_v22.dicom_all` AS dicom_all
147
+ `bigquery-public-data.idc_v23.dicom_all` AS dicom_all
148
148
  LEFT JOIN
149
149
  slide_embedding
150
150
  ON
@@ -13,7 +13,7 @@ build-backend = "scikit_build_core.build"
13
13
 
14
14
  [project]
15
15
  name = "idc-index-data"
16
- version = "22.1.5"
16
+ version = "23.0.1"
17
17
  authors = [
18
18
  { name = "Andrey Fedorov", email = "andrey.fedorov@gmail.com" },
19
19
  { name = "Vamsi Thiriveedhi", email = "vthiriveedhi@mgh.harvard.edu" },
@@ -423,7 +423,7 @@ class IDCIndexDataManager:
423
423
  SELECT
424
424
  MAX(idc_version) AS latest_idc_release_version
425
425
  FROM
426
- `bigquery-public-data.idc_current.version_metadata`
426
+ `bigquery-public-data.idc_v23.version_metadata`
427
427
  """
428
428
  query_job = self.client.query(query)
429
429
  result = query_job.result()
@@ -43,4 +43,4 @@ SELECT
43
43
  # citation for the analysis results collection that should be used for acknowledgment
44
44
  Citation
45
45
  FROM
46
- `bigquery-public-data.idc_v22.analysis_results_metadata`
46
+ `bigquery-public-data.idc_v23.analysis_results_metadata`
@@ -40,4 +40,4 @@ SELECT
40
40
  # detailed information about the collection
41
41
  Description
42
42
  FROM
43
- `bigquery-public-data.idc_v22.original_collections_metadata`
43
+ `bigquery-public-data.idc_v23.original_collections_metadata`
@@ -1,3 +1,7 @@
1
+ # table-description:
2
+ # This is the main metadata table provided by idc-index. Each row corresponds to a DICOM series, and contains
3
+ # attributes at the collection, patient, study, and series levels. The table also contains download-related
4
+ # attributes, such as the AWS S3 bucket and URL to download the series.
1
5
  SELECT
2
6
  # collection level attributes
3
7
  # description:
@@ -22,7 +26,7 @@ SELECT
22
26
  # series; follow this DOI to learn more about the activity that produced
23
27
  # this series
24
28
  ANY_VALUE(source_DOI) AS source_DOI,
25
- # patient level attributes
29
+ # patient level attributes:
26
30
  # description:
27
31
  # age of the subject at the time of imaging (DICOM attribute)
28
32
  ANY_VALUE(PatientAge) AS PatientAge,
@@ -79,9 +83,9 @@ SELECT
79
83
  # total size of the series in megabytes
80
84
  ROUND(SUM(SAFE_CAST(instance_size AS float64))/1000000, 2) AS series_size_MB,
81
85
  FROM
82
- `bigquery-public-data.idc_v22.dicom_all` AS dicom_all
86
+ `bigquery-public-data.idc_v23.dicom_all` AS dicom_all
83
87
  JOIN
84
- `bigquery-public-data.idc_v22.dicom_metadata_curated` AS dicom_curated
88
+ `bigquery-public-data.idc_v23.dicom_metadata_curated` AS dicom_curated
85
89
  ON
86
90
  dicom_all.SOPInstanceUID = dicom_curated.SOPInstanceUID
87
91
  GROUP BY
@@ -3,7 +3,7 @@
3
3
  --
4
4
  -- Step 1: Declare variables
5
5
  DECLARE idc_versions ARRAY<INT64>;
6
- DECLARE latest_idc_version INT64 DEFAULT 22;
6
+ DECLARE latest_idc_version INT64 DEFAULT 23;
7
7
  DECLARE union_all_query STRING;
8
8
 
9
9
  --Step 2
@@ -7,7 +7,7 @@ from packaging.version import Version
7
7
 
8
8
  import idc_index_data as m
9
9
 
10
- EXPECTED_IDC_INDEX_VERSION = 22
10
+ EXPECTED_IDC_INDEX_VERSION = 23
11
11
 
12
12
 
13
13
  def test_version():
File without changes