commonmeta-ruby 3.3.16 → 3.3.17

Sign up to get free protection for your applications and to get access to all the features.
Files changed (30) hide show
  1. checksums.yaml +4 -4
  2. data/Gemfile.lock +1 -1
  3. data/lib/commonmeta/readers/json_feed_reader.rb +5 -6
  4. data/lib/commonmeta/utils.rb +14 -0
  5. data/lib/commonmeta/version.rb +1 -1
  6. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/get_json_feed_item_metadata/blog_post_with_non-url_id.yml +18 -88
  7. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/get_json_feed_item_metadata/blogger_post.yml +11 -50
  8. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/get_json_feed_item_metadata/ghost_post_with_author_name_suffix.yml +64 -173
  9. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/get_json_feed_item_metadata/ghost_post_with_doi.yml +13 -75
  10. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/get_json_feed_item_metadata/ghost_post_with_institutional_author.yml +15 -11
  11. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/get_json_feed_item_metadata/ghost_post_with_organizational_author.yml +15 -46
  12. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/get_json_feed_item_metadata/ghost_post_without_doi.yml +17 -155
  13. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/get_json_feed_item_metadata/jekyll_post.yml +14 -45
  14. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/get_json_feed_item_metadata/jekyll_post_with_anonymous_author.yml +13 -16
  15. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/get_json_feed_item_metadata/substack_post_with_broken_reference.yml +938 -1865
  16. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/get_json_feed_item_metadata/syldavia_gazette_post_with_references.yml +128 -267
  17. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/get_json_feed_item_metadata/upstream_post_with_references.yml +570 -1279
  18. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/get_json_feed_item_metadata/wordpress_post.yml +12 -119
  19. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/get_json_feed_item_metadata/wordpress_post_with_many_references.yml +4095 -5759
  20. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/get_json_feed_item_metadata/wordpress_post_with_references.yml +24 -220
  21. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/get_json_feed_item_metadata/wordpress_post_with_tracking_code_on_url.yml +13 -12
  22. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/write_metadata_as_crossref/json_feed_item_from_rogue_scholar_with_anonymous_author.yml +13 -16
  23. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/write_metadata_as_crossref/json_feed_item_from_rogue_scholar_with_doi.yml +12 -119
  24. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/write_metadata_as_crossref/json_feed_item_from_rogue_scholar_with_organizational_author.yml +15 -46
  25. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/write_metadata_as_crossref/json_feed_item_from_upstream_blog.yml +13 -201
  26. data/spec/fixtures/vcr_cassettes/Commonmeta_Metadata/write_metadata_as_crossref/json_feed_item_with_references.yml +104 -813
  27. data/spec/readers/json_feed_reader_spec.rb +19 -21
  28. data/spec/utils_spec.rb +40 -0
  29. data/spec/writers/crossref_xml_writer_spec.rb +4 -4
  30. metadata +2 -2
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 1959fba18a127e97c92b94c7e0e78d42c4538e3bccf6b9e6019035931e19d2f4
4
- data.tar.gz: 190a4ddc0e6789c56f6f9a5a97355c8684e103abf121d2dfefdd5c1d816bd2d2
3
+ metadata.gz: 3d9089eaa55c76c89411f0b252418860d40c498b77ad5e07ff6937d26364fff4
4
+ data.tar.gz: b251346f6fd8fe1714632587ee46196b00c3c4bb8c4ba7bf0fe6decd54c5a9e3
5
5
  SHA512:
6
- metadata.gz: d5994587ca3efda69c8f1e4efca204a89db31d9e4b48a4b683e0312e32209c720f3a24506026152dd69d6ee49895919d72ee4d3aea6557da2b972a1fdb94092a
7
- data.tar.gz: 56b4e03114cff5155c502f08f953afb3f2ba13c82bdefecfed73b752131b6b718cd21460eaa8d6506b7b50ded9655330e7c040c833a81c5feeb105c489306ab9
6
+ metadata.gz: 87733ee7cf23b71317df6c8ef7ad2eea099db43a6291a948f93b18220aeff5f3cf72e8ec9a9b0e36b3f243fe7b651d1b7d401341d0cf0524d0a6c3ea0db1bc7f
7
+ data.tar.gz: 131dbb14b63cca5c62acce085746f0dc13ef99252bd9243a84c0565a5e671e45c613cc12903df297e4c9df8bd0f5a6d69b645d18e622dd895c0d120e0d7b7f46
data/Gemfile.lock CHANGED
@@ -1,7 +1,7 @@
1
1
  PATH
2
2
  remote: .
3
3
  specs:
4
- commonmeta-ruby (3.3.16)
4
+ commonmeta-ruby (3.3.17)
5
5
  activesupport (>= 4.2.5, < 8.0)
6
6
  addressable (~> 2.8.1, < 2.8.2)
7
7
  base32-url (>= 0.7.0, < 1)
@@ -21,7 +21,7 @@ module Commonmeta
21
21
  meta = string.present? ? JSON.parse(string) : {}
22
22
 
23
23
  url = normalize_url(meta.fetch("url", nil))
24
- id = options[:doi] ? normalize_doi(options[:doi]) : normalize_id(meta.fetch("id", nil))
24
+ id = options[:doi] ? normalize_doi(options[:doi]) : normalize_id(meta.fetch("doi", nil))
25
25
  id = url if id.blank? && url.present?
26
26
 
27
27
  type = "Article"
@@ -34,8 +34,8 @@ module Commonmeta
34
34
  publisher = { "name" => meta.dig("blog", "title") }
35
35
 
36
36
  date = {}
37
- date["published"] = get_iso8601_date(meta.dig("date_published")) if meta.dig("date_published").present?
38
- date["updated"] = get_iso8601_date(meta.dig("date_modified")) if meta.dig("date_modified").present?
37
+ date["published"] = get_date_from_unix_timestamp(meta.dig("published_at")) if meta.dig("published_at").present?
38
+ date["updated"] = get_date_from_unix_timestamp(meta.dig("updated_at")) if meta.dig("updated_at").present?
39
39
 
40
40
  license = if meta.dig("blog", "license").present?
41
41
  hsh_to_spdx("rightsURI" => meta.dig("blog", "license"))
@@ -62,7 +62,7 @@ module Commonmeta
62
62
  sum
63
63
  end
64
64
  references = get_references(meta)
65
- alternate_identifiers = [{ "alternateIdentifier" => meta["uuid"], "alternateIdentifierType" => "UUID" }]
65
+ alternate_identifiers = [{ "alternateIdentifier" => meta["id"], "alternateIdentifierType" => "UUID" }]
66
66
 
67
67
  { "id" => id,
68
68
  "type" => type,
@@ -83,7 +83,7 @@ module Commonmeta
83
83
 
84
84
  def get_references(meta)
85
85
  # check that references resolve
86
- Array.wrap(meta["references"]).reduce([]) do |sum, reference|
86
+ Array.wrap(meta["reference"]).reduce([]) do |sum, reference|
87
87
  begin
88
88
  if reference["doi"] && validate_doi(reference["doi"])
89
89
  response = HTTP.follow
@@ -122,7 +122,6 @@ module Commonmeta
122
122
  return { "string" => nil, "state" => "not_found" } unless response.status.success?
123
123
 
124
124
  posts = JSON.parse(response.body.to_s)
125
- puts posts.inspect
126
125
  posts.map { |post| post["id"] }.first
127
126
  end
128
127
 
@@ -1094,6 +1094,20 @@ module Commonmeta
1094
1094
  nil
1095
1095
  end
1096
1096
 
1097
+ # parsing of unix timestamps such as 1427846400
1098
+ def get_datetime_from_unix_timestamp(unix_timestamp)
1099
+ strip_milliseconds(DateTime.strptime(unix_timestamp.to_s, '%s').iso8601)
1100
+ rescue StandardError
1101
+ nil
1102
+ end
1103
+
1104
+ # parsing of unix timestamps such as 1427846400
1105
+ def get_date_from_unix_timestamp(unix_timestamp)
1106
+ DateTime.strptime(unix_timestamp.to_s, '%s').strftime('%Y-%m-%d')
1107
+ rescue StandardError
1108
+ nil
1109
+ end
1110
+
1097
1111
  # strip milliseconds if there is a time, as it interferes with edtc parsing
1098
1112
  # keep dates unchanged
1099
1113
  def strip_milliseconds(iso8601_time)
@@ -1,5 +1,5 @@
1
1
  # frozen_string_literal: true
2
2
 
3
3
  module Commonmeta
4
- VERSION = '3.3.16'
4
+ VERSION = '3.3.17'
5
5
  end
@@ -23,28 +23,28 @@ http_interactions:
23
23
  Cache-Control:
24
24
  - public, max-age=0, must-revalidate
25
25
  Content-Length:
26
- - '8562'
26
+ - '2106'
27
27
  Content-Type:
28
28
  - application/json; charset=utf-8
29
29
  Date:
30
- - Sun, 18 Jun 2023 15:23:52 GMT
30
+ - Mon, 10 Jul 2023 21:04:54 GMT
31
31
  Etag:
32
- - '"12ofvtx6pm66lo"'
32
+ - '"13pz9o7pqcg1mi"'
33
33
  Server:
34
34
  - Vercel
35
35
  Strict-Transport-Security:
36
36
  - max-age=63072000
37
37
  X-Matched-Path:
38
- - "/api/posts/[slug]"
38
+ - "/api/posts/[[...params]]"
39
39
  X-Vercel-Cache:
40
40
  - MISS
41
41
  X-Vercel-Id:
42
- - fra1::iad1::v8bjb-1687101832274-be4cfdb8ff78
42
+ - fra1::iad1::jbp2f-1689023094094-f2a6094c04f1
43
43
  Connection:
44
44
  - close
45
45
  body:
46
46
  encoding: UTF-8
47
- string: '{"id":"https://doi.org/10.59350/63055-a8604","uuid":"1898d2d7-4d87-4487-96c4-3073cf99e9a5","url":"http://sfmatheson.blogspot.com/2023/01/quintessence-of-dust-2023-restart-why.html","title":"Quintessence
47
+ string: '{"id":"1898d2d7-4d87-4487-96c4-3073cf99e9a5","doi":"https://doi.org/10.59350/63055-a8604","url":"http://sfmatheson.blogspot.com/2023/01/quintessence-of-dust-2023-restart-why.html","title":"Quintessence
48
48
  of Dust 2023 restart: the why","summary":"It''s early January 2023, a little
49
49
  before sunset in Tucson. Live image below, showing the glorious Santa Catalina
50
50
  mountains (the snow on the upper reaches is more apparent earlier in the day)
@@ -52,85 +52,15 @@ http_interactions:
52
52
  to start writing here at Quintessence of Dust, after another long hiatus.
53
53
  Here are some of my reasons.1. I like to write, and I have things to say,
54
54
  and I self-identify as an author. For eight years, I have co-organized and
55
- taught in...","date_published":"2023-01-09T03:03:00Z","date_modified":"2023-04-02T21:17:07Z","date_indexed":"2023-06-18T13:32:03.284651+00:00","authors":[{"url":null,"name":"Stephen
56
- Matheson"}],"image":null,"content_html":"It''s early January 2023, a little
57
- before sunset in Tucson. Live image below, showing the glorious Santa Catalina
58
- mountains (the snow on the upper reaches is more apparent earlier in the day)
59
- and my dinner preparations (shrimp and veggies on the grill).<div class=\"separator\"
60
- style=\"clear: both; text-align: center;\"><a href=\"https://blogger.googleusercontent.com/img/b/R29vZ2xl/AVvXsEghgBx9BU21qMDFnLxgHmnsl6TQVfb3QCwOXrC1zcXq7WH9gN8E0TcH3pTslRBG6O8mb5gcuF9JVtDlJ2je6dFcfyzKE4OD38-ftr66nBxddo892_NkyuevrrX65ndSbwmXMaLh3F5yiqU1QIj8JtA8FLkKOcHOEVwVafz0rzh7PejbFzp3XT25nQxc/s4032/Jan%207.jpg\"
61
- style=\"clear: right; float: right; margin-bottom: 1em; margin-left: 1em;\"><img
62
- border=\"0\" data-original-height=\"4032\" data-original-width=\"3024\" height=\"320\"
63
- src=\"https://blogger.googleusercontent.com/img/b/R29vZ2xl/AVvXsEghgBx9BU21qMDFnLxgHmnsl6TQVfb3QCwOXrC1zcXq7WH9gN8E0TcH3pTslRBG6O8mb5gcuF9JVtDlJ2je6dFcfyzKE4OD38-ftr66nBxddo892_NkyuevrrX65ndSbwmXMaLh3F5yiqU1QIj8JtA8FLkKOcHOEVwVafz0rzh7PejbFzp3XT25nQxc/s320/Jan%207.jpg\"
64
- width=\"240\" /></a></div><br /><div><div>I''ve decided to start writing here
65
- at <i>Quintessence of Dust</i>, after another long hiatus. Here are some of
66
- my reasons.</div><div><br /></div><div>1. I like to write, and I have things
67
- to say, and I self-identify as an author. For eight years, I have co-organized
68
- and taught in the <a href=\"https://meetings.cshl.edu/courses.aspx?course=C-WRITE&amp;year=23\"
69
- target=\"_blank\">Scientific Writing Retreat at Cold Spring Harbor Laboratory</a>.
70
- I''m a writer and I need to write, if only for myself.</div><div><br /></div><div>2.
71
- I have an idea for a book, along with some introductory work (but no sample
72
- chapters yet) and writing here will help me develop those thoughts. The idea
73
- is over twelve years old and has never faded away, which I take to mean that
74
- I need to get it out of my system somehow.</div><div><br /></div><div>3. I
75
- have other ideas kicking around in my head and most of them are worth writing
76
- about. I have one new intellectual passion that is totally worth writing about:
77
- <a href=\"https://skyislandalliance.org/the-sky-islands/\" target=\"_blank\">the
78
- Sky Islands</a>&nbsp;that nearly surround us here in Tucson.</div><div><br
79
- /></div><div>4. I have an exciting new job with great new people at <a href=\"https://plos.org/\"
80
- target=\"_blank\">an organization</a> that''s all in for <a href=\"https://plos.org/open-science/\"
81
- target=\"_blank\">open science</a>. I recently turned over the tens digit
82
- on my age-o-meter. My kids will very soon be all out of college. (One is about
83
- to start a postdoc!) All of this led, predictably, to a spasm of reflection
84
- on projects and vision. One clear result is that I''m feeling more inspired.<span><a
85
- name=''more''></a></span></div><div><br /></div><div>5. The demise of Twitter
86
- has led to a lot of <a href=\"https://www.theatlantic.com/technology/archive/2022/11/twitter-facebook-social-media-decline/672074/\"
87
- target=\"_blank\">useful commentary</a> about the nature of social media.
88
- I left Facebook two years ago and all but left Twitter two months ago. I''m
89
- on a&nbsp;<a href=\"https://fediscience.org/explore\" target=\"_blank\">good
90
- server at Mastodon</a>&nbsp;and I like it; maybe microblogging there can satisfy
91
- my desire for conversation and connection. But <a href=\"https://www.theverge.com/23513418/bring-back-personal-blogging\"
92
- target=\"_blank\">this recent piece</a> at <i>The Verge</i> by <a href=\"https://moniquejudge.com/\"
93
- target=\"_blank\">Monique Judge</a> convinced me that blogging could (again)
94
- have a place in the future.</div><div><br /><div>Here''s her summary, emphasis
95
- mine:</div><div><blockquote>At the end of the day, we don’t know what is going
96
- to happen next with Twitter or any of these platforms. We don’t know what
97
- changes <a href=\"https://www.techtarget.com/whatis/definition/Web-30\" target=\"_blank\">Web
98
- 3.0</a> is going to bring to the internet. We do know that <b>we will all
99
- still be here, wanting to share our thoughts, talk about anything and everything,
100
- and commune with our people</b>. Personal blogging is the simplest and fastest
101
- way to do all of that.&nbsp;</blockquote></div><div>That''s what I want! A
102
- place to write, and (if I''m lucky) a place to discuss and \"commune\" with
103
- people. That used to happen a lot at <i>Quintessence of Dust</i>.<span></span></div></div></div><div><br
104
- /></div><div>Okay, but why here? This blog is over 15 years old and was started
105
- when I was a Christian believer. <a href=\"https://sfmatheson.blogspot.com/2007/08/kicking-off-my-blog.html\"
106
- target=\"_blank\">Its founding themes</a> were anchored in a desire to help
107
- Christians understand and enjoy biology, to help them shake free of misinformation
108
- and dishonesty. It has twice languished through long hiatuses and was <a href=\"https://sfmatheson.blogspot.com/p/about.html\"
109
- target=\"_blank\">remodeled</a> back in 2017 a few years after I deconverted.
110
- Maybe it''s time to start anew? I think not, for many of those same reasons:
111
- I''m still a biologist who loves science, still worried about misinformation,
112
- and still rooted in the power of scientific explanation. I''m still a bardolator
113
- and a Red Sox fan. <a href=\"https://sfmatheson.blogspot.com/p/about.html\">I''m
114
- still me</a>, and <i>Quintessence of Dust</i> is still my blog. The new <a
115
- href=\"https://sfmatheson.blogspot.com/p/about.html\" target=\"_blank\">About
116
- page</a> is slightly remodeled from 2017, and hints at the next post, which
117
- will outline some new goals and ongoing projects.</div><div><br /></div><div>A
118
- final note on inspiration, from Imani Perry, writing in her newsletter (<a
119
- href=\"https://newsletters.theatlantic.com/unsettled-territory/\" target=\"_blank\">Unsettled
120
- Territory</a>) at <i>The Atlantic</i>. The piece is \"<a href=\"https://newsletters.theatlantic.com/unsettled-territory/63af3facace609003751bacc/becoming-writer-habit-journalism/\"
121
- target=\"_blank\">Writing is a Democratic Art</a>.\" It''s for subscribers
122
- only but here is her challenge:</div><div><blockquote>Thinking and writing
123
- at a faster pace stretched me and gave me greater confidence. Sometimes I
124
- changed my mind about what I’d written a day later. But that was okay; a newsletter
125
- is a moment in time. Writing it each week gave me a lovely rhythm in what
126
- has otherwise been a difficult and disorienting season in history. Feeling
127
- stuck can get you stuck. But writing can, and should, inspire deeds.</blockquote></div>","tags":["Introduction"],"language":"en","references":[],"blog_id":"5764g49","blog":{"id":"5764g49","title":"Quintessence
128
- of Dust","description":"<i>Quintessence of Dust</i> explores science, society,
129
- and human nature, focusing on genetics, development, evolution, neuroscience,
130
- systems biology, and topics related to scientific literacy. I occasionally
131
- discuss intelligent design, creationism, science denial, and other political/social
132
- influences on scientific literacy. Additional topics: philosophy, baseball,
133
- scientific culture, and Shakespeare. My main theme is <b><u>scientific explanation</u></b>.","language":"en","favicon":null,"feed_url":"http://sfmatheson.blogspot.com/feeds/posts/default","home_page_url":"http://sfmatheson.blogspot.com/","user_id":"8498eaf6-8c58-4b58-bc15-27eda292b1aa","created_at":"2023-05-31T14:21:27+00:00","indexed_at":"2023-04-18","feed_format":"application/atom+xml","license":"https://creativecommons.org/licenses/by/4.0/legalcode","generator":"Blogger
134
- 7.00","category":"Social Sciences","prefix":"10.59350","modified_at":"2023-06-06T20:22:00+00:00","version":"https://jsonfeed.org/version/1.1","backlog":true,"authors":null}}'
135
- recorded_at: Sun, 18 Jun 2023 15:23:52 GMT
136
- recorded_with: VCR 6.1.0
55
+ taught in...","published_at":1673233380,"updated_at":1680470227,"indexed_at":1689006804,"authors":[{"url":null,"name":"Stephen
56
+ Matheson"}],"image":null,"tags":["Introduction"],"language":"en","reference":[],"blog_id":"5764g49","blog_name":"Quintessence
57
+ of Dust","blog":{"id":"5764g49","title":"Quintessence of Dust","description":"<i>Quintessence
58
+ of Dust</i> explores science, society, and human nature, focusing on genetics,
59
+ development, evolution, neuroscience, systems biology, and topics related
60
+ to scientific literacy. I occasionally discuss intelligent design, creationism,
61
+ science denial, and other political/social influences on scientific literacy.
62
+ Additional topics: philosophy, baseball, scientific culture, and Shakespeare.
63
+ My main theme is <b><u>scientific explanation</u></b>.","language":"en","favicon":null,"feed_url":"http://sfmatheson.blogspot.com/feeds/posts/default","home_page_url":"http://sfmatheson.blogspot.com/","user_id":"8498eaf6-8c58-4b58-bc15-27eda292b1aa","created_at":"2023-05-31T14:21:27+00:00","indexed_at":"2023-04-18","feed_format":"application/atom+xml","license":"https://creativecommons.org/licenses/by/4.0/legalcode","generator":"Blogger
64
+ 7.00","category":"Social Sciences","prefix":"10.59350","modified_at":"2023-07-05T03:41:45+00:00","version":"https://jsonfeed.org/version/1.1","backlog":true,"current_feed_url":null,"expired":null}}'
65
+ recorded_at: Mon, 10 Jul 2023 21:04:54 GMT
66
+ recorded_with: VCR 6.2.0
@@ -23,28 +23,28 @@ http_interactions:
23
23
  Cache-Control:
24
24
  - public, max-age=0, must-revalidate
25
25
  Content-Length:
26
- - '6686'
26
+ - '2018'
27
27
  Content-Type:
28
28
  - application/json; charset=utf-8
29
29
  Date:
30
- - Sun, 18 Jun 2023 15:23:54 GMT
30
+ - Mon, 10 Jul 2023 21:04:51 GMT
31
31
  Etag:
32
- - '"w9llnwc692558"'
32
+ - '"rlf5k9cygn1ju"'
33
33
  Server:
34
34
  - Vercel
35
35
  Strict-Transport-Security:
36
36
  - max-age=63072000
37
37
  X-Matched-Path:
38
- - "/api/posts/[slug]"
38
+ - "/api/posts/[[...params]]"
39
39
  X-Vercel-Cache:
40
40
  - MISS
41
41
  X-Vercel-Id:
42
- - fra1::iad1::22vn2-1687101834016-bcd59dbcc91c
42
+ - fra1::iad1::9gxbv-1689023091514-026dffac583b
43
43
  Connection:
44
44
  - close
45
45
  body:
46
46
  encoding: UTF-8
47
- string: '{"id":"https://doi.org/10.59350/37y2z-gre70","uuid":"f3629c86-06e0-42c0-844a-266b03a91ef1","url":"https://iphylo.blogspot.com/2023/05/ten-years-and-million-links.html","title":"Ten
47
+ string: '{"id":"f3629c86-06e0-42c0-844a-266b03a91ef1","doi":"https://doi.org/10.59350/37y2z-gre70","url":"https://iphylo.blogspot.com/2023/05/ten-years-and-million-links.html","title":"Ten
48
48
  years and a million links","summary":"As trailed on a Twitter thread last
49
49
  week I’ve been working on a manuscript describing the efforts to map taxonomic
50
50
  names to their original descriptions in the taxonomic literature. Putting
@@ -52,52 +52,13 @@ http_interactions:
52
52
  basically “um, what, exactly, have you been doing all these years?”. TL;DR
53
53
  Across fungi, plants, and animals approx 1.3 million names have been linked
54
54
  to a persistent identifier for a publication.— Roderic Page (@rdmpage) May
55
- 25,...","date_published":"2023-05-31T17:26:00Z","date_modified":"2023-05-31T17:29:40Z","date_indexed":"2023-06-16T11:31:55.22232+00:00","authors":[{"url":null,"name":"Roderic
56
- Page"}],"image":null,"content_html":"<p>As trailed on a Twitter thread last
57
- week I’ve been working on a manuscript describing the efforts to map taxonomic
58
- names to their original descriptions in the taxonomic literature.</p>\n<blockquote
59
- class=\"twitter-tweet\"><p lang=\"en\" dir=\"ltr\">Putting together a manuscript
60
- on linking taxonomic names to the primary literature, basically “um, what,
61
- exactly, have you been doing all these years?”. TL;DR Across fungi, plants,
62
- and animals approx 1.3 million names have been linked to a persistent identifier
63
- for a publication.</p>— Roderic Page (@rdmpage) <a href=\"https://twitter.com/rdmpage/status/1661714128413573120?ref_src=twsrc%5Etfw\">May
64
- 25, 2023</a></blockquote> \n<p>The preprint is on bioRxiv <a href=\"https://doi.org/10.1101/2023.05.29.542697\">doi:10.1101/2023.05.29.542697</a></p>\n<blockquote>\n<p>A
65
- major gap in the biodiversity knowledge graph is a connection between taxonomic
66
- names and the taxonomic literature. While both names and publications often
67
- have persistent identifiers (PIDs), such as Life Science Identifiers (LSIDs)
68
- or Digital Object Identifiers (DOIs), LSIDs for names are rarely linked to
69
- DOIs for publications. This article describes efforts to make those connections
70
- across three large taxonomic databases: Index Fungorum, International Plant
71
- Names Index (IPNI), and the Index of Organism Names (ION). Over a million
72
- names have been matched to DOIs or other persistent identifiers for taxonomic
73
- publications. This represents approximately 36% of names for which publication
74
- data is available. The mappings between LSIDs and publication PIDs are made
75
- available through ChecklistBank. Applications of this mapping are discussed,
76
- including a web app to locate the citation of a taxonomic name, and a knowledge
77
- graph that uses data on researcher’s ORCID ids to connect taxonomic names
78
- and publications to authors of those names.</p>\n</blockquote>\n<p>Much of
79
- the work has been linking taxa to names, which still has huge gaps. There
80
- are also interesting differences in coverage between plants, animals, and
81
- fungi (see preprint for details).</p>\n\n<div class=\"separator\" style=\"clear:
82
- both;\"><a href=\"https://blogger.googleusercontent.com/img/b/R29vZ2xl/AVvXsEhdWsSQhqi1DErXMIHm28g37-fiALNIsI5eQZmvoX_Fe03ZSwtKHbYt-LCsCCAUop0AGcwy_w7NpIjylVH1hNrM9oW-6j9e6tHASha49TTqFvDg2_tEx3r74RRFsjUo4M_Qat8NmKaZSChOt2hI3LsMjTVLrEVirEckU-9Ei7ug-7OHQlR4LA/s2276/animals-coverage.png\"
83
- style=\"display: block; padding: 1em 0; text-align: center; \"><img alt=\"\"
84
- border=\"0\" width=\"320\" data-original-height=\"2276\" data-original-width=\"2276\"
85
- src=\"https://blogger.googleusercontent.com/img/b/R29vZ2xl/AVvXsEhdWsSQhqi1DErXMIHm28g37-fiALNIsI5eQZmvoX_Fe03ZSwtKHbYt-LCsCCAUop0AGcwy_w7NpIjylVH1hNrM9oW-6j9e6tHASha49TTqFvDg2_tEx3r74RRFsjUo4M_Qat8NmKaZSChOt2hI3LsMjTVLrEVirEckU-9Ei7ug-7OHQlR4LA/s320/animals-coverage.png\"/></a></div><div
86
- class=\"separator\" style=\"clear: both;\"><a href=\"https://blogger.googleusercontent.com/img/b/R29vZ2xl/AVvXsEjdyxlVJ-oyMCNPmHtHWjSxdxMSJvgzdWRGRF6Ad4dk7ab7gGDpuKdKmS9XhROkopw361ylfsTd1ZkwkF6BN0JlWNnVLCKY1AfryCfWKHkgPQM7u-0SELW9j8RlQIflb6ibaV64gwW7oJrEvOGECvR51F8EW8cRg-1usW-GBM5ymObj7zlObQ/s2276/fungi-coverage.png\"
87
- style=\"display: block; padding: 1em 0; text-align: center; \"><img alt=\"\"
88
- border=\"0\" width=\"320\" data-original-height=\"2276\" data-original-width=\"2276\"
89
- src=\"https://blogger.googleusercontent.com/img/b/R29vZ2xl/AVvXsEjdyxlVJ-oyMCNPmHtHWjSxdxMSJvgzdWRGRF6Ad4dk7ab7gGDpuKdKmS9XhROkopw361ylfsTd1ZkwkF6BN0JlWNnVLCKY1AfryCfWKHkgPQM7u-0SELW9j8RlQIflb6ibaV64gwW7oJrEvOGECvR51F8EW8cRg-1usW-GBM5ymObj7zlObQ/s320/fungi-coverage.png\"/></a></div><div
90
- class=\"separator\" style=\"clear: both;\"><a href=\"https://blogger.googleusercontent.com/img/b/R29vZ2xl/AVvXsEgf0YBuvNSXWAJTfQ1jk4XSocMzCYHP7t6IPUqhjQ3mftgM_850igWaD2copgNH6Xk6T62xBU641wvwOvXgCCDY3m2xC_gaILXO9RGx8H3Gpy5OOncsLb9smpT2LIgtYOExVBVdDRWqA0AZ8-mQjWL7dL5TiG7MqVu8spT8ACoGOPR_T36hRA/s2276/plants-coverage.png\"
91
- style=\"display: block; padding: 1em 0; text-align: center; \"><img alt=\"\"
92
- border=\"0\" width=\"320\" data-original-height=\"2276\" data-original-width=\"2276\"
93
- src=\"https://blogger.googleusercontent.com/img/b/R29vZ2xl/AVvXsEgf0YBuvNSXWAJTfQ1jk4XSocMzCYHP7t6IPUqhjQ3mftgM_850igWaD2copgNH6Xk6T62xBU641wvwOvXgCCDY3m2xC_gaILXO9RGx8H3Gpy5OOncsLb9smpT2LIgtYOExVBVdDRWqA0AZ8-mQjWL7dL5TiG7MqVu8spT8ACoGOPR_T36hRA/s320/plants-coverage.png\"/></a></div>\n\n\nThere
94
- is also a simple app to demonstrate these links, see <a href=\"https://species-cite.herokuapp.com\">https://species-cite.herokuapp.com</a>.\n\n\n\n<blockquote>\n<p>Written
95
- with <a href=\"https://stackedit.io/\">StackEdit</a>.</p>\n</blockquote>","tags":[],"language":"en","references":[],"blog_id":"tyfqw20","blog":{"id":"tyfqw20","title":"iPhylo","description":"Rants,
55
+ 25,...","published_at":1685553960,"updated_at":1685554180,"indexed_at":1689006804,"authors":[{"url":"https://orcid.org/0000-0002-7101-9767","name":"Roderic
56
+ Page"}],"image":null,"tags":[],"language":"en","reference":[],"blog_id":"tyfqw20","blog_name":"iPhylo","blog":{"id":"tyfqw20","title":"iPhylo","description":"Rants,
96
57
  raves (and occasionally considered opinions) on phyloinformatics, taxonomy,
97
58
  and biodiversity informatics. For more ranty and less considered opinions,
98
59
  see my <a href=\"https://twitter.com/rdmpage\">Twitter feed</a>.<br>ISSN 2051-8188.
99
60
  Written content on this site is licensed under a <a href=\"https://creativecommons.org/licenses/by/4.0/\">Creative
100
61
  Commons Attribution 4.0 International license</a>.","language":"en","favicon":null,"feed_url":"https://iphylo.blogspot.com/feeds/posts/default","home_page_url":"https://iphylo.blogspot.com/","user_id":"8498eaf6-8c58-4b58-bc15-27eda292b1aa","created_at":"2023-05-31T08:03:14+00:00","indexed_at":"2023-02-06","feed_format":"application/atom+xml","license":"https://creativecommons.org/licenses/by/4.0/legalcode","generator":"Blogger
101
- 7.00","category":"Natural Sciences","prefix":"10.59350","modified_at":"2023-05-31T17:26:00+00:00","version":"https://jsonfeed.org/version/1.1","backlog":true,"authors":null}}'
102
- recorded_at: Sun, 18 Jun 2023 15:23:54 GMT
103
- recorded_with: VCR 6.1.0
62
+ 7.00","category":"Natural Sciences","prefix":"10.59350","modified_at":"2023-06-17T15:38:20+00:00","version":"https://jsonfeed.org/version/1.1","backlog":true,"current_feed_url":null,"expired":null}}'
63
+ recorded_at: Mon, 10 Jul 2023 21:04:52 GMT
64
+ recorded_with: VCR 6.2.0
@@ -13,6 +13,52 @@ http_interactions:
13
13
  - rogue-scholar.org
14
14
  User-Agent:
15
15
  - http.rb/5.1.1
16
+ response:
17
+ status:
18
+ code: 404
19
+ message: Not Found
20
+ headers:
21
+ Age:
22
+ - '0'
23
+ Cache-Control:
24
+ - public, max-age=0, must-revalidate
25
+ Content-Length:
26
+ - '28'
27
+ Content-Type:
28
+ - application/json; charset=utf-8
29
+ Date:
30
+ - Mon, 10 Jul 2023 21:04:46 GMT
31
+ Etag:
32
+ - '"jtxxi9yf69s"'
33
+ Server:
34
+ - Vercel
35
+ Strict-Transport-Security:
36
+ - max-age=63072000
37
+ X-Matched-Path:
38
+ - "/api/posts/[[...params]]"
39
+ X-Vercel-Cache:
40
+ - MISS
41
+ X-Vercel-Id:
42
+ - fra1::iad1::bkz2t-1689023085834-cfabfa78ce26
43
+ Connection:
44
+ - close
45
+ body:
46
+ encoding: UTF-8
47
+ string: '{"message":"Post not found"}'
48
+ recorded_at: Mon, 10 Jul 2023 21:04:46 GMT
49
+ - request:
50
+ method: get
51
+ uri: https://rogue-scholar.org/api/posts/153d65e1-f0e4-49a6-a969-33d2129800ba
52
+ body:
53
+ encoding: UTF-8
54
+ string: ''
55
+ headers:
56
+ Connection:
57
+ - close
58
+ Host:
59
+ - rogue-scholar.org
60
+ User-Agent:
61
+ - http.rb/5.1.1
16
62
  response:
17
63
  status:
18
64
  code: 200
@@ -23,193 +69,38 @@ http_interactions:
23
69
  Cache-Control:
24
70
  - public, max-age=0, must-revalidate
25
71
  Content-Length:
26
- - '14782'
72
+ - '1692'
27
73
  Content-Type:
28
74
  - application/json; charset=utf-8
29
75
  Date:
30
- - Sun, 18 Jun 2023 15:23:53 GMT
76
+ - Tue, 11 Jul 2023 05:58:11 GMT
31
77
  Etag:
32
- - '"wzh4e4jhaxbem"'
78
+ - '"z7ox1e74871b0"'
33
79
  Server:
34
80
  - Vercel
35
81
  Strict-Transport-Security:
36
82
  - max-age=63072000
37
83
  X-Matched-Path:
38
- - "/api/posts/[slug]"
84
+ - "/api/posts/[[...params]]"
39
85
  X-Vercel-Cache:
40
86
  - MISS
41
87
  X-Vercel-Id:
42
- - fra1::iad1::r4svw-1687101833448-3467c5c4b7d4
88
+ - fra1::iad1::kz72z-1689055090778-9a199d4a33af
43
89
  Connection:
44
90
  - close
45
91
  body:
46
92
  encoding: UTF-8
47
- string: '{"id":"https://doi.org/10.59350/ytvy2-59450","uuid":"6179ad80-cc7f-4904-9260-0ecb3c3a90ba","url":"https://www.ideasurg.pub/academic-powerhouse/","title":"How
48
- to Build an Academic Powerhouse: Let''s Study Who''s Doing it","summary":"A
49
- Data Exploration with Public Data from the Academic Surgical Congress","date_published":"2023-06-03T04:54:30Z","date_modified":null,"date_indexed":"2023-06-16T14:13:56.969774+00:00","authors":[{"url":null,"name":"Tejas
50
- S. Sathe, MD"}],"image":null,"content_html":"<p>Students and residents aspiring
51
- for a career in academic surgery are looking for training programs that will
52
- help jumpstart their careers by exposing them to mentorship and opportunities
53
- to conduct research. While the gold standard of academic productivity (for
54
- the time being) remains peer-reviewed publications, conference presentations
55
- are an important secondary metric. In addition to feeding eventual papers,
56
- conference talks allow trainees to practice presentation skills, build their
57
- networks, and learn about the work being done at peer institutions and the
58
- field more broadly. Residents pursuing professional development are encouraged
59
- to apply to and attend conferences, though in the post COVID era the cost
60
- of conference attendance and travel are being re-evaluated. Even moreso than
61
- publications, conference presentations are typically led by students and residents.
62
- For now, academic conference participation can serve as an important albeit
63
- limited metric to evaluate an overall institution''s research power &#x2013;
64
- especially as it relates to trainees.</p><p>In order to understand how to
65
- build a successful research program, we wanted to understand who had already
66
- done so. Conceivably, by finding successful examples, we can conduct interviews
67
- and focus groups among key stakeholders at these programs to understand what
68
- they did, and how these actions can be replicated. We were particularly interested
69
- in seeing which programs demonstrated a high number of accepted abstracts
70
- and which programs were able to improve their abstract performance from year
71
- to year. </p><p>The <a href=\"https://www.academicsurgicalcongress.org/?ref=ideasurg.pub\">Academic
72
- Surgical Congress</a> (ASC) is a joint surgical meeting co-hosted by the <a
73
- href=\"https://www.aasurg.org/?ref=ideasurg.pub\">Association for Academic
74
- Surgery</a> (AAS) and the <a href=\"https://www.susweb.org/?ref=ideasurg.pub\">Society
75
- for University Surgeons</a> (SUS) and held annually in February. Anecdotally,
76
- it is a popular conference for students and residents to attend. The ASC maintains
77
- a public archive of all abstracts dating from 2015-2020. We obtained a machine
78
- readable version of this public database through the webmaster (this version
79
- of the data spans 2016 to 2023).</p><p>For each abstract, we looked at the
80
- year and primary institution at which the work was conducted. In order to
81
- intuit the primary institution, we searched the institution block string for
82
- the first presence of \"university\", \"hospital\", \"institute\", or \"medical
83
- center\" or the first expression to occur before a comma. This method was
84
- chosen as institutions&#x2019; names are written variably (Department of Surgery,
85
- University Hospital, New York, NY vs. University Hospital, Division of Colorectal
86
- Surgery, Department of Surgery, New York, NY). Unfortunately, our code is
87
- unable to merge slight variations in the resultant institution name (University
88
- of Michigan vs. University of Michigan Ann Arbor). </p><p>In order to do a
89
- primary survey of institutional trends in this dataset, we conducted the following
90
- analyses. First, we measured the number of abstracts accepted each year from
91
- 2016 to 2023. Second, we looked at the number of accepted abstracts by institution
92
- over the entire study period. Then, we looked at the number of abstract institutions
93
- by institution and year to study changes in institutional trends over time.
94
- Finally, we did a subset analysis on post-COVID data (2021 to 2023) to look
95
- at absolute and per cent year-over-year changes in accepted abstracts to see
96
- which institutions were able to significantly increase their abstract performance
97
- in one year. </p><h3 id=\"accepted-abstracts-are-increasing-but-down-from-peak\">Accepted
98
- Abstracts are increasing but down from peak</h3><p>We plotted the total number
99
- of abstracts accepted by year. The number of accepted abstracts increased
100
- from 1125 in 2016 to an all-time high of 1742 in 2020 before declining to
101
- 922 and 848 in 2021 and 2022, respectively. Accepted abstracts have since
102
- rebounded to 1469 in 2023, or roughly 84% of the maximum amount. Of note,
103
- the 2021 and 2022 meetings were held virtually due to the COVID-19 pandemic.
104
- Conversely the 2020 meeting was held immediately prior to the institution
105
- of lockdowns and other social distancing policies.</p><figure class=\"kg-card
106
- kg-image-card kg-width-wide\"><img src=\"https://www.ideasurg.pub/content/images/2023/06/newplot--1-.png\"
107
- class=\"kg-image\" alt loading=\"lazy\" width=\"1400\" height=\"800\" srcset=\"https://www.ideasurg.pub/content/images/size/w600/2023/06/newplot--1-.png
108
- 600w, https://www.ideasurg.pub/content/images/size/w1000/2023/06/newplot--1-.png
109
- 1000w, https://www.ideasurg.pub/content/images/2023/06/newplot--1-.png 1400w\"
110
- sizes=\"(min-width: 1200px) 1200px\"></figure><h3 id=\"alabama-michigan-lead-abstract-acceptances-during-study-period\">Alabama,
111
- Michigan lead abstract acceptances during study period</h3><p>Next, we plotted
112
- the total number of accepted abstracts by institution. The graph shows data
113
- for the twenty leading institutions. The University of Alabama and the University
114
- of Michigan lead in abstract acceptances during the study period (477 and
115
- 348, respectively). Given an eight year time-range, the top twenty institutions
116
- reflect an average annual abstract acceptance ranging from roughly thirteen
117
- to 60.</p><figure class=\"kg-card kg-image-card kg-width-wide\"><img src=\"https://www.ideasurg.pub/content/images/2023/06/newplot--2-.png\"
118
- class=\"kg-image\" alt loading=\"lazy\" width=\"1400\" height=\"800\" srcset=\"https://www.ideasurg.pub/content/images/size/w600/2023/06/newplot--2-.png
119
- 600w, https://www.ideasurg.pub/content/images/size/w1000/2023/06/newplot--2-.png
120
- 1000w, https://www.ideasurg.pub/content/images/2023/06/newplot--2-.png 1400w\"
121
- sizes=\"(min-width: 1200px) 1200px\"></figure><p>We also plotted the number
122
- of accepted abstracts by year using a separate line plot for each individual.
123
- While Michigan has maintained between 30 and 60 abstracts for each year, Alabama
124
- went from 6 to 48 abstracts between 2016 and 2017 and has maintained greater
125
- than 60 accepted abstracts each year. There is a notable dip in the number
126
- of accepted abstracts from 2021 to 2022, consistent with a similar trend in
127
- the total yearly acceptance data. </p><figure class=\"kg-card kg-image-card
128
- kg-width-wide\"><img src=\"https://www.ideasurg.pub/content/images/2023/06/newplot--8-.png\"
129
- class=\"kg-image\" alt loading=\"lazy\" width=\"1400\" height=\"800\" srcset=\"https://www.ideasurg.pub/content/images/size/w600/2023/06/newplot--8-.png
130
- 600w, https://www.ideasurg.pub/content/images/size/w1000/2023/06/newplot--8-.png
131
- 1000w, https://www.ideasurg.pub/content/images/2023/06/newplot--8-.png 1400w\"
132
- sizes=\"(min-width: 1200px) 1200px\"></figure><p>Overall, there appears to
133
- be a general clustering of the other eighteen institutions in the top twenty,
134
- a trend seen in both the aggregate and the year-to-year data.</p><h3 id=\"mgh-brigham-lead-absolute-and-per-cent-increase-in-abstracts-in-2023\">MGH,
135
- Brigham lead absolute and per cent increase in abstracts in 2023</h3><p>Next,
136
- we measured the absolute and percent change between accepted abstracts in
137
- consecutive years for the top twenty institutions. We restricted our analysis
138
- to 2021, 2022, and 2023. The greatest absolute increases in accepted abstracts
139
- came from Massachusetts General Hospital in 2023 (27), Brigham and Women''s
140
- Hospital in 2023 (16), and UCLA in 2022 (16). The greatest percentage increases
141
- in accepted abstracts came from Brigham and Women''s Hospital in 2023 (800%),
142
- Johns Hopkins in 2023 (500%), and Massachusetts General Hospital in 2023 (386%).
143
- Of note, Johns Hopkins and Brigham and Women''s Hospital also had the largest
144
- absolute and percentage decrease in accepted abstracts in 2022. Interestingly,
145
- University of Alabama (+4 in 2022, +3 in 2023) and University of Michigan
146
- (+11 in 2023) &#xA0;- which rank at the top in all time and yearly abstracts
147
- - experienced less extreme swings during the 2021-2023 time period.</p><figure
148
- class=\"kg-card kg-image-card kg-width-wide\"><img src=\"https://www.ideasurg.pub/content/images/2023/06/newplot--7-.png\"
149
- class=\"kg-image\" alt loading=\"lazy\" width=\"1400\" height=\"800\" srcset=\"https://www.ideasurg.pub/content/images/size/w600/2023/06/newplot--7-.png
150
- 600w, https://www.ideasurg.pub/content/images/size/w1000/2023/06/newplot--7-.png
151
- 1000w, https://www.ideasurg.pub/content/images/2023/06/newplot--7-.png 1400w\"
152
- sizes=\"(min-width: 1200px) 1200px\"></figure><figure class=\"kg-card kg-image-card
153
- kg-width-wide\"><img src=\"https://www.ideasurg.pub/content/images/2023/06/newplot--4-.png\"
154
- class=\"kg-image\" alt loading=\"lazy\" width=\"1400\" height=\"800\" srcset=\"https://www.ideasurg.pub/content/images/size/w600/2023/06/newplot--4-.png
155
- 600w, https://www.ideasurg.pub/content/images/size/w1000/2023/06/newplot--4-.png
156
- 1000w, https://www.ideasurg.pub/content/images/2023/06/newplot--4-.png 1400w\"
157
- sizes=\"(min-width: 1200px) 1200px\"></figure><h3 id=\"conclusions\">Conclusions</h3><p>In
158
- this data exploration, we analyzed abstract acceptance data for the Academic
159
- Surgical Congress between 2016 and 2023. We showed that the number of abstracts
160
- increased from 2016 to 2020, dipped in 2021 and 2022, and is recovering in
161
- 2023 - likely reflecting the variability forced by COVID19 and the transition
162
- to virtual conferences in 2021 and 2022. We also showed that the University
163
- of Alabama and the University of Michigan have significantly led accepted
164
- abstracts throughout the study period with University of Alabama maintaining
165
- a top position following an impressive 700 percent increase in abstracts between
166
- 2016 and 2017. In 2023, Massachusetts General Hospital and Brigham and Women''s
167
- Hospital have led absolute and percent increases in abstract submissions,
168
- though this may reflect some degree of reversion following drops in abstract
169
- acceptances in 2022.</p><h3 id=\"limitations-and-future-directions\">Limitations
170
- and Future Directions</h3><p>This data exploration has several limitations.
171
- First, our study is limited to one conference and conferences themselves are
172
- only a limited component of academic productivity. However, the Academic Surgical
173
- Congress is an international meeting that is well regarded, popular among
174
- trainees, and has consistent multi-year data. Another limitation of our study
175
- is our assumption that the first institution listed in the author block is
176
- the primary institution&#x2013;a method which does not take into account multi-institutional
177
- abstracts. However, we suspect this reflects the minority of the abstracts.
178
- Finally, we have not fully optimized name-matching to correctly combine terms
179
- like \"University of Michigan\" and \"University of Michigan Ann Arbor\".
180
- However, given that most of the data currently is only for the top 20 institutions,
181
- we believe the overall trends will be preserved.</p><p>In the future, we can
182
- attempt to obtain more granular data on authors and institutions and optimize
183
- the capture of this data for aggregated analysis. We are also researching
184
- different techniques to perform string matching to fix the institution name
185
- issue. We can improve the generalizability of our findings by bringing in
186
- similar data from other large meetings &#x2013; such as the American College
187
- of Surgeons Clinical Congress and the Society of American Gastrointestinal
188
- and Endoscopic Surgeons (SAGES). We can also use the PubMed API to perform
189
- similar analyses in top surgical journals such as JAMA Surgery or the Annals
190
- of Surgery.</p><p>With regards to the data we have obtained, we can conduct
191
- survey-based studies or focus groups with key stakeholders from institutions
192
- that have demonstrated strong abstract performance during the study period
193
- as well as those who have shown significant improvement. By talking to department
194
- chairs, program directors, and research and education leaders we can understand
195
- what steps each institution took to improve abstract acceptance (e.g. hiring
196
- a new research faculty, creating a mentorship program, providing administrative
197
- support for IRBs/stats etc.). Following this, we can map individual interventions
198
- to improvements to understand the contribution that each can have on increased
199
- academic productivity.</p><p>We have also not yet mined the abstract body
200
- for themes. Using natural language processing, we can understand how themes
201
- and trends of emergent research change from year to year, and even develop
202
- models to predict which topics will be of interest in future works. This will
203
- likely be the subject of a future data exploration.</p><p>Overall, we hope
204
- to demonstrate that abstract acceptance data from a single international meeting
205
- can provide interesting, meaningful data on which programs have strong research
206
- infrastructure and which programs are making strides to achieve it. By studying
207
- this data and improving the inputs, we can better understand whose example
208
- to follow and ultimately develop a playbook that all institutions can employ
209
- to maximize the academic opportunities of students and trainees.</p><h3 id=\"see-the-data\">See
210
- the Data</h3><p>You can see the raw data as well as all of our code here,
211
- and use this for your own studies with appropriate attribution.</p><p><a href=\"https://deepnote.com/@tejas-sathe-a73f/ASC-Data-Exploration-948ca211-bfc7-459b-9d6d-ef952a5baf32?ref=ideasurg.pub\">https://deepnote.com/@tejas-sathe-a73f/ASC-Data-Exploration-948ca211-bfc7-459b-9d6d-ef952a5baf32</a></p>","tags":["Pre-Print"],"language":"en","references":[],"blog_id":"3cxcm20","blog":{"id":"3cxcm20","title":"I.D.E.A.S.","description":"Innovation
93
+ string: '{"id":"153d65e1-f0e4-49a6-a969-33d2129800ba","doi":"https://doi.org/10.59350/ytvy2-59450","url":"https://www.ideasurg.pub/academic-powerhouse","title":"How
94
+ to Build an Academic Powerhouse: Let''s Study Who''s Doing it","summary":"Students
95
+ and residents aspiring for a career in academic surgery are looking for training
96
+ programs that will help jumpstart their careers by exposing them to mentorship
97
+ and opportunities to conduct research. While the gold standard of academic
98
+ productivity (for the time being) remains peer-reviewed publications, conference
99
+ posters and presentations are an important secondary metric. In addition to
100
+ feeding eventual papers, conference talks allow trainees to practice presentation
101
+ skills, build...","published_at":1685768070,"updated_at":1685768070,"indexed_at":1689006804,"authors":[{"url":null,"name":"Tejas
102
+ S. Sathe, MD"}],"image":null,"tags":["Pre-Print"],"language":"en","reference":[],"blog_id":"3cxcm20","blog_name":"I.D.E.A.S.","blog":{"id":"3cxcm20","title":"I.D.E.A.S.","description":"Innovation
212
103
  and Design Experiments in Academic Surgery (I.D.E.A.S.)","language":"en","favicon":"https://www.ideasurg.pub/favicon.png","feed_url":"https://www.ideasurg.pub/rss/","home_page_url":"https://www.ideasurg.pub/","user_id":"8498eaf6-8c58-4b58-bc15-27eda292b1aa","created_at":"2023-05-31T13:44:29+00:00","indexed_at":"2023-01-04","feed_format":"application/rss+xml","license":"https://creativecommons.org/licenses/by/4.0/legalcode","generator":"Ghost
213
- 5.51","category":"Medical and Health Sciences","prefix":"10.59350","modified_at":"2023-06-03T04:54:30+00:00","version":"https://jsonfeed.org/version/1.1","backlog":false,"authors":null}}'
214
- recorded_at: Sun, 18 Jun 2023 15:23:53 GMT
215
- recorded_with: VCR 6.1.0
104
+ 5.53","category":"Medical and Health Sciences","prefix":"10.59350","modified_at":"2023-06-03T04:54:30+00:00","version":"https://jsonfeed.org/version/1.1","backlog":false,"current_feed_url":null,"expired":null}}'
105
+ recorded_at: Tue, 11 Jul 2023 05:58:11 GMT
106
+ recorded_with: VCR 6.2.0