RubyGems - youtube-transcript-rb - Versions diffs - 0.2.0 → 0.2.3 - Mend

youtube-transcript-rb 0.2.0 → 0.2.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (24) hide show

checksums.yaml +4 -4
data/.rubocop.yml +9 -0
data/.rubocop_todo.yml +166 -0
data/README.md +9 -9
data/lib/youtube-transcript-rb.rb +4 -0
data/lib/youtube_rb/formatters.rb +263 -0
data/lib/youtube_rb/transcript/api.rb +7 -11
data/lib/youtube_rb/transcript/errors.rb +3 -3
data/lib/youtube_rb/transcript/transcript.rb +2 -2
data/lib/youtube_rb/transcript/transcript_list.rb +3 -3
data/lib/youtube_rb/transcript/transcript_list_fetcher.rb +16 -19
data/lib/youtube_rb/transcript.rb +0 -2
data/lib/youtube_rb/{transcript/version.rb → version.rb} +1 -3
data/sig/youtube_rb/transcript.rbs +0 -2
data/spec/api_spec.rb +8 -8
data/spec/errors_spec.rb +2 -2
data/spec/formatters_spec.rb +34 -35
data/spec/integration_spec.rb +14 -23
data/spec/spec_helper.rb +51 -51
data/spec/transcript_list_fetcher_spec.rb +11 -6
data/spec/transcript_list_spec.rb +15 -18
data/spec/transcript_spec.rb +9 -10
metadata +8 -4
data/lib/youtube_rb/transcript/formatters.rb +0 -267

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: 6d97023aca42aac08e42c3857d940e3a42ba735c895685522048caee415fe4af
-  data.tar.gz: 1d435b06743716beb8f3e892bc97a2c7d105f6ab710f61659cd24dd6ce438a81
+  metadata.gz: 60cad31d1d80bf186d231cf3eed48cd1599f41000a3de1a185e24480421ea0dd
+  data.tar.gz: cc370e6e42208f18a0ed456800de0f2e8b470754c63908149171c5558e15500a
 SHA512:
-  metadata.gz: 5b5f345ebcef944ba98ae4adcc42d9951c5e04bf0230e98c18dc41e0b3b715cfe57a34722924042cbcf9b7244d00ad31767bc2ce287136656c2b05b3378f2db8
-  data.tar.gz: 07ba07e26a8ff0f895c64767869bda918122c35b21b39b945fc608067d864643712386987155e3ae1dbe24f5310410e642aa58fd03f1c15f4df358567a51fae2
+  metadata.gz: 42f16cf9961a05528f4289886ebb08b2b06cb9060fbecfc6b41ffd4267920ef0d2123afec048c231a4f507bd44a8f1df9e383addbb3390e4e9076d9617bb22ba
+  data.tar.gz: b529273917d15dca2f50d28b5c7ea6f04d359c111346bd0ef4547db86b7a016dae83fdefce80b75784b43849931c6595c67833d4977e8b816176bca027883491

data/.rubocop.yml ADDED Viewed

@@ -0,0 +1,9 @@
+inherit_from: .rubocop_todo.yml
+plugins:
+  - rubocop-rake
+  - rubocop-rspec
+AllCops:
+  NewCops: enable
+  TargetRubyVersion: 3.2

data/.rubocop_todo.yml ADDED Viewed

@@ -0,0 +1,166 @@
+# This configuration was generated by
+# `rubocop --auto-gen-config`
+# on 2026-01-09 13:39:24 UTC using RuboCop version 1.82.1.
+# The point is for the user to remove these configuration records
+# one by one as the offenses are removed from the code base.
+# Note that changes in the inspected code, or installation of new
+# versions of RuboCop, may require this file to be generated again.
+# Offense count: 3
+# This cop supports safe autocorrection (--autocorrect).
+# Configuration parameters: AllowUnusedKeywordArguments, IgnoreEmptyMethods, IgnoreNotImplementedMethods, NotImplementedExceptions.
+# NotImplementedExceptions: NotImplementedError
+Lint/UnusedMethodArgument:
+  Exclude:
+    - 'lib/youtube_rb/formatters.rb'
+# Offense count: 3
+# Configuration parameters: AllowedMethods, AllowedPatterns, CountRepeatedAttributes.
+Metrics/AbcSize:
+  Max: 25
+# Offense count: 1
+# Configuration parameters: CountComments, CountAsOne.
+Metrics/ClassLength:
+  Max: 103
+# Offense count: 2
+# Configuration parameters: AllowedMethods, AllowedPatterns.
+Metrics/CyclomaticComplexity:
+  Max: 14
+# Offense count: 7
+# Configuration parameters: CountComments, CountAsOne, AllowedMethods, AllowedPatterns.
+Metrics/MethodLength:
+  Max: 29
+# Offense count: 1
+# Configuration parameters: CountKeywordArgs, MaxOptionalParameters.
+Metrics/ParameterLists:
+  Max: 7
+# Offense count: 2
+# Configuration parameters: AllowedMethods, AllowedPatterns.
+Metrics/PerceivedComplexity:
+  Max: 15
+# Offense count: 1
+# Configuration parameters: ExpectMatchingDefinition, CheckDefinitionPathHierarchy, CheckDefinitionPathHierarchyRoots, Regex, IgnoreExecutableScripts, AllowedAcronyms.
+# CheckDefinitionPathHierarchyRoots: lib, spec, test, src
+# AllowedAcronyms: CLI, DSL, ACL, API, ASCII, CPU, CSS, DNS, EOF, GUID, HTML, HTTP, HTTPS, ID, IP, JSON, LHS, QPS, RAM, RHS, RPC, SLA, SMTP, SQL, SSH, TCP, TLS, TTL, UDP, UI, UID, UUID, URI, URL, UTF8, VM, XML, XMPP, XSRF, XSS
+Naming/FileName:
+  Exclude:
+    - 'Rakefile.rb'
+    - 'lib/youtube-transcript-rb.rb'
+# Offense count: 3
+# Configuration parameters: MinNameLength, AllowNamesEndingInNumbers, AllowedNames, ForbiddenNames.
+# AllowedNames: as, at, by, cc, db, id, if, in, io, ip, of, on, os, pp, to
+Naming/MethodParameterName:
+  Exclude:
+    - 'lib/youtube_rb/formatters.rb'
+# Offense count: 2
+RSpec/BeforeAfterAll:
+  Exclude:
+    - '**/spec/spec_helper.rb'
+    - '**/spec/rails_helper.rb'
+    - '**/spec/support/**/*.rb'
+    - 'spec/integration_spec.rb'
+# Offense count: 2
+# Configuration parameters: IgnoredMetadata.
+RSpec/DescribeClass:
+  Exclude:
+    - '**/spec/features/**/*'
+    - '**/spec/requests/**/*'
+    - '**/spec/routing/**/*'
+    - '**/spec/system/**/*'
+    - '**/spec/views/**/*'
+    - 'spec/integration_spec.rb'
+    - 'spec/settings_spec.rb'
+# Offense count: 30
+# Configuration parameters: CountAsOne.
+RSpec/ExampleLength:
+  Max: 22
+# Offense count: 4
+# This cop supports safe autocorrection (--autocorrect).
+RSpec/ExpectActual:
+  Exclude:
+    - '**/spec/routing/**/*'
+    - 'spec/integration_spec.rb'
+# Offense count: 2
+# Configuration parameters: Max, AllowedIdentifiers, AllowedPatterns.
+RSpec/IndexedLet:
+  Exclude:
+    - 'spec/transcript_spec.rb'
+# Offense count: 91
+RSpec/MultipleExpectations:
+  Max: 7
+# Offense count: 44
+# Configuration parameters: AllowSubject.
+RSpec/MultipleMemoizedHelpers:
+  Max: 11
+# Offense count: 3
+# Configuration parameters: AllowedGroups.
+RSpec/NestedGroups:
+  Max: 4
+# Offense count: 7
+# Configuration parameters: CustomTransform, IgnoreMethods, IgnoreMetadata, InflectorPath, EnforcedInflector.
+# SupportedInflectors: default, active_support
+RSpec/SpecFilePathFormat:
+  Exclude:
+    - '**/spec/routing/**/*'
+    - 'spec/api_spec.rb'
+    - 'spec/errors_spec.rb'
+    - 'spec/formatters_spec.rb'
+    - 'spec/transcript_list_fetcher_spec.rb'
+    - 'spec/transcript_list_spec.rb'
+    - 'spec/transcript_parser_spec.rb'
+    - 'spec/transcript_spec.rb'
+# Offense count: 10
+# Configuration parameters: IgnoreNameless, IgnoreSymbolicNames.
+RSpec/VerifiedDoubles:
+  Exclude:
+    - 'spec/api_spec.rb'
+    - 'spec/errors_spec.rb'
+    - 'spec/transcript_list_fetcher_spec.rb'
+    - 'spec/transcript_spec.rb'
+# Offense count: 1
+# Configuration parameters: AllowedConstants.
+Style/Documentation:
+  Exclude:
+    - 'spec/**/*'
+    - 'test/**/*'
+    - 'lib/youtube_rb/transcript.rb'
+# Offense count: 8
+# This cop supports safe autocorrection (--autocorrect).
+# Configuration parameters: EnforcedStyle, MaxUnannotatedPlaceholdersAllowed, Mode, AllowedMethods, AllowedPatterns.
+# SupportedStyles: annotated, template, unannotated
+Style/FormatStringToken:
+  Exclude:
+    - 'lib/youtube_rb/formatters.rb'
+# Offense count: 1168
+# This cop supports safe autocorrection (--autocorrect).
+# Configuration parameters: EnforcedStyle, ConsistentQuotesInMultiline.
+# SupportedStyles: single_quotes, double_quotes
+Style/StringLiterals:
+  Enabled: false
+# Offense count: 6
+# This cop supports safe autocorrection (--autocorrect).
+# Configuration parameters: AllowHeredoc, AllowURI, AllowQualifiedName, URISchemes, AllowRBSInlineAnnotation, AllowCopDirectives, AllowedPatterns, SplitStrings.
+# URISchemes: http, https
+Layout/LineLength:
+  Max: 142

data/README.md CHANGED Viewed

@@ -300,11 +300,11 @@ Here is how to import from the `Formatters` module:
 require 'youtube_rb/transcript'
 # Some provided formatter classes, each outputs a different string format.
-YoutubeRb::Transcript::Formatters::JSONFormatter
-YoutubeRb::Transcript::Formatters::TextFormatter
-YoutubeRb::Transcript::Formatters::PrettyPrintFormatter
-YoutubeRb::Transcript::Formatters::WebVTTFormatter
-YoutubeRb::Transcript::Formatters::SRTFormatter
+YoutubeRb::Formatters::JSONFormatter
+YoutubeRb::Formatters::TextFormatter
+YoutubeRb::Formatters::PrettyPrintFormatter
+YoutubeRb::Formatters::WebVTTFormatter
+YoutubeRb::Formatters::SRTFormatter
 ```
 ### Formatter Example
@@ -317,7 +317,7 @@ require 'youtube_rb/transcript'
 api = YoutubeRb::Transcript::YouTubeTranscriptApi.new
 transcript = api.fetch(video_id)
-formatter = YoutubeRb::Transcript::Formatters::JSONFormatter.new
+formatter = YoutubeRb::Formatters::JSONFormatter.new
 # .format_transcript(transcript) turns the transcript into a JSON string.
 json_formatted = formatter.format_transcript(transcript)
@@ -334,7 +334,7 @@ Since `JSONFormatter` leverages `JSON.generate` you can also forward keyword arg
 `.format_transcript(transcript)` such as making your file output prettier:
 ```ruby
-json_formatted = YoutubeRb::Transcript::Formatters::JSONFormatter.new.format_transcript(
+json_formatted = YoutubeRb::Formatters::JSONFormatter.new.format_transcript(
   transcript,
   indent: '  ',
   space: ' '
@@ -348,7 +348,7 @@ You can also use the `FormatterLoader` to dynamically load formatters by name:
 ```ruby
 require 'youtube_rb/transcript'
-loader = YoutubeRb::Transcript::Formatters::FormatterLoader.new
+loader = YoutubeRb::Formatters::FormatterLoader.new
 # Load by type name: "json", "pretty", "text", "webvtt", "srt"
 formatter = loader.load("json")
@@ -364,7 +364,7 @@ You can implement your own formatter class. Just inherit from the `Formatter` ba
 `format_transcript` and `format_transcripts` methods which should ultimately return a string:
 ```ruby
-class MyCustomFormatter < YoutubeRb::Transcript::Formatters::Formatter
+class MyCustomFormatter < YoutubeRb::Formatters::Formatter
   def format_transcript(transcript, **options)
     # Do your custom work in here, but return a string.
     'your processed output data as a string.'

data/lib/youtube-transcript-rb.rb ADDED Viewed

@@ -0,0 +1,4 @@
+# frozen_string_literal: true
+require_relative "youtube_rb/transcript"
+require_relative "youtube_rb/formatters"

data/lib/youtube_rb/formatters.rb ADDED Viewed

@@ -0,0 +1,263 @@
+# frozen_string_literal: true
+require "json"
+module YoutubeRb
+  # Module containing all transcript formatters
+  module Formatters
+    # Base formatter class. All formatters should inherit from this class
+    # and implement their own format_transcript and format_transcripts methods.
+    class Formatter
+      # Format a single transcript
+      #
+      # @param transcript [FetchedTranscript] The transcript to format
+      # @param options [Hash] Additional formatting options
+      # @return [String] The formatted transcript
+      def format_transcript(transcript, **options)
+        raise NotImplementedError, "Subclass must implement #format_transcript"
+      end
+      # Format multiple transcripts
+      #
+      # @param transcripts [Array<FetchedTranscript>] The transcripts to format
+      # @param options [Hash] Additional formatting options
+      # @return [String] The formatted transcripts
+      def format_transcripts(transcripts, **options)
+        raise NotImplementedError, "Subclass must implement #format_transcripts"
+      end
+    end
+    # Formats transcript as pretty-printed Ruby data structures
+    class PrettyPrintFormatter < Formatter
+      # Format a single transcript as pretty-printed output
+      #
+      # @param transcript [FetchedTranscript] The transcript to format
+      # @param options [Hash] Options passed to PP.pp
+      # @return [String] Pretty-printed transcript data
+      def format_transcript(transcript, **options)
+        require "pp"
+        PP.pp(transcript.to_raw_data, +"", options[:width] || 79)
+      end
+      # Format multiple transcripts as pretty-printed output
+      #
+      # @param transcripts [Array<FetchedTranscript>] The transcripts to format
+      # @param options [Hash] Options passed to PP.pp
+      # @return [String] Pretty-printed transcripts data
+      def format_transcripts(transcripts, **options)
+        require "pp"
+        data = transcripts.map(&:to_raw_data)
+        PP.pp(data, +"", options[:width] || 79)
+      end
+    end
+    # Formats transcript as JSON
+    class JSONFormatter < Formatter
+      # Format a single transcript as JSON
+      #
+      # @param transcript [FetchedTranscript] The transcript to format
+      # @param options [Hash] Options passed to JSON.generate (e.g., :indent, :space)
+      # @return [String] JSON representation of the transcript
+      def format_transcript(transcript, **options)
+        JSON.generate(transcript.to_raw_data, options)
+      end
+      # Format multiple transcripts as JSON array
+      #
+      # @param transcripts [Array<FetchedTranscript>] The transcripts to format
+      # @param options [Hash] Options passed to JSON.generate
+      # @return [String] JSON array representation of the transcripts
+      def format_transcripts(transcripts, **options)
+        data = transcripts.map(&:to_raw_data)
+        JSON.generate(data, options)
+      end
+    end
+    # Formats transcript as plain text (text only, no timestamps)
+    class TextFormatter < Formatter
+      # Format a single transcript as plain text
+      #
+      # @param transcript [FetchedTranscript] The transcript to format
+      # @param options [Hash] Unused options
+      # @return [String] Plain text with each line separated by newlines
+      def format_transcript(transcript, **options)
+        transcript.map(&:text).join("\n")
+      end
+      # Format multiple transcripts as plain text
+      #
+      # @param transcripts [Array<FetchedTranscript>] The transcripts to format
+      # @param options [Hash] Unused options
+      # @return [String] Plain text with transcripts separated by triple newlines
+      def format_transcripts(transcripts, **options)
+        transcripts.map { |t| format_transcript(t, **options) }.join("\n\n\n")
+      end
+    end
+    # Base class for timestamp-based formatters (SRT, WebVTT)
+    class TextBasedFormatter < TextFormatter
+      # Format a single transcript with timestamps
+      #
+      # @param transcript [FetchedTranscript] The transcript to format
+      # @param options [Hash] Unused options
+      # @return [String] Formatted transcript with timestamps
+      def format_transcript(transcript, **options)
+        lines = []
+        snippets = transcript.to_a
+        snippets.each_with_index do |snippet, i|
+          end_time = snippet.start + snippet.duration
+          # Use next snippet's start time if it starts before current end time
+          end_time = snippets[i + 1].start if i < snippets.length - 1 && snippets[i + 1].start < end_time
+          time_text = "#{seconds_to_timestamp(snippet.start)} --> #{seconds_to_timestamp(end_time)}"
+          lines << format_transcript_helper(i, time_text, snippet)
+        end
+        format_transcript_header(lines)
+      end
+      protected
+      # Format a timestamp from components
+      #
+      # @param hours [Integer] Hours component
+      # @param mins [Integer] Minutes component
+      # @param secs [Integer] Seconds component
+      # @param ms [Integer] Milliseconds component
+      # @return [String] Formatted timestamp
+      def format_timestamp(hours, mins, secs, ms)
+        raise NotImplementedError, "Subclass must implement #format_timestamp"
+      end
+      # Format the transcript header/wrapper
+      #
+      # @param lines [Array<String>] The formatted lines
+      # @return [String] The complete formatted transcript
+      def format_transcript_header(lines)
+        raise NotImplementedError, "Subclass must implement #format_transcript_header"
+      end
+      # Format a single transcript entry
+      #
+      # @param index [Integer] The entry index (0-based)
+      # @param time_text [String] The formatted time range
+      # @param snippet [TranscriptSnippet] The snippet to format
+      # @return [String] The formatted entry
+      def format_transcript_helper(index, time_text, snippet)
+        raise NotImplementedError, "Subclass must implement #format_transcript_helper"
+      end
+      private
+      # Convert seconds to timestamp string
+      #
+      # @param time [Float] Time in seconds
+      # @return [String] Formatted timestamp
+      def seconds_to_timestamp(time)
+        time = time.to_f
+        hours, remainder = time.divmod(3600)
+        mins, secs_float = remainder.divmod(60)
+        secs = secs_float.to_i
+        ms = ((time - time.to_i) * 1000).round
+        format_timestamp(hours.to_i, mins.to_i, secs, ms)
+      end
+    end
+    # Formats transcript as SRT (SubRip) subtitle format
+    #
+    # @example SRT format
+    #   1
+    #   00:00:00,000 --> 00:00:02,500
+    #   Hello world
+    #
+    #   2
+    #   00:00:02,500 --> 00:00:05,000
+    #   This is a test
+    #
+    class SRTFormatter < TextBasedFormatter
+      protected
+      def format_timestamp(hours, mins, secs, ms)
+        format("%02d:%02d:%02d,%03d", hours, mins, secs, ms)
+      end
+      def format_transcript_header(lines)
+        "#{lines.join("\n\n")}\n"
+      end
+      def format_transcript_helper(index, time_text, snippet)
+        "#{index + 1}\n#{time_text}\n#{snippet.text}"
+      end
+    end
+    # Formats transcript as WebVTT (Web Video Text Tracks) format
+    #
+    # @example WebVTT format
+    #   WEBVTT
+    #
+    #   00:00:00.000 --> 00:00:02.500
+    #   Hello world
+    #
+    #   00:00:02.500 --> 00:00:05.000
+    #   This is a test
+    #
+    class WebVTTFormatter < TextBasedFormatter
+      protected
+      def format_timestamp(hours, mins, secs, ms)
+        format("%02d:%02d:%02d.%03d", hours, mins, secs, ms)
+      end
+      def format_transcript_header(lines)
+        "WEBVTT\n\n#{lines.join("\n\n")}\n"
+      end
+      def format_transcript_helper(index, time_text, snippet)
+        "#{time_text}\n#{snippet.text}"
+      end
+    end
+    # Utility class to load formatters by type name
+    class FormatterLoader
+      # Mapping of format names to formatter classes
+      TYPES = {
+        "json" => JSONFormatter,
+        "pretty" => PrettyPrintFormatter,
+        "text" => TextFormatter,
+        "webvtt" => WebVTTFormatter,
+        "srt" => SRTFormatter
+      }.freeze
+      # Error raised when an unknown formatter type is requested
+      class UnknownFormatterType < StandardError
+        def initialize(formatter_type)
+          super(
+            "The format '#{formatter_type}' is not supported. " \
+            "Choose one of the following formats: #{TYPES.keys.join(', ')}"
+          )
+        end
+      end
+      # Load a formatter by type name
+      #
+      # @param formatter_type [String] The formatter type (json, pretty, text, webvtt, srt)
+      # @return [Formatter] An instance of the requested formatter
+      # @raise [UnknownFormatterType] If the formatter type is not supported
+      #
+      # @example
+      #   loader = FormatterLoader.new
+      #   formatter = loader.load("json")
+      #   output = formatter.format_transcript(transcript)
+      #
+      def load(formatter_type = "pretty")
+        formatter_type = formatter_type.to_s
+        raise UnknownFormatterType, formatter_type unless TYPES.key?(formatter_type)
+        TYPES[formatter_type].new
+      end
+    end
+  end
+end

data/lib/youtube_rb/transcript/api.rb CHANGED Viewed

@@ -113,17 +113,13 @@ module YoutubeRb
         results = {}
         video_ids.each do |video_id|
-          begin
-            transcript = fetch(video_id, languages: languages, preserve_formatting: preserve_formatting)
-            results[video_id] = transcript
-            yield(video_id, transcript) if block_given?
-          rescue CouldNotRetrieveTranscript => e
-            if continue_on_error
-              yield(video_id, e) if block_given?
-            else
-              raise
-            end
-          end
+          transcript = fetch(video_id, languages: languages, preserve_formatting: preserve_formatting)
+          results[video_id] = transcript
+          yield(video_id, transcript) if block_given?
+        rescue CouldNotRetrieveTranscript => e
+          raise unless continue_on_error
+          yield(video_id, e) if block_given?
         end
         results

data/lib/youtube_rb/transcript/errors.rb CHANGED Viewed

@@ -40,7 +40,7 @@ module YoutubeRb
       def github_referral
         "\n\nIf you are sure that the described cause is not responsible for this error " \
           "and that a transcript should be retrievable, please create an issue at " \
-          "https://github.com/jdepoix/youtube-transcript-api/issues. " \
+          "https://github.com/stadia/youtube-transcript-rb/issues. " \
           "Please add which version of youtube_transcript_api you are using " \
           "and provide the information needed to replicate the error. " \
           "Also make sure that there are no open issues which already describe your problem!"
@@ -131,13 +131,13 @@ module YoutubeRb
                       "2. (NOT RECOMMENDED) If you authenticate your requests using cookies, you " \
                       "will be able to continue doing requests for a while. However, YouTube will " \
                       "eventually permanently ban the account that you have used to authenticate " \
-                      "with! So only do this if you don't mind your account being banned!"
+                      "with! So only do this if you don't mind your account being banned!".freeze
     end
     # Raised when YouTube blocks the IP specifically
     class IpBlocked < RequestBlocked
       CAUSE_MESSAGE = "#{RequestBlocked::BASE_CAUSE_MESSAGE}" \
-                      "Ways to work around this are using proxies or rotating residential IPs."
+                      "Ways to work around this are using proxies or rotating residential IPs.".freeze
     end
     # Raised when too many requests are made (HTTP 429)

data/lib/youtube_rb/transcript/transcript.rb CHANGED Viewed

@@ -92,8 +92,8 @@ module YoutubeRb
       # Iterate over each snippet
       # @yield [TranscriptSnippet] each snippet in the transcript
-      def each(&block)
-        @snippets.each(&block)
+      def each(&)
+        @snippets.each(&)
       end
       # Get a snippet by index

data/lib/youtube_rb/transcript/transcript_list.rb CHANGED Viewed

@@ -69,11 +69,11 @@ module YoutubeRb
       #
       # @yield [TranscriptMetadata] each available transcript
       # @return [Enumerator] if no block given
-      def each(&block)
+      def each(&)
         return to_enum(:each) unless block_given?
-        @manually_created_transcripts.each_value(&block)
-        @generated_transcripts.each_value(&block)
+        @manually_created_transcripts.each_value(&)
+        @generated_transcripts.each_value(&)
       end
       # Find a transcript for the given language codes.

data/lib/youtube_rb/transcript/transcript_list_fetcher.rb CHANGED Viewed

@@ -56,10 +56,13 @@ module YoutubeRb
         innertube_data = fetch_innertube_data(video_id, api_key)
         extract_captions_json(innertube_data, video_id)
       rescue RequestBlocked => e
-        retries = @proxy_config.nil? ? 0 : (@proxy_config.respond_to?(:retries_when_blocked) ? @proxy_config.retries_when_blocked : 0)
-        if try_number + 1 < retries
-          return fetch_captions_json(video_id, try_number: try_number + 1)
-        end
+        retries = if @proxy_config.nil?
+                    0
+                  else
+                    (@proxy_config.respond_to?(:retries_when_blocked) ? @proxy_config.retries_when_blocked : 0)
+                  end
+        return fetch_captions_json(video_id, try_number: try_number + 1) if try_number + 1 < retries
         raise e
       end
@@ -72,11 +75,10 @@ module YoutubeRb
       # @raise [YouTubeDataUnparsable] if the key cannot be found
       def extract_innertube_api_key(html, video_id)
         match = html.match(/"INNERTUBE_API_KEY":\s*"([a-zA-Z0-9_-]+)"/)
-        if match && match[1]
-          return match[1]
-        end
+        return match[1] if match && match[1]
         raise IpBlocked, video_id if html.include?('class="g-recaptcha"')
         raise YouTubeDataUnparsable, video_id
       end
@@ -90,9 +92,7 @@ module YoutubeRb
         assert_playability(innertube_data["playabilityStatus"], video_id)
         captions_json = innertube_data.dig("captions", "playerCaptionsTracklistRenderer")
-        if captions_json.nil? || !captions_json.key?("captionTracks")
-          raise TranscriptsDisabled, video_id
-        end
+        raise TranscriptsDisabled, video_id if captions_json.nil? || !captions_json.key?("captionTracks")
         captions_json
       end
@@ -119,9 +119,8 @@ module YoutubeRb
         end
         if status == PlayabilityStatus::ERROR && reason == PlayabilityFailedReason::VIDEO_UNAVAILABLE
-          if video_id.start_with?("http://") || video_id.start_with?("https://")
-            raise InvalidVideoId, video_id
-          end
+          raise InvalidVideoId, video_id if video_id.start_with?("http://") || video_id.start_with?("https://")
           raise VideoUnavailable, video_id
         end
@@ -157,9 +156,7 @@ module YoutubeRb
         if html.include?('action="https://consent.youtube.com/s"')
           create_consent_cookie(html, video_id)
           html = fetch_html(video_id)
-          if html.include?('action="https://consent.youtube.com/s"')
-            raise FailedToCreateConsentCookie, video_id
-          end
+          raise FailedToCreateConsentCookie, video_id if html.include?('action="https://consent.youtube.com/s"')
         end
         html
@@ -195,9 +192,9 @@ module YoutubeRb
         response = @http_client.post(url) do |req|
           req.headers["Content-Type"] = "application/json"
           req.body = JSON.generate({
-            "context" => INNERTUBE_CONTEXT,
-            "videoId" => video_id
-          })
+                                     "context" => INNERTUBE_CONTEXT,
+                                     "videoId" => video_id
+                                   })
         end
         raise_http_errors(response, video_id)

data/lib/youtube_rb/transcript.rb CHANGED Viewed

@@ -1,6 +1,5 @@
 # frozen_string_literal: true
-require_relative "transcript/version"
 require_relative "transcript/settings"
 require_relative "transcript/errors"
 require_relative "transcript/transcript_parser"
@@ -8,7 +7,6 @@ require_relative "transcript/transcript"
 require_relative "transcript/transcript_list"
 require_relative "transcript/transcript_list_fetcher"
 require_relative "transcript/api"
-require_relative "transcript/formatters"
 module YoutubeRb
   module Transcript