RubyGems - sportdb-formats - Versions diffs - 1.0.5 → 1.1.3 - Mend

sportdb-formats 1.0.5 → 1.1.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (53)

checksums.yaml +4 -4
data/Manifest.txt +8 -11
data/Rakefile +1 -1
data/lib/sportdb/formats.rb +19 -0
data/lib/sportdb/formats/country/country_index.rb +2 -2
data/lib/sportdb/formats/event/event_index.rb +141 -0
data/lib/sportdb/formats/event/event_reader.rb +183 -0
data/lib/sportdb/formats/league/league_index.rb +22 -18
data/lib/sportdb/formats/league/league_outline_reader.rb +27 -7
data/lib/sportdb/formats/league/league_reader.rb +7 -1
data/lib/sportdb/formats/match/mapper.rb +63 -63
data/lib/sportdb/formats/match/mapper_teams.rb +1 -1
data/lib/sportdb/formats/match/match_parser.rb +141 -193
data/lib/sportdb/formats/match/match_parser_csv.rb +169 -25
data/lib/sportdb/formats/match/match_status_parser.rb +86 -0
data/lib/sportdb/formats/name_helper.rb +4 -1
data/lib/sportdb/formats/package.rb +57 -9
data/lib/sportdb/formats/parser_helper.rb +11 -2
data/lib/sportdb/formats/score/score_formats.rb +19 -0
data/lib/sportdb/formats/score/score_parser.rb +10 -2
data/lib/sportdb/formats/season_utils.rb +0 -11
data/lib/sportdb/formats/structs/group.rb +5 -12
data/lib/sportdb/formats/structs/match.rb +7 -1
data/lib/sportdb/formats/structs/round.rb +6 -13
data/lib/sportdb/formats/structs/season.rb +114 -45
data/lib/sportdb/formats/structs/standings.rb +30 -9
data/lib/sportdb/formats/structs/team.rb +8 -2
data/lib/sportdb/formats/team/club_index.rb +13 -11
data/lib/sportdb/formats/team/club_index_history.rb +138 -0
data/lib/sportdb/formats/team/club_reader_history.rb +203 -0
data/lib/sportdb/formats/team/club_reader_props.rb +2 -3
data/lib/sportdb/formats/version.rb +2 -2
data/test/helper.rb +48 -81
data/test/test_club_index_history.rb +107 -0
data/test/test_club_reader_history.rb +212 -0
data/test/test_country_reader.rb +2 -2
data/test/test_datafile_package.rb +1 -1
data/test/test_match_status_parser.rb +49 -0
data/test/test_regex.rb +25 -7
data/test/test_scores.rb +2 -0
data/test/test_season.rb +68 -19
metadata +12 -15
data/test/test_conf.rb +0 -65
data/test/test_csv_match_parser.rb +0 -114
data/test/test_csv_match_parser_utils.rb +0 -20
data/test/test_match_auto.rb +0 -72
data/test/test_match_auto_champs.rb +0 -45
data/test/test_match_auto_euro.rb +0 -37
data/test/test_match_auto_worldcup.rb +0 -61
data/test/test_match_champs.rb +0 -27
data/test/test_match_eng.rb +0 -26
data/test/test_match_euro.rb +0 -27
data/test/test_match_worldcup.rb +0 -27

data/lib/sportdb/formats/league/league_index.rb CHANGED

@@ -95,36 +95,40 @@ class LeagueIndex
   end # method add
+  ## helper to always convert (possible) country key to existing country record
+  ##  todo: make private - why? why not?
+  def country( country )
+    if country.is_a?( String ) || country.is_a?( Symbol )
+      ## note:  use own "global" countries index setting for ClubIndex - why? why not?
+      rec = catalog.countries.find( country.to_s )
+      if rec.nil?
+        puts "** !!! ERROR !!! - unknown country >#{country}< - no match found, sorry - add to world/countries.txt in config"
+        exit 1
+      end
+      rec
+    else
+      country  ## (re)use country struct - no need to run lookup again
+    end
+  end
   def match( name )
-    ## todo/check: return empty array if no match!!! and NOT nil (add || []) - why? why not?
+    ## note: returns empty array if no match and NOT nil
     name = normalize( name )
-    @leagues_by_name[ name ]
+    @leagues_by_name[ name ] || []
   end
   def match_by( name:, country: )
     ## note: match must for now always include name
     m = match( name )
-    if m    ## filter by country
+    if country    ## filter by country
       ## note: country assumes / allows the country key or fifa code for now
       ## note: allow passing in of country struct too
-      country_rec = if country.is_a?( Country )
-                       country   ## (re)use country struct - no need to run lookup again
-                    else
-                       ## note:  use own "global" countries index setting for ClubIndex - why? why not?
-                       rec = catalog.countries.find( country )
-                       if rec.nil?
-                         puts "** !!! ERROR !!! - unknown country >#{country}< - no match found, sorry - add to world/countries.txt in config"
-                         exit 1
-                       end
-                       rec
-                    end
+      country_rec = country( country )
       ## note: also skip international leagues & cups (e.g. champions league etc.) for now - why? why not?
       m = m.select { |league| league.country &&
                               league.country.key == country_rec.key }
-      m = nil   if m.empty?     ## note: reset to nil if no more matches
     end
     m
   end
@@ -144,7 +148,7 @@ class LeagueIndex
     m = match( name )
     # pp m
-    if m.nil?
+    if m.empty?
       ## fall through/do nothing
     elsif m.size > 1
       puts "** !!! ERROR - ambigious league name; too many leagues (#{m.size}) found:"

data/lib/sportdb/formats/league/league_outline_reader.rb CHANGED

@@ -121,14 +121,34 @@ class LeagueOutlineReader   ## todo/check - rename to LeaguePageReader / LeagueP
     values
   end
-  def check_stage( name )
-    known_stages = ['regular season',
-                    'championship round',
-                    'relegation round',
-                    'play-offs'
-                   ]
-    if known_stages.include?( name.downcase )
+  # note: normalize names e.g. downcase and remove all non a-z chars (e.g. space, dash, etc.)
+  KNOWN_STAGES = [
+    'Regular Season',
+    'Regular Stage',
+    'Championship Round',
+    'Championship Playoff',  # or Championship play-off
+    'Relegation Round',
+    'Relegation Playoff',
+    'Play-offs',
+    'Playoff Stage',
+    'Grunddurchgang',
+    'Finaldurchgang - Qualifikationsgruppe',
+    'Finaldurchgang - Qualifikation',
+    'Finaldurchgang - Meistergruppe',
+    'Finaldurchgang - Meister',
+    'EL Play-off',
+    'Europa League Play-off',
+    'Europa-League-Play-offs',
+    'Playoffs - Championship',
+    'Playoffs - Relegation',
+    'Finals',
+  ].map {|name| name.downcase.gsub( /[^a-z]/, '' ) }
+  def check_stage( name )
+    # note: normalize names e.g. downcase and remove all non a-z chars (e.g. space, dash, etc.)
+    if KNOWN_STAGES.include?( name.downcase.gsub( /[^a-z]/, '' ) )
        ## everything ok
     else
       puts "** !!! ERROR - no (league) stage match found for >#{name}<, add to (builtin) stages table; sorry"

data/lib/sportdb/formats/league/league_reader.rb CHANGED

@@ -118,12 +118,18 @@ def parse
               alt_names_auto << "#{country.code}"    if league_key == '1'   ## add shortcut for top level 1 (just country key)
             end
             alt_names_auto << "#{country.name} #{league_key}"  if league_key =~ /^[0-9]+$/   ## if all numeric e.g. add Austria 1 etc.
+            ## auto-add with country prepended
+            ##   e.g. England Premier League, Austria Bundesliga etc.
+            ##  todo/check: also add variants with country alt name if present!!!
+            ##  todo/check: exclude cups or such from country + league name auto-add - why? why not?
+            alt_names_auto << "#{country.name} #{league_name}"
           else   ## assume int'l (no country) e.g. champions league, etc.
             ## only auto-add key (e.g. CL, EL, etc.)
             alt_names_auto << league_key.upcase.gsub('.', ' ')   ## note: no country code (prefix/leading) used
           end
-          pp alt_names_auto
+          ## pp alt_names_auto
           ## prepend country key/code if country present
           ##   todo/fix: only auto-prepend country if key/code start with a number (level) or incl. cup

data/lib/sportdb/formats/match/mapper.rb CHANGED

@@ -7,21 +7,21 @@ module SportDb
 ##   see https://github.com/textkit/textutils/blob/master/textutils/lib/textutils/title_mapper2.rb
-class MapperV2      ## todo/check: rename to NameMapper/TitleMapper ? why? why not??
+class MapperV2      ## todo/check: rename to NameMapper ? why? why not??
   include Logging
-  attr_reader :known_titles   ## rename to mapping or mappings or just titles - why? why not?
+  attr_reader :known_names   ## rename to mapping or mappings or just names - why? why not?
   ########
   ##  key:      e.g. augsburg
-  ##  title:    e.g. FC Augsburg
-  ##  length (of title(!!) - not regex pattern):   e.g. 11   -- do not count dots (e.g. U.S.A. => 3 or 6) why? why not?
-  MappingStruct =  Struct.new( :key, :title, :length, :pattern)     ## todo/check: use (rename to) TitleStruct - why? why not??
+  ##  name:     e.g. FC Augsburg
+  ##  length (of name(!!) - not regex pattern):   e.g. 11   -- do not count dots (e.g. U.S.A. => 3 or 6) why? why not?
+  MappingStruct =  Struct.new( :key, :name, :length, :pattern)     ## todo/check: use (rename to) NameStruct - why? why not??
   ######
   ## convenience helper - (auto)build ActiveRecord-like team records/structs
-  Record = Struct.new( :key, :title, :synonyms )
+  Record = Struct.new( :key, :name, :alt_names )
   def build_records( txt_or_lines )
     recs = []
@@ -44,12 +44,12 @@ class MapperV2      ## todo/check: rename to NameMapper/TitleMapper ? why? why n
       values = line.split( '|' )
       values = values.map { |value| value.strip }
-      title    = values[0]
+      name      = values[0]
       ## note: quick hack - auto-generate key, that is, remove all non-ascii chars and downcase
-      key      = title.downcase.gsub( /[^a-z]/, '' )
-      synonyms = values.size > 1 ? values[1..-1].join( '|' ) : nil
+      key       = name.downcase.gsub( /[^a-z]/, '' )
+      alt_names = values.size > 1 ? values[1..-1].join( '|' ) : nil
-      recs << Record.new( key, title, synonyms )
+      recs << Record.new( key, name, alt_names )
     end
     recs
   end
@@ -63,10 +63,10 @@ class MapperV2      ## todo/check: rename to NameMapper/TitleMapper ? why? why n
                                                                   (records_or_mapping.is_a?( Array ) && records_or_mapping[0].is_a?( String ))
     ## build mapping lookup table
-    @known_titles =  if records_or_mapping.is_a?( Hash )  ## assume "custom" mapping hash table (title/name=>record)
-                        build_title_table_for_mapping( records_or_mapping )
+    @known_names =  if records_or_mapping.is_a?( Hash )  ## assume "custom" mapping hash table (name=>record)
+                        build_name_table_for_mapping( records_or_mapping )
                      else  ## assume array of records
-                        build_title_table_for_records( records_or_mapping )
+                        build_name_table_for_records( records_or_mapping )
                      end
     ## build lookup hash by record (e.g. team/club/etc.) key
@@ -85,9 +85,9 @@ class MapperV2      ## todo/check: rename to NameMapper/TitleMapper ? why? why n
-  def map_titles!( line )   ## rename to just map! - why?? why not???
+  def map_names!( line )   ## rename to just map! - why?? why not???
     begin
-      found = map_title_for!( @tag, line, @known_titles )
+      found = map_name_for!( @tag, line, @known_names )
     end while found
   end
@@ -110,27 +110,27 @@ class MapperV2      ## todo/check: rename to NameMapper/TitleMapper ? why? why n
 private
-  def build_title_table_for_mapping( mapping )
-    known_titles = []
+  def build_name_table_for_mapping( mapping )
+    known_names = []
-    mapping.each do |title, rec|
+    mapping.each do |name, rec|
       m = MappingStruct.new
       m.key     = rec.key
-      m.title   = title
-      m.length  = title.length
-      m.pattern = Regexp.escape( title )   ## note: just use "standard" regex escape (e.g. no extras for umlauts,accents,etc.)
+      m.name    = name
+      m.length  = name.length
+      m.pattern = Regexp.escape( name )   ## note: just use "standard" regex escape (e.g. no extras for umlauts,accents,etc.)
-      known_titles << m
+      known_names << m
     end
     ## note: sort here by length (largest goes first - best match)
-    known_titles = known_titles.sort { |l,r| r.length <=> l.length }
-    known_titles
+    known_names = known_names.sort { |l,r| r.length <=> l.length }
+    known_names
   end
-  def build_title_table_for_records( records )
+  def build_name_table_for_records( records )
-    ## build known tracks table w/ synonyms e.g.
+    ## build known tracks table w/ alt names e.g.
     #
     # [[ 'wolfsbrug', 'VfL Wolfsburg'],
     #  [ 'augsburg',  'FC Augsburg'],
@@ -138,65 +138,65 @@ private
     #  [ 'augsburg',  'Augi3' ],
     #  [ 'stuttgart', 'VfB Stuttgart']]
-    known_titles = []
+    known_names = []
     records.each_with_index do |rec,index|
-      title_candidates = []
-      title_candidates << rec.title
+      name_candidates = []
+      name_candidates << rec.name
-      title_candidates += rec.synonyms.split('|') if rec.synonyms && !rec.synonyms.empty?
+      name_candidates += rec.alt_names.split('|') if rec.alt_names && !rec.alt_names.empty?
-      ## check if title includes subtitle e.g. Grand Prix Japan (Suzuka Circuit)
-      #  make subtitle optional by adding title w/o subtitle e.g. Grand Prix Japan
+      ## check if name includes subname e.g. Grand Prix Japan (Suzuka Circuit)
+      #  make subname optional by adding name w/o subname e.g. Grand Prix Japan
-      titles = []
-      title_candidates.each do |t|
-        titles << t
+      names = []
+      name_candidates.each do |t|
+        names << t
         if t =~ /\(.+\)/
-          extra_title = t.gsub( /\(.+\)/, '' ) # remove/delete subtitles
+          extra_name = t.gsub( /\(.+\)/, '' ) # remove/delete subnames
           # note: strip leading n trailing withspaces too!
           #  -- todo: add squish or something if () is inline e.g. leaves two spaces?
-          extra_title.strip!
-          titles << extra_title
+          extra_name.strip!
+          names << extra_name
         end
       end
-      titles.each do |t|
+      names.each do |name|
         m = MappingStruct.new
         m.key     = rec.key
-        m.title   = t
-        m.length  = t.length
+        m.name    = name
+        m.length  = name.length
         ## note: escape for regex plus allow subs for special chars/accents
-        m.pattern = title_esc_regex( t )
+        m.pattern = name_esc_regex( name )
-        known_titles << m
+        known_names << m
       end
-      logger.debug "  #{rec.class.name}[#{index+1}] #{rec.key} >#{titles.join('|')}<"
+      logger.debug "  #{rec.class.name}[#{index+1}] #{rec.key} >#{names.join('|')}<"
       ## note: only include code field - if defined
       if rec.respond_to?(:code) && rec.code && !rec.code.empty?
         m = MappingStruct.new
         m.key     = rec.key
-        m.title   = rec.code
+        m.name    = rec.code
         m.length  = rec.code.length
         m.pattern = rec.code   ## note: use code for now as is (no variants allowed fow now)
-        known_titles << m
+        known_names << m
       end
     end
     ## note: sort here by length (largest goes first - best match)
       #  exclude code and key (key should always go last)
-    known_titles = known_titles.sort { |l,r| r.length <=> l.length }
-    known_titles
+    known_names = known_names.sort { |l,r| r.length <=> l.length }
+    known_names
   end
-  def map_title_for!( tag, line, mappings )
+  def map_name_for!( tag, line, mappings )
     mappings.each do |mapping|
       key     = mapping.key
       pattern = mapping.pattern
@@ -234,9 +234,9 @@ private
 ####
-# title helper cut-n-paste copy from TextUtils
+# name helper cut-n-paste copy from TextUtils
 ##  see https://github.com/textkit/textutils/blob/master/textutils/lib/textutils/helper/title_helper.rb
-def title_esc_regex( title_unescaped )
+def name_esc_regex( name_unescaped )
       ##  escape regex special chars e.g.
       #    . to \. and
@@ -257,16 +257,16 @@ def title_esc_regex( title_unescaped )
       # e.g. Club Atlético Colón (Santa Fe)
       # e.g. Bauer Anton (????)
-      ## NB: cannot use Regexp.escape! will escape space '' to '\ '
-      ## title = Regexp.escape( title_unescaped )
-      title = title_unescaped.gsub( '.', '\.' )
-      title = title.gsub( '(', '\(' )
-      title = title.gsub( ')', '\)' )
-      title = title.gsub( '?', '\?' )
-      title = title.gsub( '*', '\*' )
-      title = title.gsub( '+', '\+' )
-      title = title.gsub( '$', '\$' )
-      title = title.gsub( '^', '\^' )
+      ## note: cannot use Regexp.escape! will escape space '' to '\ '
+      ## name = Regexp.escape( name_unescaped )
+      name = name_unescaped.gsub( '.', '\.' )
+      name = name.gsub( '(', '\(' )
+      name = name.gsub( ')', '\)' )
+      name = name.gsub( '?', '\?' )
+      name = name.gsub( '*', '\*' )
+      name = name.gsub( '+', '\+' )
+      name = name.gsub( '$', '\$' )
+      name = name.gsub( '^', '\^' )
       ##  match accented char with or without accents
       ##  add (ü|ue) etc.
@@ -309,10 +309,10 @@ def title_esc_regex( title_unescaped )
       ##   collect some more (real-world) examples first!!!!!
       alternatives.each do |alt|
-        title = title.gsub( alt[0], alt[1] )
+        name = name.gsub( alt[0], alt[1] )
       end
-      title
+      name
   end
 end # class MapperV2

data/lib/sportdb/formats/match/mapper_teams.rb CHANGED

@@ -16,7 +16,7 @@ class TeamMapper
   end
   def map_teams!( line )
-    @mapper.map_titles!( line )
+    @mapper.map_names!( line )
   end
 end # class TeamMapper

data/lib/sportdb/formats/match/match_parser.rb CHANGED

@@ -82,15 +82,14 @@ class MatchParser   ## simple match parser for team match schedules
     #    team1 team2 - match  (will get new auto-matchday! not last round)
     @last_round     = nil
-    title, pos = find_group_title_and_pos!( line )
+    name = find_group_name!( line )
-    logger.debug "    title: >#{title}<"
-    logger.debug "    pos: >#{pos}<"
+    logger.debug "    name: >#{name}<"
     logger.debug "  line: >#{line}<"
-    group = @groups[ title ]
+    group = @groups[ name ]
     if group.nil?
-      puts "!! ERROR - no group def found for >#{title}<"
+      puts "!! ERROR - no group def found for >#{name}<"
       exit 1
     end
@@ -104,19 +103,19 @@ class MatchParser   ## simple match parser for team match schedules
     @mapper_teams.map_teams!( line )
     teams = @mapper_teams.find_teams!( line )
-    title, pos = find_group_title_and_pos!( line )
+    name = find_group_name!( line )
     logger.debug "  line: >#{line}<"
-    group = Import::Group.new( pos: pos,
-                               title: title,
-                               teams: teams.map {|team| team.title } )
+    ## todo/check/fix: add back group key - why? why not?
+    group = Import::Group.new( name:  name,
+                               teams: teams.map {|team| team.name } )
-    @groups[ title ] = group
+    @groups[ name ] = group
   end
-  def find_group_title_and_pos!( line )
+  def find_group_name!( line )
     ## group pos - for now support single digit e.g 1,2,3 or letter e.g. A,B,C or HEX
     ## nb:  (?:)  = is for non-capturing group(ing)
@@ -125,37 +124,25 @@ class MatchParser   ## simple match parser for team match schedules
     ## todo:
     ##   check if Group A:  or [Group A]  works e.g. : or ] get matched by \b ???
-    regex = /(?:Group|Gruppe|Grupo)\s+((?:\d{1}|[A-Z]{1,3}))\b/
+    regex = /\b
+              (?:
+                (Group | Gruppe | Grupo)
+                   [ ]+
+                (\d+ | [A-Z]+)
+              )
+            \b/x
     m = regex.match( line )
-    return [nil,nil] if m.nil?
-    pos = case m[1]
-          when 'A' then 1
-          when 'B' then 2
-          when 'C' then 3
-          when 'D' then 4
-          when 'E' then 5
-          when 'F' then 6
-          when 'G' then 7
-          when 'H' then 8
-          when 'I' then 9
-          when 'J' then 10
-          when 'K' then 11
-          when 'L' then 12
-          when 'HEX' then 666    # HEX for Hexagonal - todo/check: map to something else ??
-          else  m[1].to_i
-          end
+    return nil    if m.nil?
-    title = m[0]
+    name = m[0]
-    logger.debug "   title: >#{title}<"
-    logger.debug "   pos: >#{pos}<"
+    logger.debug "   name: >#{name}<"
-    line.sub!( regex, '[GROUP.TITLE+POS]' )
+    line.sub!( name, '[GROUP.NAME]' )
-    [title,pos]
+    name
   end
@@ -180,198 +167,130 @@ class MatchParser   ## simple match parser for team match schedules
     end_date   = end_date.to_date
-    pos   = find_round_pos!( line )
-    title = find_round_def_title!( line )
-    # NB: use extracted round title for knockout check
-    knockout_flag = is_knockout_round?( title )
+    name  = find_round_def_name!( line )
+    # NB: use extracted round name for knockout check
+    knockout_flag = is_knockout_round?( name )
     logger.debug "    start_date: #{start_date}"
     logger.debug "    end_date:   #{end_date}"
-    logger.debug "    pos:      #{pos}"
-    logger.debug "    title:    >#{title}<"
+    logger.debug "    name:    >#{name}<"
     logger.debug "    knockout_flag:   #{knockout_flag}"
     logger.debug "  line: >#{line}<"
-    #######################################
-    # todo/fix: add auto flag is false !!!! - why? why not?
-    round = Import::Round.new( pos:        pos,
-                               title:      title,
+    round = Import::Round.new( name:       name,
                                start_date: start_date,
                                end_date:   end_date,
                                knockout:   knockout_flag,
                                auto:       false )
-    @rounds[ title ] = round
+    @rounds[ name ] = round
   end
-  def find_round_pos!( line )
-    # pass #1) extract optional round pos from line
-    # e.g.  (1)   - must start line
-    regex_pos = /^[ \t]*\((\d{1,3})\)[ \t]+/
-    # pass #2) find free standing number  e.g. Matchday 3 or Round 5 or 3. Spieltag etc.
-    # note: /\b(\d{1,3})\b/
-    #   will match -12
-    #  thus, use space required - will NOT match  -2 e.g. Group-2 Play-off
-    #  note:  allow  1. Runde  n
-    #                1^ Giornata
-    regex_num = /(?:^|\s)(\d{1,3})(?:[.\^\s]|$)/
-    if line =~ regex_pos
-      logger.debug "   pos: >#{$1}<"
-      line.sub!( regex_pos, '[ROUND.POS] ' )  ## NB: add back trailing space that got swallowed w/ regex -> [ \t]+
-      return $1.to_i
-    elsif line =~ regex_num
-      ## assume number in title is pos (e.g. Jornada 3, 3 Runde etc.)
-      ## NB: do NOT remove pos from string (will get removed by round title)
-      num = $1.to_i  # note: clone capture; keep a copy (another regex follows; will redefine $1)
-      #### fix:
-      #  use/make keywords required
-      #  e.g. Round of 16  -> should NOT match 16!
-      #    Spiel um Platz 3  (or 5) etc -> should NOT match 3!
-      #  Round 16 - ok
-      #  thus, check for required keywords
-      ## quick hack for round of 16
-      # todo: mask match e.g. Round of xxx ... and try again - might include something
-      #  reuse pattern for Group XX Replays for example
-      if line =~ /^\s*Round of \d{1,3}\b/
-         return nil
-      end
-      logger.debug "   pos: >#{num}<"
-      return num
-    else
-      ## fix: add logger.warn no round pos found in line
-      return nil
-    end
-  end # method find_round_pos!
-  def find_round_def_title!( line )
-    # assume everything before pipe (\) is the round title
-    #  strip [ROUND.POS],  todo:?? [ROUND.TITLE2]
+  def find_round_def_name!( line )
+    # assume everything before pipe (\) is the round name
+    #  strip [ROUND.POS],  todo:?? [ROUND.NAME2]
-    # todo/fix: add title2 w/  // or /  why? why not?
+    # todo/fix: add name2 w/  // or /  why? why not?
     #  -- strip / or / chars
     buf = line.dup
-    logger.debug "  find_round_def_title! line-before: >>#{buf}<<"
+    logger.debug "  find_round_def_name! line-before: >>#{buf}<<"
     ## cut-off everything after (including) pipe (|)
     buf = buf[ 0...buf.index('|') ]
-    # e.g. remove [ROUND.POS], [ROUND.TITLE2], [GROUP.TITLE+POS] etc.
-    buf.gsub!( /\[[^\]]+\]/, '' )    ## fix: use helper for (re)use e.g. remove_match_placeholder/marker or similar?
-    # remove leading and trailing whitespace
     buf.strip!
-    logger.debug "  find_round_def_title! line-after: >>#{buf}<<"
+    logger.debug "  find_round_def_name! line-after: >>#{buf}<<"
-    logger.debug "   title: >>#{buf}<<"
-    line.sub!( buf, '[ROUND.TITLE]' )
+    logger.debug "   name: >>#{buf}<<"
+    line.sub!( buf, '[ROUND.NAME]' )
     buf
   end
-  def find_round_header_title!( line )
-    # assume everything left is the round title
-    #  extract all other items first (round title2, round pos, group title n pos, etc.)
-    ## todo/fix:
-    ##  cleanup method
-    ##   use  buf.index( '//' ) to split string (see found_round_def)
-    ##     why? simpler why not?
-    ##  - do we currently allow groups if title2 present? add example if it works?
+    ##  split by or || or |||
+    ##           or ++ or +++
+    ##           or -- or ---
+    ##           or // or ///
+    ##  note: allow Final | First Leg  as ONE name same as
+    ##              Final - First Leg or
+    ##              Final, First Leg
+    ##   for cut-off always MUST be more than two chars
+    ##
+    ##  todo/check: find a better name than HEADER_SEP(ARATOR) - why? why not?
+    ##   todo/fix: move to parser utils and add a method split_name or such?
+    HEADER_SEP_RE = /  [ ]*      ## allow (strip) leading spaces
+                      (?:\|{2,} |
+                          \+{2,} |
+                           -{2,} |
+                          \/{2,}
+                      )
+                      [ ]*       ## allow (strip) trailing spaces
+                  /x
+  def find_round_header_name!( line )
+    # assume everything left is the round name
+    #  extract all other items first (round name2, round pos, group name n pos, etc.)
     buf = line.dup
-    logger.debug "  find_round_header_title! line-before: >>#{buf}<<"
+    logger.debug "  find_round_header_name! line-before: >>#{buf}<<"
+    parts = buf.split( HEADER_SEP_RE )
+    buf = parts[0]
-    buf.gsub!( /\[[^\]]+\]/, '' )   # e.g. remove [ROUND.POS], [ROUND.TITLE2], [GROUP.TITLE+POS] etc.
     buf.strip!    # remove leading and trailing whitespace
-    logger.debug "  find_round_title! line-after: >>#{buf}<<"
+    logger.debug "  find_round_name! line-after: >>#{buf}<<"
-    ### bingo - assume what's left is the round title
+    ### bingo - assume what's left is the round name
-    logger.debug "   title: >>#{buf}<<"
-    line.sub!( buf, '[ROUND.TITLE]' )
+    logger.debug "   name: >>#{buf}<<"
+    line.sub!( buf, '[ROUND.NAME]' )
     buf
   end
+    ## quick hack- collect all "fillwords" by language!!!!
+    ##    change later  and add to sportdb-langs!!!!
+    ##
+    ##    strip all "fillwords" e.g.:
+    ##      Nachtrag/Postponed/Addition/Supplemento names
+    ##
+    ##  todo/change: find a better name for ROUND_EXTRA_WORDS - why? why not?
+    ROUND_EXTRA_WORDS_RE = /\b(?:
+                               Nachtrag |     ## de
+                               Postponed |    ## en
+                               Addition  |    ## en
+                               Supplemento    ## es
+                              )
+                             \b/ix
   def parse_round_header( line )
     logger.debug "parsing round header line: >#{line}<"
-    ## todo/check/fix:
-    #   make sure  Round of 16  will not return pos 16 -- how? possible?
-    #   add unit test too to verify
-    pos = find_round_pos!( line )
-    title = find_round_header_title!( line )
+    name = find_round_header_name!( line )
     logger.debug "  line: >#{line}<"
+    name = name.sub( ROUND_EXTRA_WORDS_RE, '' )
+    name = name.strip
-    round = @rounds[ title ]
+    round = @rounds[ name ]
     if round.nil?    ## auto-add / create if missing
-      round = Import::Round.new( pos:   pos,
-                                 title: title )
-      @rounds[ title ] = round
+      ## todo/check: add num (was pos) if present - why? why not?
+      round = Import::Round.new( name: name )
+      @rounds[ name ] = round
     end
     ## todo/check: if pos match (MUST always match for now)
     @last_round = round
     @last_group = nil   # note: reset group to no group - why? why not?
-    ## NB: dummy/placeholder start_at, end_at date
-    ##  replace/patch after adding all games for round
-=begin
-    round_attribs = {
-      title:  title,
-      title2: title2,
-      knockout: knockout_flag
-    }
-    if pos > 999000
-      # no pos (e.g. will get autonumbered later) - try match by title for now
-      #  e.g. lets us use title 'Group Replays', for example, multiple times
-      @round = Round.find_by_event_id_and_title( @event.id, title )
-    else
-      @round = Round.find_by_event_id_and_pos( @event.id, pos )
-    end
-    if @round.present?
-      logger.debug "update round #{@round.id}:"
-    else
-      logger.debug "create round:"
-      @round = Round.new
-      round_attribs = round_attribs.merge( {
-        event_id: @event.id,
-        pos:   pos,
-        start_at: Date.parse('1911-11-11'),
-        end_at:   Date.parse('1911-11-11')
-      })
-    end
-    logger.debug round_attribs.to_json
-    @round.update_attributes!( round_attribs )
-    @patch_round_ids_pos   << @round.id    if pos > 999000
-    ### store list of round ids for patching start_at/end_at at the end
-    @patch_round_ids_dates << @round.id   # todo/fix/check: check if round has definition (do NOT patch if definition (not auto-added) present)
-=end
   end
@@ -383,6 +302,11 @@ class MatchParser   ## simple match parser for team match schedules
     ScoreFormats.find!( line )
   end
+  def find_status!( line )
+    StatusParser.find!( line )
+  end
   def try_parse_game( line )
     # note: clone line; for possible test do NOT modify in place for now
     # note: returns true if parsed, false if no match
@@ -410,6 +334,10 @@ class MatchParser   ## simple match parser for team match schedules
       return false
     end
+    ## find (optional) match status e.g. [abandoned] or [replay] or [awarded]
+    ##                                   or [cancelled] or [postponed] etc.
+    status = find_status!( line )   ## todo/check: allow match status also in geo part (e.g. after @) - why? why not?
     ## pos = find_game_pos!( line )
       date      = find_date!( line, start: @start )
@@ -434,20 +362,23 @@ class MatchParser   ## simple match parser for team match schedules
     if @last_round
       round = @last_round
     else
-      ## find (first) matching round by date
-      @rounds.values.each do |round_rec|
-        ## note: convert date to date only (no time) with to_date!!!
-        if (round_rec.start_date && round_rec.end_date) &&
-           (date.to_date >= round_rec.start_date &&
-            date.to_date <= round_rec.end_date)
-          round = round_rec
-          break
+      ## find (first) matching round by date if rounds / matchdays defined
+      ##   if not rounds / matchdays defined - YES, allow matches WITHOUT rounds!!!
+      if @rounds.size > 0
+        @rounds.values.each do |round_rec|
+          ## note: convert date to date only (no time) with to_date!!!
+          if (round_rec.start_date && round_rec.end_date) &&
+             (date.to_date >= round_rec.start_date &&
+             date.to_date <= round_rec.end_date)
+            round = round_rec
+            break
+          end
+        end
+        if round.nil?
+          puts "!! ERROR - no matching round found for match date:"
+          pp date
+          exit 1
         end
-      end
-      if round.nil?
-        puts "!! ERROR - no matching round found for match date:"
-        pp date
-        exit 1
       end
     end
@@ -457,12 +388,12 @@ class MatchParser   ## simple match parser for team match schedules
     ## todo/check: pass along round and group refs or just string (canonical names) - why? why not?
     @matches << Import::Match.new( date:    date,
-                                   team1:   team1,  ## note: for now always use mapping value e.g. rec (NOT string e.g. team1.title)
-                                   team2:   team2,  ## note: for now always use mapping value e.g. rec (NOT string e.g. team2.title)
+                                   team1:   team1,  ## note: for now always use mapping value e.g. rec (NOT string e.g. team1.name)
+                                   team2:   team2,  ## note: for now always use mapping value e.g. rec (NOT string e.g. team2.name)
                                    score:   score,
-                                   round:   round       ? round.title       : nil,   ## note: for now always use string (assume unique canonical name for event)
-                                   group:   @last_group ? @last_group.title : nil )  ## note: for now always use string (assume unique canonical name for event)
+                                   round:   round       ? round.name       : nil,   ## note: for now always use string (assume unique canonical name for event)
+                                   group:   @last_group ? @last_group.name : nil,   ## note: for now always use string (assume unique canonical name for event)
+                                   status:  status )
     ### todo: cache team lookups in hash?
 =begin
@@ -517,7 +448,7 @@ class MatchParser   ## simple match parser for team match schedules
         round_attribs = {
           event_id: @event.id,
-          title: "Matchday #{date.to_date}",
+          name: "Matchday #{date.to_date}",
           pos: 999001+@patch_round_ids_pos.length,   # e.g. 999<count> - 999001,999002,etc.
           start_at:  date.to_date,
           end_at:    date.to_date
@@ -541,7 +472,7 @@ class MatchParser   ## simple match parser for team match schedules
       end
       ## note: will crash (round.pos) if round is nil
-      logger.debug( "  using round #{round.pos} >#{round.title}< start_at: #{round.start_at}, end_at: #{round.end_at}" )
+      logger.debug( "  using round #{round.pos} >#{round.name}< start_at: #{round.start_at}, end_at: #{round.end_at}" )
     else
       ## use round from last round header
       round = @round
@@ -644,12 +575,29 @@ class MatchParser   ## simple match parser for team match schedules
     if date && team1.nil? && team2.nil?
       logger.debug( "date header line found: >#{line}<")
-      logger.debug( "    date: #{date}")
+      logger.debug( "    date: #{date} with start: #{@start}")
       @last_date = date   # keep a reference for later use
-      return true
+      ###  quick "corona" hack - support seasons going beyond 12 months (see Swiss league 2019/20 and others!!)
+      ##    find a better way??
+      ##  set @start date to full year (e.g. 1.1.) if date.year  is @start.year+1
+      ##   todo/fix: add to linter to check for chronological dates!! - warn if NOT chronological
+      ###  todo/check: just turn on for 2019/20 season or always? why? why not?
+      ## todo/fix: add switch back to old @start_org
+      ##   if year is date.year == @start.year-1    -- possible when full date with year set!!!
+      if @start.month != 1
+         if date.year == @start.year+1
+           logger.debug( "!! hack - extending start date to full (next/end) year; assumes all dates are chronologigal - always moving forward" )
+           @start_org = @start   ## keep a copy of the original (old) start date - why? why not? - not used for now
+           @start = Date.new( @start.year+1, 1, 1 )
+         end
+      end
+      true
     else
-      return false
+      false
     end
   end