RubyGems - sunflower - Versions diffs - 0.2 - Mend

sunflower 0.2

Files changed (25) hide show

data/LICENSE +4 -0
data/README +21 -0
data/bin/sunflower-setup +68 -0
data/example-bot.rb +12 -0
data/lib/sunflower/commontasks.rb +251 -0
data/lib/sunflower/core.rb +253 -0
data/lib/sunflower/listmaker.rb +152 -0
data/lib/sunflower.rb +4 -0
data/scripts/ZDBOT.rb +62 -0
data/scripts/aktualizacjapilkarzy.rb +339 -0
data/scripts/author-list.rb +36 -0
data/scripts/changeimage.rb +42 -0
data/scripts/fix-bold-in-headers.rb +53 -0
data/scripts/fix-double-pipes.rb +49 -0
data/scripts/fix-langs.rb +43 -0
data/scripts/fix-multiple-same-refs.rb +102 -0
data/scripts/fix-some-entities.rb +43 -0
data/scripts/fix-unicode-control-chars.rb +51 -0
data/scripts/insight.rb +133 -0
data/scripts/lekkoatl-portal.rb +51 -0
data/scripts/make-id2team-list.rb +32 -0
data/scripts/recat.rb +32 -0
data/scripts/wanted.rb +72 -0
data/use-easy-bot.rb +54 -0
metadata +115 -0

data/lib/sunflower/listmaker.rb ADDED Viewed

@@ -0,0 +1,152 @@
# coding: utf-8
class Sunflower
	# Makes a list of articles. Returns array of titles.
	#
	# +type+ selects the source of the list. It is lower-cased and stripped of
	# everything except the letters a-z before matching, so 'category-r' and
	# 'categoryr' are the same type. The meaning of +parameters+ depends on type:
	#
	#   file                              - path of a text file, one title per line
	#   page, pages                       - the titles themselves
	#   input                             - none; titles are read from standard input
	#   categorieson, linkson,
	#   transclusionson, templateson      - title of the page to inspect
	#   category                          - category title
	#   categoryr, categoryrecursive      - category title; members starting with
	#                                       'Kategoria:' are followed as subcategories
	#   usercontribs, contribs            - user name
	#   whatlinksto, whatlinkshere,
	#   whattranscludes, whatembeds,
	#   image, imageusage                 - target page / file title
	#   search, searchtitles              - query; pass 'allns' as second parameter to
	#                                       search the listed namespaces instead of 0
	#   random                            - number of pages (non-digits are ignored)
	#   external, linksearch              - URL pattern
	#   google                            - query, maximum number of results (capped at 999)
	#   grep, regex, regexp               - pattern, namespace number, redirects flag
	#
	# Returns nil when +type+ is not recognized.
	def make_list type, *parameters
		type=type.downcase.gsub(/[^a-z]/, '')
		first=parameters[0]
		# Types such as 'input' take no parameter at all; do not crash on nil.
		firstE=first.nil? ? '' : CGI.escape(first.to_s)
		# Pulls the 'title' field out of every item of an API result list.
		titles=lambda{|items| (items||[]).map{|v| v['title']}}
		list=nil
		case type
		when 'file'
			# Block form closes the file even if reading fails.
			content=File.open(first){|f| f.read}
			list=content.sub(/\357\273\277/,'').strip.split(/\r?\n/)
		when 'page', 'pages'
			list=parameters
		when 'input'
			puts 'Insert titles of articles to edit:'
			puts 'Press [Enter] without inputting any text to finish.'
			puts 'Press [Ctrl]+[C] to kill bot.'
			list=[]
			loop do
				# $stdin.gets, not Kernel#gets: the latter reads from files named in ARGV.
				input=$stdin.gets
				break if input.nil? # end of input
				input=input.strip
				break if input==''
				list<<input
			end
		when 'categorieson'
			r=self.API('action=query&prop=categories&cllimit=500&titles='+firstE)
			# 'pages' is a hash keyed by page id, so take the first value, not the first pair.
			list=titles.call(r['query']['pages'].values.first['categories'])
		when 'category'
			r=self.API('action=query&list=categorymembers&cmprop=title&cmlimit=5000&cmtitle='+firstE)
			list=titles.call(r['query']['categorymembers'])
		when 'categoryr', 'categoryrecursive'
			list=[] # list of articles
			catsToProcess=[first] # categories still to be processed
			visited={first=>true} # guards against cycles between categories
			until catsToProcess.empty?
				members=make_list('category', catsToProcess.shift)
				members.each do |title|
					next unless title=~/\AKategoria:/
					next if visited[title]
					visited[title]=true
					catsToProcess<<title # queue newly found subcategory
				end
				list.concat members
			end
			list.uniq! # remove dupes
		when 'linkson'
			r=self.API('action=query&prop=links&pllimit=5000&titles='+firstE)
			list=titles.call(r['query']['pages'].values.first['links'])
		when 'transclusionson', 'templateson'
			r=self.API('action=query&prop=templates&tllimit=5000&titles='+firstE)
			list=titles.call(r['query']['pages'].values.first['templates'])
		when 'usercontribs', 'contribs'
			r=self.API('action=query&list=usercontribs&uclimit=5000&ucprop=title&ucuser='+firstE)
			list=titles.call(r['query']['usercontribs'])
		when 'whatlinksto', 'whatlinkshere'
			r=self.API('action=query&list=backlinks&bllimit=5000&bltitle='+firstE)
			list=titles.call(r['query']['backlinks'])
		when 'whattranscludes', 'whatembeds'
			r=self.API('action=query&list=embeddedin&eilimit=5000&eititle='+firstE)
			list=titles.call(r['query']['embeddedin'])
		when 'image', 'imageusage'
			r=self.API('action=query&list=imageusage&iulimit=5000&iutitle='+firstE)
			list=titles.call(r['query']['imageusage'])
		when 'search', 'searchtitles'
			what=(type=='search' ? 'text' : 'title')
			namespaces=(parameters[1]=='allns' ? CGI.escape('0|1|2|3|4|5|6|7|8|9|10|11|12|13|14|15|100|101|102|103') : '0')
			r=self.API("action=query&list=search&srwhat=#{what}&srlimit=5000&srnamespace=#{namespaces}&srsearch=#{firstE}")
			list=titles.call(r['query']['search'])
		when 'random'
			# gsub needs the replacement argument; without it an Enumerator is returned.
			r=self.API('action=query&list=random&rnnamespace=0&rnlimit='+first.to_s.gsub(/\D/, ''))
			list=titles.call(r['query']['random'])
		when 'external', 'linksearch'
			r=self.API('action=query&euprop=title&list=exturlusage&eulimit=5000&euquery='+firstE)
			list=titles.call(r['query']['exturlusage'])
		when 'google'
			limit=[parameters[1].to_i,999].min
			from=0
			list=[]
			wiki=Regexp.escape(@wikiURL.to_s)
			while from<limit
				# Search for the requested phrase (the query used to be hard-coded).
				html=HTTP.get(URI.parse("http://www.google.pl/custom?q=#{firstE}&start=#{from}&sitesearch=#{@wikiURL}"))
				html.scan(/<div class=g><h2 class=r><a href="http:\/\/#{wiki}\/wiki\/([^#<>\[\]\|\{\}]+?)" class=l>/){
					list<<CGI.unescape($1).gsub('_',' ')
				}
				from+=10
			end
		when 'grep', 'regex', 'regexp'
			split=@wikiURL.split('.') # e.g. ['pl', 'wikipedia', 'org']
			ns=(parameters[1] ? parameters[1].to_s.gsub(/\D/,'') : '0')
			redirs=(parameters[2] ? '&redirects=on' : '')
			list=[]
			wiki=Regexp.escape(@wikiURL.to_s)
			html=HTTP.get(URI.parse("http://toolserver.org/~nikola/grep.php?pattern=#{firstE}&lang=#{split[0]}&wiki=#{split[1]}&ns=#{ns}#{redirs}"))
			html.scan(/<tr><td><a href="http:\/\/#{wiki}\/wiki\/([^#<>\[\]\|\{\}]+?)(?:\?redirect=no|)">/){
				list<<CGI.unescape($1).gsub('_',' ')
			}
		end
		return list
	end
end
# Command-line entry point: asks for a list type and its arguments (taken from
# the command line first, then from standard input), builds the list with
# Sunflower#make_list and saves it, sorted, to "list.txt".
if $0==__FILE__
	puts 'What kind of list do you want to create?'
	t=ARGV.shift
	if t
		t=t.strip
		puts t
	else
		# to_s covers end of input, where gets returns nil
		t=$stdin.gets.to_s.strip
	end
	puts ''
	puts 'Supply arguments to pass to listmaker:'
	puts '(press [Enter] without writing anything to finish)'
	arg=ARGV.map{|a| a.strip}
	arg.each{|a| puts a}
	# Read from $stdin explicitly: Kernel#gets would try to open the remaining
	# command-line arguments as files instead of reading the keyboard.
	while (line=$stdin.gets)
		line=line.strip
		break if line==''
		arg<<line
	end
	puts 'Making list, wait patiently...'
	s=Sunflower.new
	s.login
	l=s.make_list(t, *arg)
	# make_list returns nil for a type it does not know
	abort "Unknown list type: #{t}" if l.nil?
	File.open('list.txt','w'){|f| f.write(l.sort.join("\n"))}
	puts 'Done! List saved to "list.txt".'
end

data/lib/sunflower.rb ADDED Viewed

@@ -0,0 +1,4 @@
+# coding: utf-8
+require 'sunflower/core'
+require 'sunflower/commontasks'
+require 'sunflower/listmaker'

data/scripts/ZDBOT.rb ADDED Viewed

@@ -0,0 +1,62 @@
+require 'sunflower-core.rb'
+require 'sunflower-commontasks.rb'
# Archives handled requests from the bot task page: every section whose
# {{/Status|...}} marks it as done, erroneous or old is cut out of the main
# page and appended to the matching archive subpage.
s=Sunflower.new
s.login
$summary='archiwizacja zadań'
mainPage=Page.get('Wikipedia:Zadania dla botów')
tasksDone=[]
tasksError=[]
tasksOld=[]
# Which archive bucket each recognized status goes to.
buckets={
	'wykonane'=>tasksDone,
	'zrobione'=>tasksDone,
	'błąd'=>tasksError,
	'błędne'=>tasksError,
	'stare'=>tasksOld
}
tasks=mainPage.text.gsub(/\n==\s*(.+?)\s*==\s*\{\{\/Status\|([^}]+)\}\}([\s\S]+?)(?=\r?\n==|\s*\Z)/) do
	section=$&
	title, status, text = $1.strip, $2.strip, $3.strip
	bucket=buckets[status]
	if bucket
		bucket<<"== "+title+" ==\n{{/Status|"+status+"}}\n"+text
		'' # archived sections disappear from the main page
	else
		section # unknown status: leave the section where it is
	end
end
puts 'Data loaded. Saving...'
[
	['Wikipedia:Zadania_dla_botów/Archiwum/błędne', tasksError, 'Error - saved.'],
	['Wikipedia:Zadania_dla_botów/Archiwum/wykonane', tasksDone, 'Done - saved.'],
	['Wikipedia:Zadania_dla_botów/Archiwum/stare', tasksOld, 'Old - saved.']
].each do |archiveTitle, archived, message|
	archive=Page.get(archiveTitle)
	unless archived.empty?
		archive.append archived.join("\n\n")
		archive.save
	end
	puts message
end
mainPage.text=tasks
mainPage.save
puts 'Main - saved.'
# File.open('ZDBOT_main.txt','w').write(tasks)
# File.open('ZDBOT_done.txt','w').write(tasksDone.join("\n\n")) unless tasksDone.empty?
# File.open('ZDBOT_error.txt','w').write(tasksError.join("\n\n")) unless tasksError.empty?
# File.open('ZDBOT_old.txt','w').write(tasksOld.join("\n\n")) unless tasksOld.empty?
puts "Stats: done: #{tasksDone.length}; error: #{tasksError.length}; old: #{tasksOld.length}"
gets

data/scripts/aktualizacjapilkarzy.rb ADDED Viewed

@@ -0,0 +1,339 @@
+require 'orderedhash'
+require 'hpricot'
+require 'net/http'
+require 'sunflower-core.rb'
+require 'sunflower-listmaker.rb'
+include Net
# Transcript of the run; unbuffered so it is complete even if the script dies.
$datafile=File.open('aktual.txt','w')
$datafile.sync=true
# Optional lookup table loaded from 'id2team.txt': fields are separated by
# tabs or newlines and taken in pairs as key, value. Any problem reading or
# parsing the file is ignored and the table simply stays empty.
id2team={}
begin
	fields=File.open('id2team.txt'){|f| f.read}.strip.split(/\r?\n|\t/)
	id2team.replace Hash[*fields]
rescue
end
# comes from http://rubyforge.org/frs/?group_id=6257&release_id=36721
module Levenshtein
  VERSION	= "0.2.0"

  # Levenshtein distance scaled to 0.0..1.0 by dividing it by the length of
  # the longer sequence. Two empty sequences give 0.0. With a +threshold+
  # (a fraction of the longer length) the result is nil as soon as the
  # distance is known to reach the corresponding absolute limit.
  def self.normalized_distance(s1, s2, threshold=nil)
    short, long	= s1.length > s2.length ? [s2, s1] : [s1, s2]
    return 0.0	if long.length == 0	# the shorter one is then empty as well
    return distance(short, long).to_f/long.length	unless threshold
    d	= distance(short, long, (threshold*long.length+1).to_i)
    d ? d.to_f/long.length : nil
  end

  # Levenshtein distance between two sequences (strings, arrays, or anything
  # that responds to :length and :[] with elements comparable by :==).
  #
  # With a +threshold+, nil is returned when the distance cannot be below it;
  # cheap checks (length difference, elements present in only one sequence)
  # are tried before the full computation.
  def self.distance(s1, s2, threshold=nil)
    short, long	= s1.length > s2.length ? [s2, s1] : [s1, s2]
    # Trivial cases first.
    return 0	if short == long
    return long.length	if short.length == 0
    if threshold
      return nil	if (long.length-short.length) >= threshold
      # Element lists for the set-difference estimate; character scanning
      # takes precedence when both sides support it.
      if short.respond_to?(:scan) and long.respond_to?(:scan)
        a1, a2	= short.scan(/./), long.scan(/./)
      elsif short.respond_to?(:-) and long.respond_to?(:-)
        a1, a2	= short, long
      else
        a1, a2	= nil, nil
      end
      if a1 and a2
        return nil	if (a1-a2).length >= threshold
        return nil	if (a2-a1).length >= threshold
      end
    end
    distance_fast_or_slow(short, long, threshold)
  end

  # Uses levenshtein_distance_fast when this module responds to it (it is
  # not defined here) and the pure Ruby implementation otherwise.
  def self.distance_fast_or_slow(s1, s2, threshold)	# :nodoc:
    return levenshtein_distance_fast(s1, s2, threshold)	if respond_to?(:levenshtein_distance_fast)
    levenshtein_distance_slow(s1, s2, threshold)
  end

  # Row-by-row dynamic programming; keeps only the previous and current row.
  def self.levenshtein_distance_slow(s1, s2, threshold)	# :nodoc:
    previous	= (0..s1.length).to_a
    (1..s2.length).each do |y|
      current	= [y]
      (1..s1.length).each do |x|
        substitution	= s1[x-1]==s2[y-1] ? 0 : 1
        current << [previous[x]+1, current[x-1]+1, previous[x-1]+substitution].min
      end
      # The minimum of later rows never drops below the minimum of this
      # one, so the threshold can no longer be beaten once it is reached.
      return nil	if threshold and current.min >= threshold
      previous	= current
    end
    previous[-1]
  end
end
# Replacement for Kernel#puts used by this script: every argument is written
# both to standard output and to the $datafile transcript.
def puts *arg
	arg.each do |str|
		$stdout.puts str
		$datafile.puts str
	end
end
# Currently a no-op that returns nil: the code that dumped the $notfound,
# $same and $diff lists to 'aktualdata.txt' is disabled and kept below for
# reference only.
def saveData
	# File.open('aktualdata.txt','w'){|f|
	# 	f.write "
	# $notfound=#{$notfound.length}
	# $same=#{$same.length}
	# $diff=#{$diff.length}
	# ----
	# $notfound:
	# # {$notfound.join "\n"}
	# ----
	# $same:
	# # {$same.join "\n"}
	# ----
	# $diff:
	# # {$diff.join "\n"}
	# "
	# }
end
# Fetches +url+ through HTTP.get and returns whatever that call returns.
def get(url)
	address=URI.parse(url)
	HTTP.get(address)
end
# Downloads a player page from +url+ and extracts the career table that sits
# between the "All time playing career" heading and the "games" anchor.
#
# Returns a hash mapping team name => [matches, goals, team id], where matches
# is the sum of all numbers in the appearances cell (e.g. "12 (3)" gives 15)
# and team id is the trailing number of the team link. Returns an empty hash
# when the page does not contain the expected markers.
def getPlayerData url
	html=get url
	# Without both markers there is no table to parse.
	return {} unless html =~ /<b>All time playing career<\/b>/
	rest=$'
	return {} unless rest =~ /<a name=games><\/a>/
	table=$`.strip
	rows=Hpricot.parse(table).search 'tr+tr'
	data={}
	rows.each do |row|
		firstCell=row.at('td')
		# Skip rows without cells, spanning rows and the "no data" notice.
		next if firstCell.nil? || firstCell['colspan']
		next if row.inner_html =~ /No appearance data available/
		cells=row.search 'td'
		link=cells[0].search('font a')[0]
		next if link.nil? || cells[5].nil?
		team=link.inner_html.strip
		teamid=link['href'].sub(/\A.+?(\d+)\Z/, '\1')
		# "starts (substitute)" - add up however many parts are present, so a
		# cell without the parenthesized part no longer raises.
		matches=cells[4].at('font').inner_html.split('(').map{|m| m.gsub(/[^0-9]/,'').to_i}.inject(0){|sum, m| sum+m}
		goals=cells[5].at('font').inner_html.gsub(/[^0-9]/,'').to_i
		data[team]=[matches,goals,teamid]
	end
	return data
end
# Runs a soccerbase player search for +text+ and returns the URL the result
# page redirects to via JavaScript, or nil when there is no such redirect.
def searchForPlayer text
	query=CGI.escape(text)
	response=get("http://www.soccerbase.com/search.sd?search_string=#{query}&search_cat=players")
	(response =~ /window.location = "(http:[^"]+)"/) ? $1 : nil
end
# Script state: number of pages saved so far and the edit summary to use.
$edits=0
$summary='aktualizacja danych o meczach piłkarza'
puts 'Making list...'
# One session per wiki.
s=Sunflower.new('pl.wikipedia.org')
s.login
enw=Sunflower.new('en.wikipedia.org')
enw.login
# Earlier ways of building the list, kept for reference:
# list=(
	# s.makeList('category-r', 'Kategoria:Piłkarze Aston Villa F.C.')+
	# s.makeList('category-r', 'Kategoria:Piłkarze Chelsea F.C.')+
	# s.makeList('category-r', 'Kategoria:Piłkarze Liverpool F.C.')
# ).uniq
# list=(
	# s.makeList('category-r', 'Kategoria:Piłkarze angielskich klubów')+
	# s.makeList('category-r', 'Kategoria:Piłkarze walijskich klubów')
# ).uniq
# list.delete_if{|i| i=~/^Kategoria:/}
# File.open('lista-pilkarze.txt','w').write list.join("\n")
# list=File.open('lista-pilkarze.txt').read.split(/\r?\n/)
# The list currently holds a single user sandbox page.
list=['Wikipedysta:Matma Rex/brudnopis']
puts 'Done!'
puts ''
# Result buckets filled by the main loop.
$notfound, $same, $diff = [], [], []
# Main loop. For every article: find the player's soccerbase page (id from
# plwiki, then enwiki, then the site search), download the per-club figures,
# match each soccerbase club to a club listed in the infobox and write the
# updated figures back. Stops once more than 4 pages have been saved.
list.each_with_index do |art, i|
	exit if $edits>4
	# Matches either a {{soccerbase}} template or a direct player link.
	soccerbaseRe=/\{\{soccerbase.*?(\d+).*?\}\}|soccerbase\.com\/players_details\.sd\?playerid=(\d+)/i
	# finding data
	puts "* [[#{art}]]"
	pPl=Page.new(art, 'pl')
	pPl.read =~ /\[\[en:([^\]]+)\]\]/
	if $1
		artEn=$1
		puts "** Interwiki-en: [[:en:#{artEn}]]"
	else
		artEn=art
		puts "** No interwiki; guessing [[:en:#{art}]]"
	end
	url=nil
	data=nil
	pPl.read =~ soccerbaseRe
	if $1||$2
		soccid=$1||$2
		url="http://www.soccerbase.com/players_details.sd?playerid=#{soccid}"
		puts '** Found id on plwiki'
	else
		# Look the player up under the English title found (or guessed) above.
		pEn=Page.new(artEn, 'en')
		pEn.read =~ soccerbaseRe
		if $1||$2
			soccid=$1||$2
			url="http://www.soccerbase.com/players_details.sd?playerid=#{soccid}"
			puts '** Found id on enwiki'
		else
			url=searchForPlayer(art)||searchForPlayer(artEn)
		end
	end
	if url==nil
		puts '** Not found.'
		$notfound<<art
	else
		data=getPlayerData url
		puts "** URL: #{url}"
		unless data.empty?
			puts "** Found info on soccerbase."
		else
			puts '** Found, but no data.'
			$notfound<<art
		end
	end
	pPl.read =~ /występy\(gole\)\s*=(.+)/
	if $1==nil
		puts '** Wiki: error. No infobox?'
	else
		a=$1.split(/\s*<br.*?>\s*/)[-1].to_s.strip
		a=~/(\d+)\s*\((\d+)\)/
		matchesW, goalsW = $1.to_i, $2.to_i
		puts "** Wiki info:  #{matchesW} matches, #{goalsW} goals."
	end
	saveData if i%30==0 && i!=0
	# $change=File.open('changelist.txt','w')
	# $change.sync=true
	# editing
	# Nothing to write without soccerbase figures.
	next if data.nil? || data.empty?
	#$change.puts "* [[#{art}]] - #{matchesW}/#{goalsW} -> #{matches}/#{goals}"
	kluby=pPl.text[/(kluby\s*=\s*)([^\|]+)(\s*\|)/, 2]
	wystepygole=pPl.text[/(występy\(gole\)\s*=\s*)([^\|]+)(\s*\|)/, 2]
	if kluby.nil? || wystepygole.nil?
		puts '** Wiki: club or appearance fields not found; skipping.'
		next
	end
	# short club name (links and markers removed) => original infobox text
	resolve={}
	kluby=kluby.split(/<\/?br[^>]*>/).map do |entry|
		short=entry.strip.gsub(/\[\[(?:[^\]\|]+\||)([^\]\|]+)\]\]/,'\1').gsub(/→|\(wyp\.\)/,'').strip
		resolve[short]=entry.strip
		short
	end
	wystepygole=wystepygole.split(/<\/?br[^>]*?>/).map{|entry| entry.strip}
	wystepygole.delete_if{|entry| entry==''}
	kluby.delete_if{|entry| entry==''}
	# Make both lists the same length; missing figures count as "0 (0)".
	wystepygole.pop while wystepygole.length>kluby.length
	wystepygole.push '0 (0)' while wystepygole.length<kluby.length
	wikidata=OrderedHash.new
	kluby.each_index do |k|
		wystepygole[k] =~ /(\d+)\s*\((\d+)\)/
		wikidata[kluby[k]]=[$1.to_i, $2.to_i]
	end
	# puts data.inspect
	# puts wikidata.inspect
	data.each_pair do |scbclub, scb|
		# scb is [matches, goals, team id]; the id may have a known team name.
		teamname=id2team[scb[2]]
		names=[scbclub]
		names<<teamname if teamname
		min=[999, nil]
		wikidata.each_pair do |wikiclub, wiki|
			# One name containing the other is treated as a certain match.
			if names.any?{|name| wikiclub.index(name) || name.index(wikiclub)}
				min=[0, wikiclub]
				break
			end
			# Otherwise remember the club with the smallest edit distance.
			names.each do |name|
				d=Levenshtein.distance(name, wikiclub)
				min=[d, wikiclub] if d<min[0]
			end
		end
		# No club in the infobox at all: nothing to attach the figures to.
		next if min[1].nil?
		wikidata[min[1]]=scb
	end
	infoboxwystepygole=[]
	infoboxkluby=[]
	wikidata.each do |club, info|
		infoboxkluby<<resolve[club]
		infoboxwystepygole<<"#{info[0]} (#{info[1]})"
	end
	infoboxkluby=infoboxkluby.join('<br />')
	infoboxwystepygole=infoboxwystepygole.join('<br />')
	pPl.text=pPl.text.sub(/(występy\(gole\)\s*=\s*)([^\|]+?)(\s*\|)/){$1+infoboxwystepygole+$3}
	pPl.text=pPl.text.sub(/(kluby\s*=\s*)([^\|]+?)(\s*\|)/){$1+infoboxkluby+$3}
	pPl.text=pPl.text.sub(/(data1\s*=\s*)([^\|]+?)(\s*\|)/, '\1{{subst:CURRENTDAY}} {{subst:CURRENTMONTHNAMEGEN}} {{subst:CURRENTYEAR}}\3')
	$edits+=1
	pPl.save
end

data/scripts/author-list.rb ADDED Viewed

@@ -0,0 +1,36 @@
#!/usr/bin/ruby
# CGI script: shows a form asking for a page title and, when a title is
# given, lists every distinct user found in that page's revision history.
# The header is terminated by an empty line, with CRLF line ends.
print "Content-Type: text/html; charset=utf-8\r\n\r\n"
# Send error output to the browser as well.
$stderr=$stdout
require 'sunflower-core.rb'
s=Sunflower.new('pl.wikipedia.org')
s.log=false
s.login
cgi=CGI.new
puts ''
puts '<p>Get list for: <form action="author-list.rb" method="GET"><input name="title"> <input type="submit" value="Go!"></form></p>'
title=cgi['title']
if title && title!=''
	# The title comes straight from the request - escape it before echoing.
	puts '<p>List of authors of '+CGI.escapeHTML(title)+':</p>'
	users=[]
	query="action=query&prop=revisions&titles=#{CGI.escape(title)}&rvprop=user&rvlimit=5000"
	hash=s.API(query)
	loop do
		# A page without revisions (e.g. a missing page) has no 'revisions' key.
		revisions=hash['query']['pages'].values[0]['revisions']||[]
		revisions.each{|r| users<<r['user']}
		# Keep asking for the next batch for as long as the API offers one.
		break unless hash['query-continue']
		hash=s.API(query+"&rvstartid=#{hash['query-continue']['revisions']['rvstartid']}")
	end
	users=users.compact.uniq
	# User names are arbitrary text as well.
	puts '<ul><li>'+users.map{|u| CGI.escapeHTML(u)}.join('</li><li>')+'</li></ul>'
end

data/scripts/changeimage.rb ADDED Viewed

@@ -0,0 +1,42 @@
+require 'sunflower-commontasks.rb'
+require 'sunflower-listmaker.rb'
# Replaces small inline uses of one image with another on every page that
# uses it, running the common code cleanup on each page as well.
image='Plik:Obiekt zabytkowy znak.svg'
# EDIT WIKI URL BELOW
s=Sunflower.new('pl.wikipedia.org')
print "Logging in to #{s.wikiURL}... "
# EDIT USERNAME AND PASSWORD BELOW
s.login
print "done!\n"
print "Reading articles list... "
# EDIT FILENAME BELOW
list=s.make_list('image', image).sort
print "done!\n\n"
# EDIT SUMMARY BELOW
$summary='podmiana grafiki, [[WP:SK]]'
list.each do |title|
	print "Reading page #{title}... "
	page=Page.get(title)
	print "done.\n"
	print "Modifying... "
	page.codeCleanup
	page.text.gsub!(/\[\[#{Regexp.escape image} *\|(?:left\||)[1-6]\dpx(?:\|left|)(\|[^\]\|]+|)\]\]( *(?:\r?\n|) *|)/) do
		# Thumbnails and right-aligned images are left exactly as they are. The
		# match itself must be returned: a bare `next` yields nil, which gsub!
		# turns into an empty string, deleting the image from the page.
		next $& if $&.index('thumb') || $&.index('right')
		"[[Plik:Obiekt zabytkowy.svg|20px#{$1}]] "
	end
	print "done.\n"
	print "Saving... "
	# Changes in letter case alone are not worth an edit.
	page.save unless page.orig_text.downcase==page.text.downcase
	print "done!\n\n"
end
print 'Finished! Press any key to close.'
gets

data/scripts/fix-bold-in-headers.rb ADDED Viewed

@@ -0,0 +1,53 @@
+require "algorithm/diff"
+require 'sunflower-commontasks.rb'
+require 'sunflower-listmaker.rb'
# Removes bold markup (''') from section headers on every page named in
# 'list2.txt' and saves the pages that actually changed.
# EDIT WIKI URL BELOW
s=Sunflower.new
print "Logging in to #{s.wikiURL}... "
# EDIT USERNAME AND PASSWORD BELOW
s.login
print "done!\n"
print "Reading articles list... "
# EDIT FILENAME BELOW
list=s.make_list('file', 'list2.txt')
print "done!\n\n"
# EDIT SUMMARY BELOW
$summary='usuwanie pogrubień z nagłówków, [[WP:SK]]'
# pl.wiki specific headers in which every ''' is dropped from the header text
plHeaders=[
	/(==+)\s*(Znan.+? (?:osoby|ludzie) (?:nosz|o imien).+?)\s*\1/,
	/(==+)\s*(.+?(?:\[\[imieniny\]\]|imieniny) obchodzi)\s*\1/
]
list.each do |title|
	print "Reading page #{title}... "
	page=Page.get(title)
	print "done.\n"
	print "Modifying... "
	before=page.read
	page.replace(/(==+)\s*'''\s*(.+?)\s*'''\s*\1/, '\1 \2 \1') #simplest fix
	page.replace(/(==+)([^']*)'''([^']*)\1/, '\1\2\3\1') #broken bolds - opened, but not closed, remove them
	plHeaders.each do |header|
		cleaned=page.text.gsub(header) do
			# capture both groups first - the inner gsub would overwrite them
			marker, heading = $1, $2
			"#{marker} #{heading.gsub("'''", '')} #{marker}"
		end
		page.write cleaned
	end
	if before==page.read
		print "No changes.\n\n"
	else
		page.codeCleanup
		# diffs = oldtxt.diff(page.read)
		# puts diffs
		# gets
		print "done.\n"
		print "Saving... "
		page.save
		print "done!\n\n"
	end
end
print 'Finished! Press any key to close.'
gets