Skip to content

Instantly share code, notes, and snippets.

@plexus
Created December 29, 2012 14:32
Show Gist options
  • Save plexus/4407235 to your computer and use it in GitHub Desktop.
Save plexus/4407235 to your computer and use it in GitHub Desktop.
Naive parsing/generating off Mediawiki tables. I use this for automating some Wikipedia edits.
# -*- coding: utf-8 -*-
class WikiTable
attr_accessor :rows, :attributes
class Row
attr_accessor :cells, :attributes
def initialize
@cells = []
end
def <<(c); cells << c ; end
def to_s
"|-#{attributes}\n".tap do |s|
cells.each_with_index do |c,i|
s << (c.header? ? '!' : '|') if i == 0
s << (c.header? ? '!!' : '||') if i > 0
s << c
end
end
end
end
class Cell
attr_accessor :content, :attributes, :header
def initialize( content = nil, attributes = nil, header = false )
@content, @attributes, @header = content, attributes, header
end
def header? ; header ; end
def to_str
attributes ? "#{attributes}|#{content}" : content
end
def self.parse( cell )
if cell =~ /\|/
cell.split('|')
else
[ nil, cell ]
end
end
end
def initialize
@rows = []
end
def to_s
[
"{|#{attributes}",
rows.map(&:to_s),
"|}",
].join("\n")
end
def self.parse( content )
WikiTable.new.tap do |table|
current_row = Row.new
current_cell = nil
content.lines.each do |line|
line = line.strip
case line
when /^\{\|(.*)/
table.attributes = $1
when /^\|\}/
table.rows << current_row
break
when /^\|-(.*)/
table.rows << current_row
current_row = Row.new
current_row.attributes = $1
when /^\|[^\|].*\|\|/
line[1..-1].split('||').each do |cell|
current_cell = Cell.new
current_cell.attributes, current_cell.content = Cell.parse( cell )
current_row << current_cell
end
when /^!(.*)/
current_cell = Cell.new
current_cell.header = true
current_cell.attributes, current_cell.content = Cell.parse( line[1..-1] )
current_row << current_cell
end
end
end
end
end
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment