diff --git a/Filmnächte-Scraping.mw b/Filmnächte-Scraping.mw index e1b10a54..c064de0a 100644 --- a/Filmnächte-Scraping.mw +++ b/Filmnächte-Scraping.mw @@ -1,27 +1,19 @@ Bald sind wieder, ganz hipp, '''Filmnächte am Elbufer'''. Leider ist auf http://filmnaechte-am-elbufer.de/ keine sofort verwertbare Information zu finden. -
require 'htree'
-
 #
 # Download
 #
-
 #system("wget -O programm.html 'http://filmnaechte-am-elbufer.de/fn.php?idx=20'")
-
-
 #
 # Parse
 #
-
 # Parse the saved page with HTree and convert it via to_rexml so it can be
 # queried with the XPath expression below.
 doc = HTree(File.new('programm.html')).to_rexml
 # events: one hash per programme entry, keyed by the span's class attribute.
 events = []
 # spans: the entry currently being assembled.
 spans = {}
 # Visit every <span> below a cell of the table styled 'width: 488px'.
 doc.each_element('/html/body//table[@style=\'width: 488px\']/tr/td//span') { |span|
   text = span.text.to_s
   # In-place whitespace clean-up of the span text.
   # NOTE(review): the pattern also consumes the character that follows the
   # matched one ('.' matches any character) -- confirm this is intended.
   text.gsub!(/\ ./, ' ')
-
   # Remember the latest non-empty text for this span class.
   spans[span.attributes['class']] = text if text.size > 0
-
   # A 'progTitle' span completes the current entry: store it and start a new
   # hash that carries over the day and week values (the hunk boundary below
   # hides any keys listed in between). Carried-over values are nil when no
   # such span has been seen yet.
   if span.attributes['class'] == 'progTitle'
     events << spans
     spans = {'progDay'=>spans['progDay'],
@@ -29,25 +21,23 @@ doc.each_element('/html/body//table[@style=\'width: 488px\']/tr/td//span') { |sp
              'progWeek'=>spans['progWeek']}
   end
 }
-
-
 #
 # Tabular output
 #
-
 # Width of each column: the length of the longest cell stored under that key
 # across all events. Keys that were never seen report 0 via the hash default.
 column_sizes = Hash.new(0)
 events.each do |event|
   event.each do |column, cell|
     # to_s: the day/week values carried over between events can be nil when
     # no such span has been seen yet, and nil does not respond to size.
     width = cell.to_s.size
     column_sizes[column] = width if width > column_sizes[column]
   end
 end
-
 # Print one aligned line per event: week, day, time and title, each padded
 # to its column width plus two spaces, followed by the optional special-day
 # note in parentheses.
 events.each do |event|
   special_day = event['progTitleSpecialDay']
   cells = %w[progWeek progDay progTime progTitle].map do |column|
     # to_s guards against columns that were never filled for this event.
     event[column].to_s.ljust(column_sizes[column] + 2)
   end
   # Array#join concatenates the cells; Array#to_s would emit the inspect
   # form (brackets and quotes) on Ruby 1.9 and later.
   line = cells.join.strip
   line += " (#{special_day.strip})" if special_day
   puts line
 end
- - [[Kategorie:Ruby]] + + + +{{Rübÿ Spëëd Mëtäl Cödïng}}