From 03a6502403b8bbbfe30fd1e94bd594353df986e4 Mon Sep 17 00:00:00 2001 From: AstRobot Date: Mon, 10 Jul 2006 19:23:46 +0000 Subject: [PATCH] =?UTF-8?q?This=20page=20must=20use=20the=20R=C3=BCb=C3=BF?= =?UTF-8?q?=20Sp=C3=AB=C3=ABd=20M=C3=ABt=C3=A4l=20C=C3=B6d=C3=AFng=20templ?= =?UTF-8?q?ate!!!111?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- Filmnächte-Scraping.mw | 18 ++++-------------- 1 file changed, 4 insertions(+), 14 deletions(-) diff --git a/Filmnächte-Scraping.mw b/Filmnächte-Scraping.mw index e1b10a54..c064de0a 100644 --- a/Filmnächte-Scraping.mw +++ b/Filmnächte-Scraping.mw @@ -1,27 +1,19 @@ Bald sind wieder, ganz hipp, '''Filmnächte am Elbufer'''. Leider ist auf http://filmnaechte-am-elbufer.de/ keine sofort verwertbare Information zu finden. -
require 'htree'
-
 #
 # Saugen
 #
-
 #system("wget -O programm.html 'http://filmnaechte-am-elbufer.de/fn.php?idx=20'")
-
-
 #
 # Parsen
 #
-
 doc = HTree(File.new('programm.html')).to_rexml
 events = []
 spans = {}
 doc.each_element('/html/body//table[@style=\'width: 488px\']/tr/td//span') { |span|
   text = span.text.to_s
   text.gsub!(/\ ./, ' ')
-
   spans[span.attributes['class']] = text if text.size > 0
-
   if span.attributes['class'] == 'progTitle'
     events << spans
     spans = {'progDay'=>spans['progDay'],
@@ -29,25 +21,23 @@ doc.each_element('/html/body//table[@style=\'width: 488px\']/tr/td//span') { |sp
              'progWeek'=>spans['progWeek']}
   end
 }
-
-
 #
 # Ausgabe tabellarisch
 #
-
 column_sizes = Hash.new(0)
 events.each { |event|
   event.each { |column,cell|
     column_sizes[column] = cell.size if cell.size > column_sizes[column]
   }
 }
-
 events.each { |event|
   ptsd = event['progTitleSpecialDay']
   puts %w(progWeek progDay progTime progTitle).collect { |column|
     event[column].ljust(column_sizes[column] + 2)
   }.to_s.strip + (ptsd ? " (#{ptsd.strip})" : "")
 }
- - [[Kategorie:Ruby]] + + + +{{Rübÿ Spëëd Mëtäl Cödïng}}