1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
require 'rubygems'
require 'scrubyt'
require 'icalendar'
require 'date'

# Install a scRUBYt! logger so the library can report what it is doing.
Scrubyt.logger = Scrubyt::Logger.new

# Build the extractor for the film.at "Filmstarts" page. The value returned by
# Scrubyt::Extractor.define is kept in movie_data and serialized further down.
movie_data = Scrubyt::Extractor.define do
  fetch("http://www.film.at/filmstarts.php")

  # Outer pattern: the table addressed by this XPath. The :generalize option
  # presumably makes scRUBYt! match every similar table rather than only the
  # first one -- NOTE(review): confirm against the scRUBYt! docs.
  movie_stuff("/html/body/div/div/table", :generalize => true) do
    # Child patterns, given as XPaths relative to the table above.
    date_name("/tr/td/span/div/a/b[1]")
    description("/tr/td/span/div[2]")
  end

  # Continue onto further result pages through the "weiter" (German: "next")
  # link; :limit => 3 caps the crawl -- NOTE(review): exact counting of the
  # limit (pages vs. link follows) is not visible here.
  next_page("a[weiter]", :limit => 3)
end

# Write the extracted data to standard output as XML.
$stdout.puts(movie_data.to_xml)