#!/usr/bin/env ruby
# encoding: utf-8
# frozen_string_literal: true

# Downloads a single page from the CCCS wiki and stores the children of its
# `.twikiTopic` element in "<page name>.html" (in the current directory),
# preceded by a small `---`-delimited header carrying the title and kind.
#
# Usage: download-wikipage.rb PAGE_NAME
#
# Provenance: scripts/download-wikipage.rb, introduced by commit
# 99b601fa71481a358927f6d5c721c2a0f66f75e9 ("Initial import script",
# Stefan Schlott, Sun, 1 Sep 2013 09:59:49 +0200).

require 'rubygems'
require 'bundler/setup'

require 'nokogiri'
require 'open-uri'

# Tells whether +node+ is a <p> element with no content at all.
#
# @param node [#name, #content] a parsed node, e.g. a Nokogiri::XML::Node
# @return [Boolean] true only when the node is named "p" and its content is
#   the empty string
def empty_p?(node)
  # The name check and the emptiness check must be ONE expression; as two
  # separate statements the name check's result is discarded and every empty
  # node (whatever its tag) would be reported as an empty paragraph.
  node.name == 'p' && node.content.empty?
end

abort('Need one parameter (page name)') if ARGV.empty?

page = ARGV[0]
url = "https://www.cccs.de/wiki/bin/view/Main/#{page}"

# URI.open is the supported open-uri entry point: a bare Kernel#open no longer
# fetches URLs on Ruby 3.0+. The block form closes the response stream once
# the document has been parsed.
doc = URI.open(url) { |io| Nokogiri::HTML(io) }
content = doc.css('.twikiTopic').children

File.open("#{page}.html", 'w') do |file|
  # Header block first, then the extracted markup.
  file.write(<<~HEADER)
    ---
    title: #{page}
    kind: page
    ---
  HEADER
  file.write(content.to_s)
end