Suggest timepoints using OSM database of POIs
--- /dev/null
+++ b/maxious-canberra-transit-feed/01-extracttimes.rb
@@ -1,1 +1,95 @@
+require 'rubygems'
+require 'nokogiri'
+require 'open-uri'
+require 'pp'
+def makeTimetable(table, period, short_name)
+ timetable = {"stop_times" => [], "between_stops" => [], "short_name" => short_name}
+ time_points = table.xpath('tr[1]//th').map do |tp|
+ if tp.content != "\302\240" && tp.content != "" && tp.content != "<br/>"
+ timing_point = tp.content.squeeze(" ").gsub("\r\n Platform"," - Platform").gsub(" - "," - ").gsub("\n","").gsub("\r","").gsub("\\"," / ").strip
+ end
+ end
+ time_points.delete(nil)
+ timetable["time_points"] = time_points
+ timetable["long_name"] = "To " + time_points.last
+ periodtimes = []
+ table.css('tr').each do |row|
+ times = row.css('td').map do |cell|
+ #TODO convert to GTFS time ie. replace " AM" with a
+ time = cell.content.squeeze(" ").strip
+ end
+ if not times.empty?
+ if not (route = times.shift)
+ raise("TODO: account for shifting route numbers eg. intertown/redex 62/162")
+ end
+ periodtimes << times
+ end
+ end
+ if periodtimes.size < 1
+ raise "No times for route " + short_name + " in period " + period
+ end
+ timetable["stop_times"] = { period => periodtimes }
+ # pp timetable
+ filename = timetable["short_name"] + "-" + timetable["long_name"].downcase.gsub(" ","-").gsub("/","") + "." + period + ".yml"
+ puts "Saving " + filename
+ File.open("#{File.dirname(__FILE__)}/output/"+filename, "w") do |f|
+ f.write timetable.to_yaml
+ end
+ timetable
+end
+
+#TODO fix route 934
+Dir.glob("source-html/Route*.htm*") { |file|
+ puts "Opened " + file
+ doc = Nokogiri::HTML(open(file))
+ # Search for nodes by css
+ timetables = []
+ short_name = "";
+ doc.xpath('//title').each do |title|
+ short_name = title.content.gsub("Route_","").gsub("Route ","").squeeze(" ").strip
+ end
+ if short_name == ""
+ raise "Route number(s) not found in <title> tag"
+ end
+
+ doc.xpath('//table[preceding::text()="Weekdays"]').each do |table|
+ timetables << makeTimetable(table, "weekday", short_name)
+ end
+
+ #weekends
+ doc.xpath('//table[preceding::text()="Saturdays" and following::a]').each do |table|
+ timetables << makeTimetable(table, "saturday", short_name)
+ end
+ doc.xpath('//table[preceding::text()="Sundays"]').each do |table|
+ timetables << makeTimetable(table, "sunday", short_name)
+ end
+ #930/934 special cases
+ doc.xpath('//table[preceding::text()="Saturday" and following::h2]').each do |table|
+ timetables << makeTimetable(table, "saturday", short_name)
+ end
+ doc.xpath('//table[preceding::text()="Sunday"]').each do |table|
+ timetables << makeTimetable(table, "sunday", short_name)
+ end
+ #route 81 = Weekdays - School Holidays Only
+ doc.xpath('//table[preceding::text()="Weekdays - School Holidays Only "]').each do |table|
+ timetable = makeTimetable(table, "weekday", short_name)
+ #TODO set active date range to only be holidays
+ timetables << timetable;
+ end
+
+
+ if timetables.size > 2
+ puts "WARNING: " + file + " more than 2 timetables (weekend split?):" + timetables.size.to_s
+ end
+ if timetables.size < 2
+ puts "WARNING: " + file + " less than 2 timetables (weekday loop service?):" + timetables.size.to_s
+ elsif not (timetables[0]["time_points"] - timetables[1]["time_points"].reverse).empty?
+ puts "WARNING: first pair of timetable timing points are not complementary for "+ file
+ pp(timetables[0]["time_points"] - timetables[1]["time_points"].reverse)
+ end
+ if timetables.size < 1
+ raise "No timetables extracted from " + file
+ end
+}
+
--- /dev/null
+++ b/maxious-canberra-transit-feed/02-tidytimepoints.rb
@@ -1,1 +1,82 @@
+require 'rubygems'
+require 'pp'
+require 'yaml'
+Dir.chdir("output")
+def getTimePoints()
+ $time_points = []
+ $time_points_sources = Hash.new([])
+ Dir.glob("*.yml") { |file|
+ timetable = YAML::load_file(file)
+ $time_points = $time_points | timetable["time_points"]
+ timetable["time_points"].each do |timepoint|
+ $time_points_sources[timepoint] = $time_points_sources[timepoint] | [ file ]
+ end
+ }
+end
+
+getTimePoints()
+pp $time_points.sort!
+#pp $time_points_sources.sort
+
+time_point_corrections = {"North Lynehamham" => "North Lyneham",
+ "Lathlain St Platform 2" => "Lathlain St Bus Station - Platform 2",
+ "Lathlain St Sation - Platform 5" => "Lathlain St Bus Station - Platform 5",
+ "Lathlain Steet Station" => "Lathlain St Bus Station",
+ "Lathlain St - Platform 3" => "Lathlain St Bus Station - Platform 3",
+ "Lathlain Steet Station - Platform 3" => "Lathlain St Bus Station - Platform 3",
+ "Lathlain St Station" => "Lathlain St Bus Station",
+ "Lathlain St Station - Platform 1" => "Lathlain St Bus Station - Platform 1",
+ "Lathlain St Station - Platform 2" => "Lathlain St Bus Station - Platform 2",
+ "Lathlain St Station - Platform 3" => "Lathlain St Bus Station - Platform 3",
+ "Lathlain St Station - Platform 4" => "Lathlain St Bus Station - Platform 4",
+ "Lathlain St Station - Platform 5" => "Lathlain St Bus Station - Platform 5",
+ "Lathlain St Station - Platform 6" => "Lathlain St Bus Station - Platform 6",
+ "Manuka Captain Cook" => "Manuka, Captain Cook",
+ "Flemington Rd, Sandford St" => "Flemington Rd/Sandford St",
+ "Erindale Centre / - Sternberg Crescent" => "Erindale Drive/Sternberg",
+ "Canberra Hospita" => "Canberra Hospital",
+ "Cohen Str Station - Platform 1" => "Cohen St Bus Station - Platform 1",
+ "Cohen Street Station" => "Cohen St Bus Station",
+ "Cohen Street Station - Platform 2" => "Cohen St Bus Station - Platform 2",
+ "Cohn St Station - Platform 3" => "Cohen St Bus Station - Platform 3",
+ "Cohen St Station" => "Cohen St Bus Station",
+ "Cohen St Station - Platform 1" => "Cohen St Bus Station - Platform 1",
+ "Cohen St Station - Platform 2" => "Cohen St Bus Station - Platform 2",
+ "Cohen St Station - Platform 3" => "Cohen St Bus Station - Platform 3",
+ "Cohen St Station - Platform 4" => "Cohen St Bus Station - Platform 4",
+ "Cohen St Station - Platform 5" => "Cohen St Bus Station - Platform 5",
+ "Cohen St Station - Platform 6" => "Cohen St Bus Station - Platform 6",
+ "City - Platform 7" => "City Interchange - Platform 7",
+ "Cameron Avenue Station" => "Cameron Ave Bus Station",
+ "Cameron Avenue Station - Platform 1" => "Cameron Ave Bus Station - Platform 1",
+ "Cameron Avenue Station - Platform 2" => "Cameron Ave Bus Station - Platform 2",
+ "Cameron Avenue Station - Platform 3" => "Cameron Ave Bus Station - Platform 3",
+ "Cameron Avenue Station - Platform 4" => "Cameron Ave Bus Station - Platform 4",
+ "Cameron Avenue Station - Platform 5" => "Cameron Ave Bus Station - Platform 5",
+ "Cameron Ave Station" => "Cameron Ave Bus Station",
+ "Cameron Ave Station - Platform 1" => "Cameron Ave Bus Station - Platform 1",
+ "Cameron Ave Station - Platform 2" => "Cameron Ave Bus Station - Platform 2",
+ "Cameron Ave Station - Platform 3" => "Cameron Ave Bus Station - Platform 3",
+ "Cameron Ave Station - Platform 4" => "Cameron Ave Bus Station - Platform 4",
+ "Cameron Ave Station - Platform 5" => "Cameron Ave Bus Station - Platform 5",
+ "Burton & Garranan Hall, Daley Road ANU" => "Burton & Garran Hall, Daley Road ANU",
+ "Burton & Garranan Hall,Daley Road ANU" => "Burton & Garran Hall, Daley Road ANU",
+ "Newcastle Street after Isa St" => "Newcastle / Isa Street Fyshwick",
+ "National Circ/Canberra Ave" => "National Circuit / Canberra Ave",
+ }
+time_point_corrections.each do |wrong, right|
+ $time_points_sources[wrong].each do |wrongfile|
+ badtimetable = YAML::load_file(wrongfile)
+ badentrynumber = badtimetable["time_points"].index wrong
+ badtimetable["time_points"][badentrynumber] = right
+ puts "Corrected '" + wrong + "' to '" + right + "' in " + wrongfile
+ File.open(wrongfile, "w") do |f|
+ f.write badtimetable.to_yaml
+ end
+ end
+end
+
+getTimePoints()
+pp $time_points.sort!
+
--- /dev/null
+++ b/maxious-canberra-transit-feed/03-locatetimepoints.rb
@@ -1,1 +1,118 @@
+#!/usr/bin/ruby
+require 'postgres'
+require 'highline.rb'
+include HighLine
+
+require 'yaml'
+require 'pp'
+Dir.chdir("output")
+
+def getTimePoints()
+ $time_points = []
+ $time_points_sources = Hash.new([])
+ Dir.glob("*.yml") { |file|
+ timetable = YAML::load_file(file)
+ $time_points = $time_points | timetable["time_points"]
+ timetable["time_points"].each do |timepoint|
+ $time_points_sources[timepoint] = $time_points_sources[timepoint] | [ file ]
+ end
+ }
+end
+
+getTimePoints()
+$time_points.sort!
+
+connbus = PGconn.connect("localhost", 5432, '', '', "bus", "postgres",
+"snmc")
+connosm = PGconn.connect("localhost", 5432, '', '', "openstreetmap",
+"postgres", "snmc")
+
+if ask_if("Insert Timing Point names to database?")
+ $time_points.each do |time_point|
+ begin
+ time_point = time_point.gsub(/\\/, '\&\&').gsub(/'/, "''")
+ res = connbus.exec("INSERT INTO timing_point (name) VALUES ('#{time_point}')")
+ puts "Put '#{time_point}' into DB"
+ rescue PGError => e
+ puts "Error inserting '#{time_point}' to DB #{e}"
+ #conn.close() if conn
+ end
+ end
+end
+
+
+if ask_if("Fill null Timing Points from OSM bus_stop database?")
+ begin
+ null_points = connbus.exec('SELECT name FROM timing_point WHERE lat IS null OR lng IS null;')
+ rescue PGError => e
+ puts "Error selecting null points from DB #{e}"
+ #conn.close() if conn
+ end
+
+ null_points.each do |null_point_name|
+ begin
+ name = null_point_name.to_s.gsub(/\\/, '\&\&').gsub(/'/, "''")
+ pp name
+ matching_nodes = connosm.exec("Select * FROM (SELECT * from current_node_tags,
+ (Select id as ctagid FROM current_node_tags WHERE v LIKE '%#{name}%') as a
+ where a.ctagid = current_node_tags.id) as ctags INNER JOIN current_nodes ON
+ ctags.id=current_nodes.id")
+ rescue PGError => e
+ puts "Error selecting matching bus stops from DB #{e}"
+ #conn.close() if conn
+ end
+ suggested_nodes = Hash.new()
+
+ matching_nodes.each do |matching_node_row|
+ #pp matching_node_row
+ # 0 = id
+ # 1 = k
+ # 2 = v
+ # 3,4 = redundant ids
+ # 5 = lat*100000
+ # 6 = lng*100000
+ suggested_node = suggested_nodes.fetch(matching_node_row[0], {'lat' => Float(matching_node_row[5])/10000000,
+ 'lng' => Float(matching_node_row[6])/10000000})
+ if matching_node_row[1] == "ref"
+ matching_node_row[1] = "loc_ref"
+ end
+ suggested_node[matching_node_row[1]] = matching_node_row[2]
+ suggested_nodes[matching_node_row[0]] = suggested_node
+ end
+ pp suggested_nodes
+ nodeID = ask("Enter selected node ID:", :string)
+ if suggested_nodes.has_key?(nodeID)
+ node = suggested_nodes.fetch(nodeID)
+ guess = ask_if("Is this a guess?")
+ puts "Location #{node["lat"]},#{node["lng"]} for #{null_point_name}"
+ begin
+ res = connbus.exec("UPDATE timing_point SET lat = #{node["lat"]*10000000}, lng =
+#{node["lng"]*10000000},osm_node = #{nodeID}" + (node.has_key?("loc_ref") ? ",loc_ref = #{node["loc_ref"]}" : "") + ",guess = #{guess} WHERE name
+= '#{name}'")
+ puts "Put '#{null_point_name}' into DB"
+ rescue PGError => e
+ puts "Error inserting '#{null_point_name}' to DB #{e}"
+ ask_if("Continue?")
+ #conn.close() if conn
+ end
+ else
+ puts "Uhh, there was no suggestion ID like that. Try again next time!"
+ end
+ end
+end
+if ask_if("Fill null Timing Points from geocoder?")
+ begin
+ null_points = connbus.exec('SELECT name FROM timing_point WHERE lat IS null OR lng IS null;')
+ rescue PGError => e
+ puts "Error selecting null points from DB #{e}"
+ #conn.close() if conn
+ end
+
+ null_points.each do |null_point_name|
+ pp null_point_name
+ end
+end
+
+
+
--- /dev/null
+++ b/maxious-canberra-transit-feed/highline.rb
@@ -1,1 +1,140 @@
+module HighLine
+ # prompt = text to display
+ # type can be one of :string, :integer, :float, :bool or a proc
+ # if it's a proc then it is called with the entered string. If the input
+ # cannot be converted then it should throw an exception
+ # if type == :bool then y,yes are converted to true. n,no are converted to
+ # false. All other values are rejected.
+ #
+ # options should be a hash of validation options
+ # :validate => regular expresion or proc
+ # if validate is a regular expression then the input is matched against it
+ # if it's a proc then the proc is called and the input is accepted if it
+ # returns true
+ # :between => range
+ # the input is checked if it lies within the range
+ # :above => value
+ # the input is checked if it is above the value
+ # :below => value
+ # the input is checked if it is less than the value
+ # :default => string
+ # if the user doesn't enter a value then the default value is returned
+ # :base => [b, o, d, x]
+ # when asking for integers this will take a number in binary, octal,
+ # decimal or hexadecimal
+ def ask(prompt, type, options=nil)
+ begin
+ valid = true
+ default = option(options, :default)
+ if default
+ defaultstr = " |#{default}|"
+ else
+ defaultstr = ""
+ end
+
+ base = option(options, :base)
+
+ print prompt, "#{defaultstr} "
+ $stdout.flush
+ input = gets.chomp
+
+ if default && input == ""
+ input = default
+ end
+
+ #comvert the input to the correct type
+ input = case type
+ when :string: input
+ when :integer: convert(input, base) rescue valid = false
+ when :float: Float(input) rescue valid = false
+ when :bool
+ valid = input =~ /^(y|n|yes|no)$/
+ input[0] == ?y
+ when Proc: input = type.call(input) rescue valid = false
+ end
+
+ #validate the input
+ valid &&= validate(options, :validate) do |test|
+ case test
+ when Regexp: input =~ test
+ when Proc: test.call(input)
+ end
+ end
+ valid &&= validate(options, :within) { |range| range === input}
+ valid &&= validate(options, :above) { |value| input > value}
+ valid &&= validate(options, :below) { |value| input < value}
+
+ puts "Not a valid value" unless valid
+ end until valid
+
+ return input
+ end
+
+ #asks a yes/no question
+ def ask_if(prompt)
+ ask(prompt, :bool)
+ end
+
+ private
+
+ #extracts a key from the options hash
+ def option(options, key)
+ result = nil
+ if options && options.key?(key)
+ result = options[key]
+ end
+ result
+ end
+
+ #helper function for validation
+ def validate(options, key)
+ result = true
+ if options && options.key?(key)
+ result = yield options[key]
+ end
+ result
+ end
+
+ #converts a string to an integer
+ #input = the value to convert
+ #base = the numeric base of the value b,o,d,x
+ def convert(input, base)
+ if base
+ if ["b", "o", "d", "x"].include?(base)
+ input = "0#{base}#{input}"
+ value = Integer(input)
+ else
+ value = Integer(input)
+ end
+ else
+ value = Integer(input)
+ end
+
+ value
+ end
+end
+
+
+
+if __FILE__ == $0
+ include HighLine
+ #string input using a regexp to validate, returns test as the default value
+ p ask("enter a string, (all lower case)", :string, :validate => /^[a-z]*$/, :default => "test")
+ #string input using a proc to validate
+ p ask("enter a string, (between 3 and 6 characters)", :string, :validate => proc { |input| (3..6) === input.length})
+
+ #integer intput using :within
+ p ask("enter an integer, (0-10)", :integer, :within => 0..10)
+ #float input using :above
+ p ask("enter a float, (> 6)", :float, :above => 6)
+
+ #getting a binary value
+ p ask("enter a binary number", :integer, :base => "b")
+
+ #using a proc to convert the a comma seperated list into an array
+ p ask("enter a comma seperated list", proc { |x| x.split(/,/)})
+
+ p ask_if("do you want to continue?")
+end
+