#!/usr/bin/ruby =begin -------------------------------------------------------------------------------- A utility that reads an RDF file, builds a model, sorts all of the URIs that have labels, and associates those URIs with the labels in a supplied text file, one line per label. These labels are assigned the language specified on the command line, and the resulting RDF statements are sent to standard output as N3. On the command line provide the path to the RDF file, the path to the labels file, and the desired language/locale. E.g.: label_inserter.rb ../../vivo-core-1.5-annotations.rdf labels.file es_ES -------------------------------------------------------------------------------- =end $: << File.dirname(File.expand_path(__FILE__)) require 'rubygems' require 'rdf' require 'label_common' include RDF class LabelStripper # ------------------------------------------------------------------------------------ private # ------------------------------------------------------------------------------------ # # Parse the arguments and complain if they don't make sense. # def sanity_check_arguments(args) raise "usage is: label_inserter.rb [ok]" unless (4..5).include?(args.length) if args[4].nil? ok = false elsif args[4].downcase == 'ok' ok = true else raise "fifth argument, if present, must be 'ok'" end rdf_file = args[0] raise "File '#{rdf_file}' does not exist." unless File.exist?(rdf_file) labels_input_file = args[1] raise "File '#{labels_input_file}' does not exist." unless File.exist?(labels_input_file) locale = args[2] raise "Locale should be like 'ab' or 'ab-CD'." unless /^[a-z]{2}(-[A-Z]{2})?$/ =~ locale n3_output_file = args[3] raise "File '#{n3_output_file}' already exists. specify 'ok' to overwrite it." if File.exist?(n3_output_file) && !ok return rdf_file, labels_input_file, locale, n3_output_file end # ------------------------------------------------------------------------------------ public # ------------------------------------------------------------------------------------ def initialize(args) @rdf_file, @labels_input_file, @locale, @n3_output_file = sanity_check_arguments(args) end def process(&filter) filter = filter || lambda{true} query = Query.new({ :prop => { RDFS.label => :label, } }) solutions = LabelCommon.new(@rdf_file).process(query, &filter) labels = IO.readlines(@labels_input_file) raise "Number of labels (#{labels.length}) doesn't match number of URIs (#{solutions.length})" unless labels.length == solutions.length graph = Graph.new solutions.zip(labels).each do |data| s = data[0].prop p = RDFS.label o = Literal.new(data[1].chomp, :language => @locale) graph << Statement.new(s, p, o) end File.open(@n3_output_file, 'w') do |f| f.puts graph.dump(:ntriples) end end end # # # ------------------------------------------------------------------------------------ # Standalone calling. # # Do this if this program was called from the command line. That is, if the command # expands to the path of this file. # ------------------------------------------------------------------------------------ # vivo_filter = lambda {|s| s.prop.start_with?("http://vivoweb.org/ontology/core#") && !s.label.to_s.strip.empty?} if File.expand_path($0) == File.expand_path(__FILE__) stripper = LabelStripper.new(ARGV) stripper.process(&vivo_filter) end