Adding module for parsing files. This module is only included into the parsedfile provider base class, but it is cleaner to have it broken out like this.

git-svn-id: https://reductivelabs.com/svn/puppet/trunk@1855 980ebf18-57e1-0310-9a29-db15c13687c0
author: luke <luke@980ebf18-57e1-0310-9a29-db15c13687c0> 2006-11-10 23:52:02 +0000
committer: luke <luke@980ebf18-57e1-0310-9a29-db15c13687c0> 2006-11-10 23:52:02 +0000
commit: 7c8614b0589f7c843d17b9d16720419817394cee (patch)
tree: d2144ed9ed26ae509c30b3a738a8ae5e3e6e7b70
parent: f9d62136a76c9a8e6885261e6930414e8ae1f496 (diff)
download: puppet-7c8614b0589f7c843d17b9d16720419817394cee.tar.gz
puppet-7c8614b0589f7c843d17b9d16720419817394cee.tar.xz
puppet-7c8614b0589f7c843d17b9d16720419817394cee.zip
2 files changed, 565 insertions, 0 deletions
diff --git a/lib/puppet/util/fileparsing.rb b/lib/puppet/util/fileparsing.rb
new file mode 100644
index 000000000..e4998cf7e
--- /dev/null
+++ b/lib/puppet/util/fileparsing.rb
@@ -0,0 +1,200 @@
+# A mini-language for parsing files.  This is only used file the ParsedFile
+# provider, but it makes more sense to split it out so it's easy to maintain
+# in one place.
+#
+# You can use this module to create simple parser/generator classes.  For instance,
+# the following parser should go most of the way to parsing /etc/passwd:
+#
+#   class Parser
+#       include Puppet::Util::FileParsing
+#       record_line :user, :fields => %w{name password uid gid gecos home shell},
+#           :separator => ":"
+#   end
+#
+# You would use it like this:
+#
+#   parser = Parser.new
+#   lines = parser.parse(File.read("/etc/passwd"))
+#
+#   lines.each do |type, hash| # type will always be :user, since we only have one
+#       p hash
+#   end
+#
+# Each line in this case would be a hash, with each field set appropriately.
+# You could then call 'parser.to_line(hash)' on any of those hashes to generate
+# the text line again.
+
+module Puppet::Util::FileParsing
+    include Puppet::Util
+    attr_writer :line_separator, :trailing_separator
+
+    # Clear all existing record definitions.  Only used for testing.
+    def clear_records
+        @record_types.clear
+        @record_order.clear
+    end
+
+    # Try to match a specific text line.
+    def handle_text_line(line, hash)
+        if line =~ hash[:match]
+            return {:record_type => hash[:name], :line => line}
+        else
+            return nil
+        end
+    end
+
+    # Try to match a record.
+    def handle_record_line(line, hash)
+        if hash[:match]
+        else
+            ret = {}
+            hash[:fields].zip(line.split(hash[:separator])) do |param, value|
+                ret[param] = value
+            end
+            ret[:record_type] = hash[:name]
+            return ret
+        end
+    end
+
+    def line_separator
+        unless defined?(@line_separator)
+            @line_separator = "\n"
+        end
+
+        @line_separator
+    end
+
+    # Split text into separate lines using the record separator.
+    def lines(text)
+        # Remove any trailing separators, and then split based on them
+        text.sub(/#{self.line_separator}\Q/,'').split(self.line_separator)
+    end
+
+    # Split a bunch of text into lines and then parse them individually.
+    def parse(text)
+        lines(text).collect do |line|
+            parse_line(line)
+        end
+    end
+
+    # Handle parsing a single line.
+    def parse_line(line)
+        unless records?
+            raise Puppet::DevError, "No record types defined; cannot parse lines"
+        end
+
+        @record_order.each do |name|
+            hash = @record_types[name]
+            unless hash
+                raise Puppet::DevError, "Did not get hash for %s: %s" %
+                    [name, @record_types.inspect]
+            end
+            method = "handle_%s_line" % hash[:type]
+            if respond_to?(method)
+                if result = send(method, line, hash)
+                    return result
+                end
+            else
+                raise Puppet::DevError, "Somehow got invalid line type %s" % hash[:type]
+            end
+        end
+
+        return nil
+    end
+
+    # Define a new type of record.  These lines get split into hashes.
+    def record_line(name, options)
+        unless options.include?(:fields)
+            raise ArgumentError, "Must include a list of fields"
+        end
+
+        options[:fields] = options[:fields].collect do |field|
+            r = symbolize(field)
+            if r == :record_type
+                raise ArgumentError.new("Cannot have fields named record_type")
+            end
+            r
+        end
+
+        options[:separator] ||= /\s+/
+
+        # Unless they specified a string-based joiner, just use a single
+        # space as the join value.
+        unless options[:separator].is_a?(String) or options[:joiner]
+            options[:joiner] = " "
+        end
+
+        new_line_type(name, :record, options)
+    end
+
+    # Are there any record types defined?
+    def records?
+        defined?(@record_types) and ! @record_types.empty?
+    end
+
+    # Define a new type of text record.
+    def text_line(name, options)
+        unless options.include?(:match)
+            raise ArgumentError, "You must provide a :match regex for text lines"
+        end
+
+        new_line_type(name, :text, options)
+    end
+
+    # Generate a file from a bunch of hash records.
+    def to_file(records)
+        text = records.collect { |record| to_line(record) }.join(line_separator)
+
+        if trailing_separator
+            text += line_separator
+        end
+
+        return text
+    end
+
+    # Convert our parsed record into a text record.
+    def to_line(details)
+        unless type = @record_types[details[:record_type]]
+            raise ArgumentError, "Invalid record type %s" % details[:record_type]
+        end
+
+        case type[:type]
+        when :text: return details[:line]
+        else
+            joinchar = type[:joiner] || type[:separator]
+
+            return type[:fields].collect { |field| details[field].to_s }.join(joinchar)
+        end
+    end
+
+    # Whether to add a trailing separator to the file.  Defaults to true
+    def trailing_separator
+        if defined? @trailing_separator
+            return @trailing_separator
+        else
+            return true
+        end
+    end
+
+    private
+    # Define a new type of record.
+    def new_line_type(name, type, options)
+        @record_types ||= {}
+        @record_order ||= []
+
+        name = symbolize(name)
+
+        if @record_types.include?(name)
+            raise ArgumentError, "Line type %s is already defined" % name
+        end
+
+        options[:name] = name
+        options[:type] = type
+        @record_types[name] = options
+        @record_order << name
+
+        return options
+    end
+end
+
+# $Id$
diff --git a/test/util/fileparsing.rb b/test/util/fileparsing.rb
new file mode 100755
index 000000000..f5cf0d255
--- /dev/null
+++ b/test/util/fileparsing.rb
@@ -0,0 +1,365 @@
+#!/usr/bin/env ruby
+
+$:.unshift("../lib").unshift("../../lib") if __FILE__ =~ /\.rb$/
+
+require 'puppettest'
+require 'puppettest/fileparsing'
+require 'puppet'
+require 'puppet/util/fileparsing'
+
+class TestUtilFileParsing < Test::Unit::TestCase
+	include PuppetTest
+	include PuppetTest::FileParsing
+
+    class FParser
+        include Puppet::Util::FileParsing
+    end
+
+    def test_lines
+        parser = FParser.new
+
+        assert_equal("\n", parser.line_separator,
+            "Default separator was incorrect")
+
+        {"\n" => ["one two\nthree four", "one two\nthree four\n"],
+         "\t" => ["one two\tthree four", "one two\tthree four\t"],
+        }.each do |sep, tests|
+            assert_nothing_raised do
+                parser.line_separator = sep
+            end
+            assert_equal(sep, parser.line_separator,
+                "Did not set separator")
+
+            tests.each do |test|
+                assert_equal(["one two", "three four"], parser.lines(test),
+                    "Incorrectly parsed %s" % test.inspect)
+            end
+        end
+    end
+
+    # Make sure parse calls the appropriate methods or errors out
+    def test_parse
+        parser = FParser.new
+
+        parser.meta_def(:parse_line) do |line|
+            line.split(/\s+/)
+        end
+
+        text = "one line\ntwo line"
+        should = [%w{one line}, %w{two line}]
+        ret = nil
+        assert_nothing_raised do
+            ret = parser.parse(text)
+        end
+
+        assert_equal(should, ret)
+    end
+
+    # Make sure we correctly handle different kinds of text lines.
+    def test_text_line
+        parser = FParser.new
+
+        comment = "# this is a comment"
+
+        # Make sure it fails if no regex is passed
+        assert_raise(ArgumentError) do
+            parser.text_line :comment
+        end
+
+        # define a text matching comment record
+        assert_nothing_raised do
+            parser.text_line :comment, :match => /^#/
+        end
+
+        # Make sure it matches
+        assert_nothing_raised do
+            assert_equal({:record_type => :comment, :line => comment}, 
+                 parser.parse_line(comment))
+        end
+
+        # But not something else
+        assert_nothing_raised do
+            assert_nil(parser.parse_line("some other text"))
+        end
+
+        # Now define another type and make sure we get the right one back
+        assert_nothing_raised do
+            parser.text_line :blank, :match => /^\s*$/
+        end
+
+        # The comment should still match
+        assert_nothing_raised do
+            assert_equal({:record_type => :comment, :line => comment}, 
+                 parser.parse_line(comment))
+        end
+
+        # As should our new line type
+        assert_nothing_raised do
+            assert_equal({:record_type => :blank, :line => ""}, 
+                 parser.parse_line(""))
+        end
+
+    end
+
+    def test_parse_line
+        parser = FParser.new
+
+        comment = "# this is a comment"
+
+        # Make sure it fails if we don't have any record types defined
+        assert_raise(Puppet::DevError) do
+            parser.parse_line(comment)
+        end
+
+        # Now define a text matching comment record
+        assert_nothing_raised do
+            parser.text_line :comment, :match => /^#/
+        end
+
+        # And make sure we can't define another one with the same name
+        assert_raise(ArgumentError) do
+            parser.text_line :comment, :match => /^"/
+        end
+
+        result = nil
+        assert_nothing_raised("Did not parse text line") do
+            result = parser.parse_line comment
+        end
+
+        assert_equal({:record_type => :comment, :line => comment}, result)
+
+        # Make sure we just return nil on unmatched lines.
+        assert_nothing_raised("Did not parse text line") do
+            result = parser.parse_line "No match for this"
+        end
+
+        assert_nil(result, "Somehow matched an empty line")
+
+        # Now define another type of comment, and make sure both types get
+        # correctly returned as comments
+        assert_nothing_raised do
+            parser.text_line :comment2, :match => /^"/
+        end
+
+        assert_nothing_raised("Did not parse old comment") do
+            assert_equal({:record_type => :comment, :line => comment}, 
+                 parser.parse_line(comment))
+        end
+        comment = '" another type of comment'
+        assert_nothing_raised("Did not parse new comment") do
+            assert_equal({:record_type => :comment2, :line => comment}, 
+                 parser.parse_line(comment))
+        end
+
+        # Now define two overlapping record types and make sure we keep the
+        # correct order.  We do first match, not longest match.
+        assert_nothing_raised do
+            parser.text_line :one, :match => /^y/
+            parser.text_line :two, :match => /^yay/
+        end
+
+        assert_nothing_raised do
+            assert_equal({:record_type => :one, :line => "yayness"},
+                parser.parse_line("yayness"))
+        end
+
+    end
+
+    def test_record_line
+        parser = FParser.new
+
+        tabrecord = "tab	separated	content"
+        spacerecord = "space separated content"
+
+        # Make sure we always require an appropriate set of options
+        [{:separator => "\t"}, {}, {:fields => %w{record_type}}].each do |opts|
+            assert_raise(ArgumentError, "Accepted %s" % opts.inspect) do
+                parser.record_line :record, opts
+            end
+        end
+
+        # Verify that our default separator is tabs
+        tabs = nil
+        assert_nothing_raised do
+            tabs = parser.record_line :tabs, :fields => [:name, :first, :second]
+        end
+
+        # Make sure out tab line gets matched
+        tabshould = {:record_type => :tabs, :name => "tab", :first => "separated",
+                            :second => "content"}
+        assert_nothing_raised do
+            assert_equal(tabshould, parser.handle_record_line(tabrecord, tabs))
+        end
+
+        # Now add our space-separated record type
+        spaces = nil
+        assert_nothing_raised do
+            spaces = parser.record_line :spaces, :fields => [:name, :first, :second]
+        end
+
+        # Now make sure both lines parse correctly
+        spaceshould = {:record_type => :spaces, :name => "space",
+            :first => "separated", :second => "content"}
+
+        assert_nothing_raised do
+            assert_equal(tabshould, parser.handle_record_line(tabrecord, tabs))
+            assert_equal(spaceshould, parser.handle_record_line(spacerecord, spaces))
+        end
+    end
+
+    def test_to_line
+        parser = FParser.new
+
+        parser.text_line :comment, :match => /^#/
+        parser.text_line :blank, :match => /^\s*$/
+        parser.record_line :record, :fields => %w{name one two}, :joiner => "\t"
+
+        johnny = {:record_type => :record, :name => "johnny", :one => "home",
+            :two => "yay"}
+        bill = {:record_type => :record, :name => "bill", :one => "work",
+            :two => "boo"}
+
+        records = {
+            :comment => {:record_type => :comment, :line => "# This is a file"},
+            :blank => {:record_type => :blank, :line => ""},
+            :johnny => johnny,
+            :bill => bill
+        }
+
+        lines = {
+            :comment => "# This is a file",
+            :blank => "",
+            :johnny => "johnny	home	yay",
+            :bill => "bill	work	boo"
+        }
+
+        records.each do |name, details|
+            result = nil
+            assert_nothing_raised do
+                result = parser.to_line(details)
+            end
+
+            assert_equal(lines[name], result)
+        end
+        order = [:comment, :blank, :johnny, :bill]
+
+        file = order.collect { |name| lines[name] }.join("\n")
+
+        ordered_records = order.collect { |name| records[name] }
+
+        # Make sure we default to a trailing separator
+        assert_equal(true, parser.trailing_separator,
+            "Did not default to a trailing separtor")
+
+        # Start without a trailing separator
+        parser.trailing_separator = false
+        assert_nothing_raised do
+            assert_equal(file, parser.to_file(ordered_records))
+        end
+
+        # Now with a trailing separator
+        file += "\n"
+        parser.trailing_separator = true
+        assert_nothing_raised do
+            assert_equal(file, parser.to_file(ordered_records))
+        end
+
+        # Now try it with a different separator, so we're not just catching
+        # defaults
+        file.gsub!("\n", "\t")
+        parser.line_separator = "\t"
+        assert_nothing_raised do
+            assert_equal(file, parser.to_file(ordered_records))
+        end
+    end
+
+    # Make sure we can specify a different join character than split character
+    def test_split_join_record_line
+        parser = FParser.new
+
+        check = proc do |start, record, final|
+            # Check parsing first
+            assert_equal(record, parser.parse_line(start),
+                "Did not correctly parse %s" % start.inspect)
+
+            # And generating
+            assert_equal(final, parser.to_line(record),
+                "Did not correctly generate %s from %s" %
+                [final.inspect, record.inspect])
+        end
+
+        # First try it with symmetric characters
+        parser.record_line :symmetric, :fields => %w{one two},
+            :separator => " "
+
+        check.call "a b",
+            {:record_type => :symmetric, :one => "a", :two => "b"}, "a b"
+
+        # Now assymetric but both strings
+        parser.record_line :asymmetric, :fields => %w{one two},
+            :separator => "\t", :joiner => " "
+
+        check.call "a\tb",
+            {:record_type => :symmetric, :one => "a", :two => "b"}, "a b"
+
+        # And assymmetric with a regex
+        parser.record_line :asymmetric2, :fields => %w{one two},
+            :separator => /\s+/, :joiner => " "
+
+        check.call "a\tb",
+            {:record_type => :symmetric, :one => "a", :two => "b"}, "a b"
+        check.call "a b",
+            {:record_type => :symmetric, :one => "a", :two => "b"}, "a b"
+    end
+
+    # Make sure we correctly regenerate files.
+    def test_to_file
+        parser = FParser.new
+
+        parser.text_line :comment, :match => /^#/
+        parser.text_line :blank, :match => /^\s*$/
+        parser.record_line :record, :fields => %w{name one two}
+
+        text = "# This is a comment
+
+johnny one two
+billy three four"
+
+        # Just parse and generate, to make sure it's isomorphic.
+        assert_nothing_raised do
+            assert_equal
+        end
+    end
+
+    # Make sure we correctly handle optional fields.  We'll skip this
+    # functionality until we really know we need it.
+    def disabled_test_optional_fields
+        parser = FParser.new
+
+        assert_nothing_raised do
+            parser.record_line :record,
+                :fields => %w{one two three four},
+                :optional => %w{three four},
+                :separator => " " # A single space
+        end
+
+        ["a b c d", "a b  d", "a b", "a b  ", "a b c"].each do |line|
+            record = nil
+            assert_nothing_raised do
+                record = parser.parse_line(line)
+            end
+
+            # Now regenerate the line
+            newline = nil
+            assert_nothing_raised do
+                newline = parser.to_line(record)
+            end
+
+            # And make sure they're equal
+            assert_equal(line, newline)
+        end
+    end
+end
+
+# $Id$
+
author	luke <luke@980ebf18-57e1-0310-9a29-db15c13687c0>	2006-11-10 23:52:02 +0000
committer	luke <luke@980ebf18-57e1-0310-9a29-db15c13687c0>	2006-11-10 23:52:02 +0000
commit	7c8614b0589f7c843d17b9d16720419817394cee (patch)
tree	d2144ed9ed26ae509c30b3a738a8ae5e3e6e7b70
parent	f9d62136a76c9a8e6885261e6930414e8ae1f496 (diff)
download	puppet-7c8614b0589f7c843d17b9d16720419817394cee.tar.gz puppet-7c8614b0589f7c843d17b9d16720419817394cee.tar.xz puppet-7c8614b0589f7c843d17b9d16720419817394cee.zip