123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242 |
- ##
- # A parser is simple a class that subclasses RDoc::Parser and implements #scan
- # to fill in an RDoc::TopLevel with parsed data.
- #
- # The initialize method takes an RDoc::TopLevel to fill with parsed content,
- # the name of the file to be parsed, the content of the file, an RDoc::Options
- # object and an RDoc::Stats object to inform the user of parsed items. The
- # scan method is then called to parse the file and must return the
- # RDoc::TopLevel object. By calling super these items will be set for you.
- #
- # In order to be used by RDoc the parser needs to register the file extensions
- # it can parse. Use ::parse_files_matching to register extensions.
- #
- # require 'rdoc'
- #
- # class RDoc::Parser::Xyz < RDoc::Parser
- # parse_files_matching /\.xyz$/
- #
- # def initialize top_level, file_name, content, options, stats
- # super
- #
- # # extra initialization if needed
- # end
- #
- # def scan
- # # parse file and fill in @top_level
- # end
- # end
- class RDoc::Parser
- @parsers = []
- class << self
- ##
- # An Array of arrays that maps file extension (or name) regular
- # expressions to parser classes that will parse matching filenames.
- #
- # Use parse_files_matching to register a parser's file extensions.
- attr_reader :parsers
- end
- ##
- # Alias an extension to another extension. After this call, files ending
- # "new_ext" will be parsed using the same parser as "old_ext"
- def self.alias_extension(old_ext, new_ext)
- old_ext = old_ext.sub(/^\.(.*)/, '\1')
- new_ext = new_ext.sub(/^\.(.*)/, '\1')
- parser = can_parse "xxx.#{old_ext}"
- return false unless parser
- RDoc::Parser.parsers.unshift [/\.#{new_ext}$/, parser]
- true
- end
- ##
- # Determines if the file is a "binary" file which basically means it has
- # content that an RDoc parser shouldn't try to consume.
- def self.binary?(file)
- return false if file =~ /\.(rdoc|txt)$/
- s = File.read(file, 1024) or return false
- have_encoding = s.respond_to? :encoding
- if have_encoding then
- return false if s.encoding != Encoding::ASCII_8BIT and s.valid_encoding?
- end
- return true if s[0, 2] == Marshal.dump('')[0, 2] or s.index("\x00")
- if have_encoding then
- s.force_encoding Encoding.default_external
- not s.valid_encoding?
- else
- if 0.respond_to? :fdiv then
- s.count("\x00-\x7F", "^ -~\t\r\n").fdiv(s.size) > 0.3
- else # HACK 1.8.6
- (s.count("\x00-\x7F", "^ -~\t\r\n").to_f / s.size) > 0.3
- end
- end
- end
- ##
- # Processes common directives for CodeObjects for the C and Ruby parsers.
- #
- # Applies +directive+'s +value+ to +code_object+, if appropriate
- def self.process_directive code_object, directive, value
- warn "RDoc::Parser::process_directive is deprecated and wil be removed in RDoc 4. Use RDoc::Markup::PreProcess#handle_directive instead" if $-w
- case directive
- when 'nodoc' then
- code_object.document_self = nil # notify nodoc
- code_object.document_children = value.downcase != 'all'
- when 'doc' then
- code_object.document_self = true
- code_object.force_documentation = true
- when 'yield', 'yields' then
- # remove parameter &block
- code_object.params.sub!(/,?\s*&\w+/, '') if code_object.params
- code_object.block_params = value
- when 'arg', 'args' then
- code_object.params = value
- end
- end
- ##
- # Checks if +file+ is a zip file in disguise. Signatures from
- # http://www.garykessler.net/library/file_sigs.html
- def self.zip? file
- zip_signature = File.read file, 4
- zip_signature == "PK\x03\x04" or
- zip_signature == "PK\x05\x06" or
- zip_signature == "PK\x07\x08"
- end
- ##
- # Return a parser that can handle a particular extension
- def self.can_parse(file_name)
- parser = RDoc::Parser.parsers.find { |regexp,| regexp =~ file_name }.last
- # HACK Selenium hides a jar file using a .txt extension
- return if parser == RDoc::Parser::Simple and zip? file_name
- # The default parser must not parse binary files
- ext_name = File.extname file_name
- return parser if ext_name.empty?
- return if parser == RDoc::Parser::Simple and ext_name !~ /txt|rdoc/
- parser
- end
- ##
- # Finds and instantiates the correct parser for the given +file_name+ and
- # +content+.
- def self.for top_level, file_name, content, options, stats
- return if binary? file_name
- parser = use_markup content
- unless parser then
- # If no extension, look for shebang
- if file_name !~ /\.\w+$/ && content =~ %r{\A#!(.+)} then
- shebang = $1
- case shebang
- when %r{env\s+ruby}, %r{/ruby}
- file_name = "dummy.rb"
- end
- end
- parser = can_parse file_name
- end
- return unless parser
- parser.new top_level, file_name, content, options, stats
- end
- ##
- # Record which file types this parser can understand.
- #
- # It is ok to call this multiple times.
- def self.parse_files_matching(regexp)
- RDoc::Parser.parsers.unshift [regexp, self]
- end
- ##
- # If there is a <tt>markup: parser_name</tt> comment at the front of the
- # file, use it to determine the parser. For example:
- #
- # # markup: rdoc
- # # Class comment can go here
- #
- # class C
- # end
- #
- # The comment should appear as the first line of the +content+.
- #
- # If the content contains a shebang or editor modeline the comment may
- # appear on the second or third line.
- #
- # Any comment style may be used to hide the markup comment.
- def self.use_markup content
- markup = content.lines.first(3).grep(/markup:\s+(\w+)/) { $1 }.first
- return unless markup
- return RDoc::Parser::Ruby if markup == 'tomdoc'
- markup = Regexp.escape markup
- RDoc::Parser.parsers.find do |_, parser|
- /^#{markup}$/i =~ parser.name.sub(/.*:/, '')
- end.last
- end
- ##
- # Creates a new Parser storing +top_level+, +file_name+, +content+,
- # +options+ and +stats+ in instance variables. In +@preprocess+ an
- # RDoc::Markup::PreProcess object is created which allows processing of
- # directives.
- def initialize top_level, file_name, content, options, stats
- @top_level = top_level
- @top_level.parser = self.class
- @file_name = file_name
- @content = content
- @options = options
- @stats = stats
- @preprocess = RDoc::Markup::PreProcess.new @file_name, @options.rdoc_include
- @preprocess.options = @options
- end
- autoload :RubyTools, 'rdoc/parser/ruby_tools'
- autoload :Text, 'rdoc/parser/text'
- end
- # simple must come first in order to show up last in the parsers list
- require 'rdoc/parser/simple'
- require 'rdoc/parser/rd'
- require 'rdoc/parser/ruby'
- require 'rdoc/parser/c'
|