devdaily home | apple | java | perl | unix | directory | blog

What this is

This file is included in the DevDaily.com "Ruby Source Code Warehouse" project. The intent of this project is to help you "Learn Ruby by Example" TM.

Other links

The source code

# Copyritght (c) 2002 TANIGUCHI Takaki
# This program is distributed under the GNU GPL 2 or later.

require 'strscan'
require 'uri/common'
require 'delegate'
require 'pstore'

module AsWiki
  module FileScanner
    def FileScanner::[](pname)
      pspath = File.join($DIR_CACHE, "#{AsWiki::escape(pname)}.scan")
      ps = PStore.new(pspath.untaint)
      r = Repository.new
      ps.transaction do |s| 
	if r.mtime(pname) > File.mtime(pspath) or not s.root?('scan') # XXX 
	  scan = Scanner.new(r.load(pname).to_s)
	  s['scan'] = scan
	  # STDERR.puts "NOT #{pname}"
	  return scan
	else	  
	  # STDERR.puts "HIT #{pname}"
	  return s['scan']
	end	    
      end
    end
  end
  class Scanner
    PAT_URI =  /\A#{URI::REGEXP::PATTERN::X_ABS_URI}/xn
    C128 = [128].pack('C')
    C255 = [255].pack('C')
    def initialize(str)
      @q = scan(str)
    end
    def next_token
      return (@q.shift or [:EOF, nil]) # XXX raise??
    end
    private
    def scan(f)
      q = [] 
      sc = StringScanner.new(f.to_s)
      bol = true
      while sc.rest? do
	if bol
	  bol = false
	  if    tmp = sc.scan(/\A#begin .*$/)
	    q.push [:PLUGIN_BEGIN, tmp]
	  elsif tmp = sc.scan(/\A#end *$/)
	    q.push [:PLUGIN_END, tmp]
	  elsif tmp = sc.scan(/\A#.+$/)
	    q.push [:PLUGIN, tmp]
	  elsif tmp = sc.scan(/\A *\*/)
	    q.push [:UL, tmp]
	  elsif tmp = sc.scan(/\A *\(\d+\)/)
	    q.push [:OL, tmp]
	  elsif tmp = sc.scan(/\A *\+ */)
	    q.push [:DL, tmp]
	  elsif tmp = sc.scan(/\A={2,6}/)
	    q.push [:HN_BEGIN, tmp]
	  elsif tmp = sc.scan(/\A---- *$/)
	    q.push [:HR, tmp]
	  elsif tmp = sc.scan(/\A *\|\|/)
	    q.push [:TABLE_BEGIN, tmp]
	  elsif tmp = sc.scan(/\A\{\{\{ *$/)
	    q.push [:PRE_BEGIN, tmp]
	  elsif tmp = sc.scan(/\A\}\}\} *$/)
	    q.push [:PRE_END, tmp]
	  elsif tmp = sc.scan(/\A\.$/)
	    q.push [:ENDPERIOD, tmp]
	  elsif tmp = sc.scan(/\A[ \t\r\f]*$/) 
	    q.push [:BLANK, tmp]
	  end
	  next
	end
	if tmp = sc.scan(/\A\n/)
	  q.push [:EOL, tmp] 
	  bol=true
	elsif tmp = sc.scan(/\A\w+:[A-Z]\w+(?!:)/)
	  q.push [:INTERWIKINAME, tmp]
	elsif tmp = sc.scan(PAT_URI) 
	  if URI::extract(tmp, %w[http https ftp news mailto]).empty?
	    q.push [:OTHER, tmp]
	  else
	    q.push [:URI, tmp]
	  end
	elsif tmp = sc.scan($WIKINAMERE)
	  q.push [:WIKINAME1, tmp]
	elsif tmp = sc.scan(/\A\[\[\S+?\]\]/)
	  q.push [:WIKINAME2, tmp]
#	elsif tmp = sc.scan(/\A={1,6} *$/)
#	  q.push [:HN_END, tmp]
	elsif tmp = sc.scan(/\A +\.$/)
	  q.push [:ENDPERIOD, tmp]
	elsif tmp = sc.scan(/\A[ \t\r\f]+/)
	  q.push [:SPACE, tmp]
	elsif tmp = sc.scan(/\A\|\| *$/)
	  q.push [:TABLE_END, tmp]
	elsif tmp = sc.scan(/\A\|\|/)
	  q.push [:TABLE, tmp]
	elsif tmp = sc.scan(/\A\[img:#{URI::REGEXP::PATTERN::X_ABS_URI}\s+[^]]+?\]/xn)
	  q.push [:MOINHREFIMG, tmp]
	# elsif tmp = sc.scan(/\A\[\S+ +\S+?\]/)
	# elsif tmp = sc.scan(/\A\[\S+ +[^]]+?\]/)
	elsif tmp = sc.scan(/\A\[#{URI::REGEXP::PATTERN::X_ABS_URI}\s+[^]]+?\]/xn)
	  q.push [:MOINHREF, tmp]
	elsif tmp = sc.scan(/\A\{\{/)
	  q.push [:ESCAPE_BEGIN, tmp]
	elsif tmp = sc.scan(/\A\}\}/)
	  q.push [:ESCAPE_END, tmp]
	elsif tmp = sc.scan(/\A'''/)
	  q.push [:STRONG, tmp]
	elsif tmp = sc.scan(/\A''/)
	  q.push [:EM, tmp]
	elsif tmp = sc.scan(/\A[\w:]+/)
	  q.push [:WORD, tmp]
	elsif tmp = sc.scan(/\A[#{C128}-#{C255}]+/)
	  q.push [:OTHER, tmp]
	elsif tmp = sc.scan(/\A\S/e)
	  q.push [:OTHER, tmp]
	else
	  raise RangeError, 'must not happen: ' + sc.rest.inspect
	end
      end
      q.push [ :EOF, nil]
      return q
    end
  end
end




Copyright 1998-2008 Alvin Alexander
All Rights Reserved.
 
devdaily.com is based in louisville, kentucky, and this web site is hosted by godaddy.com