ruby--ruby/lib/abbrev.rb

#!/usr/bin/env ruby
#--
# Copyright (c) 2001,2003 Akinori MUSHA <knu@iDaemons.org>
#
# All rights reserved.  You can redistribute and/or modify it under
# the same terms as Ruby.
#
# $Idaemons: /home/cvs/rb/abbrev.rb,v 1.2 2001/05/30 09:37:45 knu Exp $
# $RoughId: abbrev.rb,v 1.4 2003/10/14 19:45:42 knu Exp $
# $Id$
#++

##
# Calculates the set of unique abbreviations for a given set of strings.
#
#   require 'abbrev'
#   require 'pp'
#
#   pp Abbrev.abbrev(['ruby', 'rules'])
#
# Generates:
#
#   { "rub"   =>  "ruby",
#     "ruby"  =>  "ruby",
#     "rul"   =>  "rules",
#     "rule"  =>  "rules",
#     "rules" =>  "rules" }
#
# It also provides an array core extension, Array#abbrev.
#
#   pp %w{summer winter}.abbrev
#   #=> {"summe"=>"summer",
#        "summ"=>"summer",
#        "sum"=>"summer",
#        "su"=>"summer",
#        "s"=>"summer",
#        "winte"=>"winter",
#        "wint"=>"winter",
#        "win"=>"winter",
#        "wi"=>"winter",
#        "w"=>"winter",
#        "summer"=>"summer",
#        "winter"=>"winter"}

module Abbrev

  # Given a set of strings, calculate the set of unambiguous
  # abbreviations for those strings, and return a hash where the keys
  # are all the possible abbreviations and the values are the full
  # strings.
  #
  # Thus, given +words+ of "car" and "cone", the keys pointing to "car" would
  # be "ca" and "car", while those pointing to "cone" would be "co", "con", and
  # "cone". ("c" is a prefix of both words, so it is ambiguous and left out.)
  #
  #   require 'abbrev'
  #   require 'pp'
  #
  #   pp Abbrev.abbrev(['car', 'cone'])
  #   #=> {"ca"=>"car", "con"=>"cone", "co"=>"cone", "car"=>"car", "cone"=>"cone"}
  #
  # +words+ is any collection of strings that responds to +each+.
  #
  # The optional +pattern+ parameter is a pattern or a string. Only
  # abbreviations and full words that match the pattern or start with the
  # string are included in the output hash.
  #
  #   pp %w{car box cone}.abbrev(/b/)
  #   #=> {"bo"=>"box", "b"=>"box", "box"=>"box"}
  #
  # A String +pattern+ is matched literally against the very beginning of
  # each candidate, never after an embedded newline.
  #
  # Every word that passes +pattern+ maps to itself in the result, even when
  # it is also a prefix of another word.  A word listed more than once makes
  # its own shorter prefixes count as ambiguous.
  #
  # Returns a new Hash of abbreviation => full word.
  def abbrev(words, pattern = nil)
    table = {}
    seen = Hash.new(0)  # how many times each proper prefix has been produced

    # A String pattern is a literal prefix.  Anchor it with \A (start of
    # string) rather than ^ (start of any line), otherwise a word such as
    # "foo\nbar" would be accepted for the prefix "bar".
    pattern = /\A#{Regexp.quote(pattern)}/ if pattern.is_a?(String)

    words.each do |word|
      next if word.empty?

      # Walk the proper prefixes of the word from longest to shortest.
      (word.size - 1).downto(1) do |len|
        prefix = word[0, len]

        next if pattern && pattern !~ prefix

        case seen[prefix] += 1
        when 1
          table[prefix] = word   # first sighting: unambiguous so far
        when 2
          table.delete(prefix)   # second sighting: ambiguous, drop it
        else
          # Seen three or more times: the entry was already dropped on the
          # second sighting, and every shorter prefix has been dealt with
          # by the earlier words, so stop early.
          break
        end
      end
    end

    # Full words always stand for themselves, overriding any prefix entry
    # that happens to spell another complete word.
    words.each do |word|
      next if pattern && pattern !~ word

      table[word] = word
    end

    table
  end

  module_function :abbrev
end

class Array
  # Builds the table of unambiguous abbreviations for the strings held in
  # this array by handing +self+ to Abbrev.abbrev.
  #
  #   abbr = %w{ car cone }.abbrev
  #   abbr #=> { "ca" => "car", "car" => "car",
  #           "co" => "cone", "con" => "cone",
  #           "cone" => "cone" }
  #
  # +pattern+ is optional and may be a pattern or a string; it is passed
  # through to Abbrev.abbrev unchanged.  Only entries that match the
  # pattern or start with the string end up in the resulting hash.
  #
  #   abbr = %w{ fast boat day }.abbrev(/^.a.*$/)
  #   abbr #=> {"fas"=>"fast","fa"=>"fast",
  #             "da"=>"day", "fast"=>"fast", "day"=>"day"}
  #
  # See also Abbrev.abbrev
  def abbrev(pattern = nil)
    Abbrev.abbrev(self, pattern)
  end
end

# When this file is executed directly (not required as a library), read
# input line by line and, for each line, print the abbreviation table of its
# whitespace-separated words as sorted "abbreviation => word" lines.
if __FILE__ == $PROGRAM_NAME
  while (input = gets)
    table = input.split.abbrev
    table.sort.each { |k, v| puts "#{k} => #{v}" }
  end
end
* lib/generator.rb: A new library which converts an internal iterator to an external iterator. * lib/abbrev.rb: A new library which creates an abbreviation table from a list. git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@4767 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2003-10-14 16:14:20 -04:00			`#!/usr/bin/env ruby`
* lib/abbrev.rb: Hide copyright and revision information from RDoc. Inspired by patch from David Copeland, bug #4703. git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@31593 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2011-05-16 14:51:56 -04:00			`#--`
* lib/generator.rb: A new library which converts an internal iterator to an external iterator. * lib/abbrev.rb: A new library which creates an abbreviation table from a list. git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@4767 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2003-10-14 16:14:20 -04:00			`# Copyright (c) 2001,2003 Akinori MUSHA <knu@iDaemons.org>`
			`#`
			`# All rights reserved. You can redistribute and/or modify it under`
			`# the same terms as Ruby.`
			`#`
			`# $Idaemons: /home/cvs/rb/abbrev.rb,v 1.2 2001/05/30 09:37:45 knu Exp $`
			`# $RoughId: abbrev.rb,v 1.4 2003/10/14 19:45:42 knu Exp $`
			`# $Id$`
* lib/abbrev.rb: Hide copyright and revision information from RDoc. Inspired by patch from David Copeland, bug #4703. git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@31593 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2011-05-16 14:51:56 -04:00			`#++`
RDoc abbrev git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@5513 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2004-01-20 00:27:23 -05:00
* lib/abbrev.rb: Clarified that Abbrev.abbrev returns a Hash instead of an Array. Patch by Andrei Bocan. [ruby-trunk - Bug #6107] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@35290 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2012-04-10 16:15:05 -04:00			`##`
			`# Calculates the set of unique abbreviations for a given set of strings.`
RDoc abbrev git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@5513 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2004-01-20 00:27:23 -05:00			`#`
			`# require 'abbrev'`
			`# require 'pp'`
			`#`
* lib/abbrev.rb: Clarified that Abbrev.abbrev returns a Hash instead of an Array. Patch by Andrei Bocan. [ruby-trunk - Bug #6107] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@35290 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2012-04-10 16:15:05 -04:00			`# pp Abbrev.abbrev(['ruby', 'rules'])`
RDoc abbrev git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@5513 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2004-01-20 00:27:23 -05:00			`#`
* lib/abbrev.rb: Clarified that Abbrev.abbrev returns a Hash instead of an Array. Patch by Andrei Bocan. [ruby-trunk - Bug #6107] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@35290 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2012-04-10 16:15:05 -04:00			`# Generates:`
RDoc abbrev git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@5513 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2004-01-20 00:27:23 -05:00			`#`
* lib/abbrev.rb: Clarified that Abbrev.abbrev returns a Hash instead of an Array. Patch by Andrei Bocan. [ruby-trunk - Bug #6107] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@35290 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2012-04-10 16:15:05 -04:00			`# { "rub" => "ruby",`
			`# "ruby" => "ruby",`
			`# "rul" => "rules",`
			`# "rule" => "rules",`
			`# "rules" => "rules" }`
RDoc abbrev git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@5513 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2004-01-20 00:27:23 -05:00			`#`
* lib/abbrev.rb: Documentation examples for Abbrev. [ruby-dev:47442] [Bug #6985] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@37113 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2012-10-06 16:03:26 -04:00			`# It also provides an array core extension, Array#abbrev.`
			`#`
			`# pp %w{summer winter}.abbrev`
			`# #=> {"summe"=>"summer",`
			`# "summ"=>"summer",`
			`# "sum"=>"summer",`
			`# "su"=>"summer",`
			`# "s"=>"summer",`
			`# "winte"=>"winter",`
			`# "wint"=>"winter",`
			`# "win"=>"winter",`
			`# "wi"=>"winter",`
			`# "w"=>"winter",`
			`# "summer"=>"summer",`
			`# "winter"=>"winter"}`
* lib/generator.rb: A new library which converts an internal iterator to an external iterator. * lib/abbrev.rb: A new library which creates an abbreviation table from a list. git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@4767 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2003-10-14 16:14:20 -04:00
			`module Abbrev`
RDoc abbrev git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@5513 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2004-01-20 00:27:23 -05:00
			`# Given a set of strings, calculate the set of unambiguous`
			`# abbreviations for those strings, and return a hash where the keys`
			`# are all the possible abbreviations and the values are the full`
* lib/abbrev.rb: Documentation examples for Abbrev. [ruby-dev:47442] [Bug #6985] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@37113 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2012-10-06 16:03:26 -04:00			`# strings.`
			`#`
			`# Thus, given input of "car" and "cone", the keys pointing to "car" would be`
			`# "ca" and "car", while those pointing to "cone" would be "co", "con", and`
			`# "cone".`
			`#`
			`# require 'abbrev'`
			`# require 'pp'`
			`#`
			`# pp Abbrev.abbrev(['car', 'cone'])`
			`# #=> {"ca"=>"car", "con"=>"cone", "co"=>"cone", "car"=>"car", "cone"=>"cone"}`
RDoc abbrev git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@5513 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2004-01-20 00:27:23 -05:00			`#`
			`# The optional +pattern+ parameter is a pattern or a string. Only`
* lib/abbrev.rb: Fixed typo in abbrev pattern documentation. Based on patch by Mark Rushakoff. [ruby-trunk - #6346] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@35584 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2012-05-07 19:55:53 -04:00			`# input strings that match the pattern or start with the string`
			`# are included in the output hash.`
* lib/abbrev.rb: Documentation examples for Abbrev. [ruby-dev:47442] [Bug #6985] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@37113 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2012-10-06 16:03:26 -04:00			`#`
			`# pp %w{car box cone}.abbrev(/b/)`
			`# #=> {"bo"=>"box", "b"=>"box", "box"=>"box"}`
* lib/generator.rb: A new library which converts an internal iterator to an external iterator. * lib/abbrev.rb: A new library which creates an abbreviation table from a list. git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@4767 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2003-10-14 16:14:20 -04:00			`def abbrev(words, pattern = nil)`
			`table = {}`
			`seen = Hash.new(0)`

			`if pattern.is_a?(String)`
* lib: Convert tabs to spaces for ruby files per http://redmine.ruby-lang.org/projects/ruby/wiki/DeveloperHowto#coding-style Patch by Steve Klabnik [Ruby 1.9 - Bug #4730] Patch by Jason Dew [Ruby 1.9 - Feature #4718] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@31635 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2011-05-18 17:19:18 -04:00			`pattern = /^#{Regexp.quote(pattern)}/ # regard as a prefix`
* lib/generator.rb: A new library which converts an internal iterator to an external iterator. * lib/abbrev.rb: A new library which creates an abbreviation table from a list. git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@4767 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2003-10-14 16:14:20 -04:00			`end`

			`words.each do \|word\|`
			`next if (abbrev = word).empty?`
			`while (len = abbrev.rindex(/[\w\W]\z/)) > 0`
* lib: Convert tabs to spaces for ruby files per http://redmine.ruby-lang.org/projects/ruby/wiki/DeveloperHowto#coding-style Patch by Steve Klabnik [Ruby 1.9 - Bug #4730] Patch by Jason Dew [Ruby 1.9 - Feature #4718] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@31635 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2011-05-18 17:19:18 -04:00			`abbrev = word[0,len]`
* lib/generator.rb: A new library which converts an internal iterator to an external iterator. * lib/abbrev.rb: A new library which creates an abbreviation table from a list. git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@4767 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2003-10-14 16:14:20 -04:00
* lib: Convert tabs to spaces for ruby files per http://redmine.ruby-lang.org/projects/ruby/wiki/DeveloperHowto#coding-style Patch by Steve Klabnik [Ruby 1.9 - Bug #4730] Patch by Jason Dew [Ruby 1.9 - Feature #4718] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@31635 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2011-05-18 17:19:18 -04:00			`next if pattern && pattern !~ abbrev`
* lib/generator.rb: A new library which converts an internal iterator to an external iterator. * lib/abbrev.rb: A new library which creates an abbreviation table from a list. git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@4767 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2003-10-14 16:14:20 -04:00
* lib: Convert tabs to spaces for ruby files per http://redmine.ruby-lang.org/projects/ruby/wiki/DeveloperHowto#coding-style Patch by Steve Klabnik [Ruby 1.9 - Bug #4730] Patch by Jason Dew [Ruby 1.9 - Feature #4718] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@31635 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2011-05-18 17:19:18 -04:00			`case seen[abbrev] += 1`
			`when 1`
			`table[abbrev] = word`
			`when 2`
			`table.delete(abbrev)`
			`else`
			`break`
			`end`
* lib/generator.rb: A new library which converts an internal iterator to an external iterator. * lib/abbrev.rb: A new library which creates an abbreviation table from a list. git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@4767 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2003-10-14 16:14:20 -04:00			`end`
			`end`

			`words.each do \|word\|`
			`next if pattern && pattern !~ word`

			`table[word] = word`
			`end`

			`table`
			`end`

			`module_function :abbrev`
			`end`

			`class Array`
RDoc abbrev git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@5513 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2004-01-20 00:27:23 -05:00			`# Calculates the set of unambiguous abbreviations for the strings in`
* lib/abbrev.rb: Fixed typo in abbrev pattern documentation. Based on patch by Mark Rushakoff. [ruby-trunk - #6346] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@35584 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2012-05-07 19:55:53 -04:00			`# +self+.`
			`#`
* lib/abbrev.rb: Documentation examples for Abbrev. [ruby-dev:47442] [Bug #6985] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@37113 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2012-10-06 16:03:26 -04:00			`# abbr = %w{ car cone }.abbrev`
			`# abbr #=> { "ca" => "car", "car" => "car",`
			`# "co" => "cone", "con" => "cone",`
			`# "cone" => "cone" }`
			`#`
* lib/abbrev.rb: Fixed typo in abbrev pattern documentation. Based on patch by Mark Rushakoff. [ruby-trunk - #6346] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@35584 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2012-05-07 19:55:53 -04:00			`# The optional +pattern+ parameter is a pattern or a string. Only`
			`# input strings that match the pattern or start with the string`
			`# are included in the output hash.`
RDoc abbrev git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@5513 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2004-01-20 00:27:23 -05:00			`#`
* lib/abbrev.rb: Documentation examples for Abbrev. [ruby-dev:47442] [Bug #6985] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@37113 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2012-10-06 16:03:26 -04:00			`# abbr = %w{ fast boat day }.abbrev(/^.a.*$/)`
			`# abbr #=> {"fas"=>"fast","fa"=>"fast",`
			`# "da"=>"day", "fast"=>"fast", "day"=>"day"}`
* lib/abbrev.rb: Fixed typo in abbrev pattern documentation. Based on patch by Mark Rushakoff. [ruby-trunk - #6346] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@35584 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2012-05-07 19:55:53 -04:00			`#`
* lib/abbrev.rb: Documentation examples for Abbrev. [ruby-dev:47442] [Bug #6985] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@37113 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2012-10-06 16:03:26 -04:00			`# See also Abbrev.abbrev`
* lib/generator.rb: A new library which converts an internal iterator to an external iterator. * lib/abbrev.rb: A new library which creates an abbreviation table from a list. git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@4767 b2dd03c8-39d4-4d8f-98ff-823fe69b080e 2003-10-14 16:14:20 -04:00			`def abbrev(pattern = nil)`
			`Abbrev::abbrev(self, pattern)`
			`end`
			`end`

			`if $0 == __FILE__`
			`while line = gets`
			`hash = line.split.abbrev`

			`hash.sort.each do \|k, v\|`
			`puts "#{k} => #{v}"`
			`end`
			`end`
			`end`