From 61dc0d24f56e616387a9379cd1992e96d0be1945 Mon Sep 17 00:00:00 2001 From: Jens Wille Date: Mon, 9 Feb 2015 11:23:18 +0100 Subject: [PATCH] v1.8.6 --- ChangeLog | 2 +- README | 4 ++-- lib/lingo/version.rb | 2 +- lingo.gemspec | 38 +++++++++++++++++++------------------- 4 files changed, 23 insertions(+), 23 deletions(-) diff --git a/ChangeLog b/ChangeLog index 48e9969d..e267adb7 100644 --- a/ChangeLog +++ b/ChangeLog @@ -2,7 +2,7 @@ = Revision history for Lingo -== 1.8.6 [unreleased] +== 1.8.6 [2015-02-09] * Lingo::Attendee::VectorFilter learned +pos+ option to print position and byte offset with each word. diff --git a/README b/README index 4725aa96..cd61a0e3 100644 --- a/README +++ b/README @@ -35,7 +35,7 @@ == VERSION -This documentation refers to Lingo version 1.8.5 +This documentation refers to Lingo version 1.8.6 == DESCRIPTION @@ -584,7 +584,7 @@ Lingo is based on a collective development by Klaus Lepsky and John Vorhauer. == LICENSE AND COPYRIGHT Copyright (C) 2005-2007 John Vorhauer -Copyright (C) 2007-2014 John Vorhauer, Jens Wille +Copyright (C) 2007-2015 John Vorhauer, Jens Wille Lingo is free software: you can redistribute it and/or modify it under the terms of the GNU Affero General Public License as published by the Free diff --git a/lib/lingo/version.rb b/lib/lingo/version.rb index e8dcfed0..cc10b0f8 100644 --- a/lib/lingo/version.rb +++ b/lib/lingo/version.rb @@ -4,7 +4,7 @@ module Version MAJOR = 1 MINOR = 8 - TINY = 5 + TINY = 6 class << self diff --git a/lingo.gemspec b/lingo.gemspec index 6fe71fd5..a246eaa5 100644 --- a/lingo.gemspec +++ b/lingo.gemspec @@ -1,63 +1,63 @@ # -*- encoding: utf-8 -*- -# stub: lingo 1.8.5 ruby lib +# stub: lingo 1.8.6 ruby lib Gem::Specification.new do |s| s.name = "lingo" - s.version = "1.8.5" + s.version = "1.8.6" s.required_rubygems_version = Gem::Requirement.new(">= 0") if s.respond_to? :required_rubygems_version= s.require_paths = ["lib"] s.authors = ["John Vorhauer", "Jens Wille"] - s.date = "2014-10-02" + s.date = "2015-02-09" s.description = "Lingo is an open source indexing system for research and teachings.\nThe main functions of Lingo are:\n\n* identification of (i.e. reduction to) basic word form by means of\n dictionaries and suffix lists\n* algorithmic decomposition\n* dictionary-based synonymisation and identification of phrases\n* generic identification of phrases/word sequences based on patterns\n of word classes\n" s.email = ["lingo@vorhauer.de", "jens.wille@gmail.com"] s.executables = ["lingo", "lingoctl", "lingosrv", "lingoweb"] s.extra_rdoc_files = ["README", "COPYING", "ChangeLog"] - s.files = ["COPYING", "ChangeLog", "README", "Rakefile", "bin/lingo", "bin/lingoctl", "bin/lingosrv", "bin/lingoweb", "de.lang", "de/lingo-abk.txt", "de/lingo-dic.txt", "de/lingo-mul.txt", "de/lingo-syn.txt", "de/test_dic.txt", "de/test_gen.txt", "de/test_mu2.txt", "de/test_mul.txt", "de/test_sgw.txt", "de/test_syn.txt", "de/user-dic.txt", "en.lang", "en/lingo-dic.txt", "en/lingo-irr.txt", "en/lingo-mul.txt", "en/lingo-syn.txt", "en/lingo-wdn.txt", "en/user-dic.txt", "lib/lingo.rb", "lib/lingo/agenda_item.rb", "lib/lingo/app.rb", "lib/lingo/attendee.rb", "lib/lingo/attendee/abbreviator.rb", "lib/lingo/attendee/debugger.rb", "lib/lingo/attendee/decomposer.rb", "lib/lingo/attendee/dehyphenizer.rb", "lib/lingo/attendee/formatter.rb", "lib/lingo/attendee/multi_worder.rb", "lib/lingo/attendee/noneword_filter.rb", "lib/lingo/attendee/object_filter.rb", "lib/lingo/attendee/sequencer.rb", "lib/lingo/attendee/stemmer.rb", "lib/lingo/attendee/stemmer/porter.rb", "lib/lingo/attendee/synonymer.rb", "lib/lingo/attendee/text_reader.rb", "lib/lingo/attendee/text_writer.rb", "lib/lingo/attendee/tokenizer.rb", "lib/lingo/attendee/variator.rb", "lib/lingo/attendee/vector_filter.rb", "lib/lingo/attendee/word_searcher.rb", "lib/lingo/buffered_attendee.rb", "lib/lingo/call.rb", "lib/lingo/cli.rb", "lib/lingo/config.rb", "lib/lingo/ctl.rb", "lib/lingo/database.rb", "lib/lingo/database/crypter.rb", "lib/lingo/database/gdbm_store.rb", "lib/lingo/database/hash_store.rb", "lib/lingo/database/libcdb_store.rb", "lib/lingo/database/progress.rb", "lib/lingo/database/sdbm_store.rb", "lib/lingo/database/source.rb", "lib/lingo/database/source/key_value.rb", "lib/lingo/database/source/multi_key.rb", "lib/lingo/database/source/multi_value.rb", "lib/lingo/database/source/single_word.rb", "lib/lingo/database/source/word_class.rb", "lib/lingo/debug.rb", "lib/lingo/error.rb", "lib/lingo/language.rb", "lib/lingo/language/char.rb", "lib/lingo/language/dictionary.rb", "lib/lingo/language/grammar.rb", "lib/lingo/language/lexical.rb", "lib/lingo/language/lexical_hash.rb", "lib/lingo/language/token.rb", "lib/lingo/language/word.rb", "lib/lingo/language/word_form.rb", "lib/lingo/progress.rb", "lib/lingo/srv.rb", "lib/lingo/srv/config.ru", "lib/lingo/srv/lingosrv.cfg", "lib/lingo/srv/public/.gitkeep", "lib/lingo/version.rb", "lib/lingo/web.rb", "lib/lingo/web/config.ru", "lib/lingo/web/lingoweb.cfg", "lib/lingo/web/public/lingo.png", "lib/lingo/web/public/lingoweb.css", "lib/lingo/web/views/index.erb", "lingo-call.cfg", "lingo.cfg", "lingo.rb", "lir.cfg", "ru.lang", "ru/lingo-dic.txt", "ru/lingo-mul.txt", "ru/lingo-syn.txt", "ru/user-dic.txt", "spec/spec_helper.rb", "test/attendee/ts_abbreviator.rb", "test/attendee/ts_decomposer.rb", "test/attendee/ts_multi_worder.rb", "test/attendee/ts_noneword_filter.rb", "test/attendee/ts_object_filter.rb", "test/attendee/ts_sequencer.rb", "test/attendee/ts_stemmer.rb", "test/attendee/ts_synonymer.rb", "test/attendee/ts_text_reader.rb", "test/attendee/ts_text_writer.rb", "test/attendee/ts_tokenizer.rb", "test/attendee/ts_variator.rb", "test/attendee/ts_vector_filter.rb", "test/attendee/ts_word_searcher.rb", "test/lir.txt", "test/lir.vec", "test/lir2.txt", "test/mul.txt", "test/ref/artikel.mul", "test/ref/artikel.non", "test/ref/artikel.seq", "test/ref/artikel.syn", "test/ref/artikel.vec", "test/ref/artikel.ven", "test/ref/artikel.ver", "test/ref/lir.mul", "test/ref/lir.non", "test/ref/lir.seq", "test/ref/lir.syn", "test/ref/lir.vec", "test/test_helper.rb", "test/ts_database.rb", "test/ts_language.rb", "txt/artikel-en.txt", "txt/artikel-ru.txt", "txt/artikel.txt", "txt/lir.txt"] + s.files = ["COPYING", "ChangeLog", "README", "Rakefile", "bin/lingo", "bin/lingoctl", "bin/lingosrv", "bin/lingoweb", "config/lingo-call.cfg", "config/lingo.cfg", "config/lir.cfg", "dict/de/lingo-abk.txt", "dict/de/lingo-dic.txt", "dict/de/lingo-mul.txt", "dict/de/lingo-syn.txt", "dict/de/test_dic.txt", "dict/de/test_gen.txt", "dict/de/test_mu2.txt", "dict/de/test_mul.txt", "dict/de/test_sgw.txt", "dict/de/test_syn.txt", "dict/de/user-dic.txt", "dict/en/lingo-dic.txt", "dict/en/lingo-irr.txt", "dict/en/lingo-mul.txt", "dict/en/lingo-syn.txt", "dict/en/lingo-wdn.txt", "dict/en/user-dic.txt", "dict/ru/lingo-dic.txt", "dict/ru/lingo-mul.txt", "dict/ru/lingo-syn.txt", "dict/ru/user-dic.txt", "lang/de.lang", "lang/en.lang", "lang/ru.lang", "lib/lingo.rb", "lib/lingo/app.rb", "lib/lingo/attendee.rb", "lib/lingo/attendee/abbreviator.rb", "lib/lingo/attendee/debugger.rb", "lib/lingo/attendee/decomposer.rb", "lib/lingo/attendee/dehyphenizer.rb", "lib/lingo/attendee/formatter.rb", "lib/lingo/attendee/multi_worder.rb", "lib/lingo/attendee/noneword_filter.rb", "lib/lingo/attendee/object_filter.rb", "lib/lingo/attendee/sequencer.rb", "lib/lingo/attendee/stemmer.rb", "lib/lingo/attendee/stemmer/porter.rb", "lib/lingo/attendee/synonymer.rb", "lib/lingo/attendee/text_reader.rb", "lib/lingo/attendee/text_writer.rb", "lib/lingo/attendee/tokenizer.rb", "lib/lingo/attendee/variator.rb", "lib/lingo/attendee/vector_filter.rb", "lib/lingo/attendee/word_searcher.rb", "lib/lingo/buffered_attendee.rb", "lib/lingo/call.rb", "lib/lingo/cli.rb", "lib/lingo/config.rb", "lib/lingo/ctl.rb", "lib/lingo/database.rb", "lib/lingo/database/crypter.rb", "lib/lingo/database/gdbm_store.rb", "lib/lingo/database/hash_store.rb", "lib/lingo/database/libcdb_store.rb", "lib/lingo/database/progress.rb", "lib/lingo/database/sdbm_store.rb", "lib/lingo/database/source.rb", "lib/lingo/database/source/key_value.rb", "lib/lingo/database/source/multi_key.rb", "lib/lingo/database/source/multi_value.rb", "lib/lingo/database/source/single_word.rb", "lib/lingo/database/source/word_class.rb", "lib/lingo/debug.rb", "lib/lingo/deferred_attendee.rb", "lib/lingo/error.rb", "lib/lingo/language.rb", "lib/lingo/language/char.rb", "lib/lingo/language/dictionary.rb", "lib/lingo/language/grammar.rb", "lib/lingo/language/lexical.rb", "lib/lingo/language/lexical_hash.rb", "lib/lingo/language/token.rb", "lib/lingo/language/word.rb", "lib/lingo/language/word_form.rb", "lib/lingo/progress.rb", "lib/lingo/srv.rb", "lib/lingo/srv/config.ru", "lib/lingo/srv/lingosrv.cfg", "lib/lingo/srv/public/.gitkeep", "lib/lingo/version.rb", "lib/lingo/web.rb", "lib/lingo/web/config.ru", "lib/lingo/web/lingoweb.cfg", "lib/lingo/web/public/lingo.png", "lib/lingo/web/public/lingoweb.css", "lib/lingo/web/views/index.erb", "test/attendee/ts_abbreviator.rb", "test/attendee/ts_decomposer.rb", "test/attendee/ts_multi_worder.rb", "test/attendee/ts_noneword_filter.rb", "test/attendee/ts_object_filter.rb", "test/attendee/ts_sequencer.rb", "test/attendee/ts_stemmer.rb", "test/attendee/ts_synonymer.rb", "test/attendee/ts_text_reader.rb", "test/attendee/ts_text_writer.rb", "test/attendee/ts_tokenizer.rb", "test/attendee/ts_variator.rb", "test/attendee/ts_vector_filter.rb", "test/attendee/ts_word_searcher.rb", "test/lir.txt", "test/lir.vec", "test/lir2.txt", "test/mul.txt", "test/ref/artikel.mul", "test/ref/artikel.non", "test/ref/artikel.seq", "test/ref/artikel.syn", "test/ref/artikel.vec", "test/ref/artikel.vef", "test/ref/artikel.ven", "test/ref/artikel.ver", "test/ref/artikel.vet", "test/ref/lir.mul", "test/ref/lir.non", "test/ref/lir.seq", "test/ref/lir.syn", "test/ref/lir.vec", "test/ref/lir.vef", "test/ref/lir.ven", "test/ref/lir.ver", "test/ref/lir.vet", "test/test_helper.rb", "test/ts_database.rb", "test/ts_language.rb", "txt/artikel-en.txt", "txt/artikel-ru.txt", "txt/artikel.txt", "txt/lir.txt"] s.homepage = "http://lex-lingo.de" s.licenses = ["AGPL-3.0"] - s.post_install_message = "\nlingo-1.8.5 [2014-10-02]:\n\n* Dictionary values (projections) are no longer sorted; hence, order of\n definition affects processing.\n* Lexicals in Lingo::Language::Word are no longer sorted; in particular,\n compound parts keep their original order.\n* Lexicals in Lingo::Language::Word are no longer cleaned from duplicates.\n* Compiled dictionaries are updated whenever the Lingo version or their\n configuration changes, not only when the source file's size or modification\n time changes.\n* Lingo::Attendee::Synonymer learned compound-parts option to also\n generate synonyms for compound parts when set to +true+.\n* Lingo::Attendee::TextReader learned better PDF-to-text conversion using the\n +pdftotext+ command; specify filter: pdftotext in the config.\n* Lingo::Attendee::VectorFilter learned +dict+ option to print words in\n dictionary format (viz. Lingo::Database::Source::WordClass).\n* Lingo::Attendee::VectorFilter learned +preamble+ option to print current\n configuration to the beginning of the log file (debug: 'true');\n set preamble: false to disable.\n* Multiword dictionaries compiled from base forms can now generate inflected\n adjectives based on the gender of the head noun; set inflect: true\n in the dictionary config.\n* Lingo::Database::Source::WordClass supports gender information being encoded\n in the dictionary as well as shorthand notation for multiple word\n classes/genders.\n* Lingo::Database::Source::WordClass supports compounds being encoded in the\n dictionary (appending + to their parts' word classes is\n recommended).\n* Lingo::Database::Source removes leading and trailing whitespace from\n dictionary lines.\n* Lingo::Database::Crypter uses OpenSSL to encrypt/decrypt dictionaries.\n Note: Can't decrypt dictionaries encrypted with the old scheme anymore.\n* Lingo::Attendee::Tokenizer learned subset of MediaWiki syntax.\n* Eliminated pathological behaviour of the +URLS+ rule in\n Lingo::Attendee::Tokenizer.\n* Fixed regression introduced in 1.8.2 where combine: all would no\n longer work in Lingo::Attendee::MultiWorder.\n* Updated and extended Russian dictionaries. (Yulia Dorokhova, Thomas M\u{fc}ller)\n* +lingoctl+ no longer overwrites existing files without confirmation.\n* +lingoctl+ learned +archive+ command.\n* Dictionary cleanup.\n\n" - s.rdoc_options = ["--title", "lingo Application documentation (v1.8.5)", "--charset", "UTF-8", "--line-numbers", "--all", "--main", "README"] + s.post_install_message = "\nlingo-1.8.6 [2015-02-09]:\n\n* Lingo::Attendee::VectorFilter learned +pos+ option to print position and\n byte offset with each word.\n* Lingo::Attendee::VectorFilter learned +tfidf+ option to sort results based\n on their tf\u{2013}idf[https://en.wikipedia.org/wiki/Tf\u{2013}idf] score; the document\n frequencies are calculated over the \"corpus\" of all files processed during\n a single program invocation.\n* Lingo::Attendee::VectorFilter learned +tokens+ option to filter on\n Lingo::Language::Token in addition to Lingo::Language::Word.\n* Lingo::Attendee::VectorFilter no longer supports +debug+ (as well as\n +prompt+ and +preamble+); use Lingo::Attendee::DebugFilter instead.\n* Lingo::Attendee::TextReader no longer removes line endings; option +chomp+\n is obsolete.\n* Lingo::Attendee::TextReader passes byte offset to the following attendee.\n* Lingo::Attendee::Tokenizer records token's byte offset.\n* Lingo::Attendee::Tokenizer records token's sequence position.\n* Lingo::Attendee::Tokenizer learned skip-tags option to skip over\n specified tags' contents.\n* Lingo::Attendee subclasses warn when invalid or obsolete options or names\n are used.\n* Changed German infix substitution +/en+ to +ch/chen+ in order to prevent\n overly aggressive identifications.\n* Internal refactoring and API changes.\n\n" + s.rdoc_options = ["--title", "lingo Application documentation (v1.8.6)", "--charset", "UTF-8", "--line-numbers", "--all", "--main", "README"] s.required_ruby_version = Gem::Requirement.new(">= 1.9.3") - s.rubygems_version = "2.4.2" + s.rubygems_version = "2.4.5" s.summary = "The full-featured automatic indexing system" if s.respond_to? :specification_version then s.specification_version = 4 if Gem::Version.new(Gem::VERSION) >= Gem::Version.new('1.2.0') then - s.add_runtime_dependency(%q, [">= 0.0.4", "~> 0.0"]) - s.add_runtime_dependency(%q, ["~> 1.0"]) + s.add_runtime_dependency(%q, ["~> 0.1"]) + s.add_runtime_dependency(%q, ["~> 1.1"]) s.add_runtime_dependency(%q, ["~> 1.1"]) s.add_runtime_dependency(%q, ["~> 0.0"]) s.add_runtime_dependency(%q, ["~> 0.4"]) s.add_development_dependency(%q, ["~> 1.2"]) s.add_development_dependency(%q, ["~> 1.3"]) - s.add_development_dependency(%q, [">= 0"]) + s.add_development_dependency(%q, [">= 0.8.1", "~> 0.8"]) s.add_development_dependency(%q, [">= 0"]) - s.add_development_dependency(%q, [">= 0"]) + s.add_development_dependency(%q, [">= 0"]) else - s.add_dependency(%q, [">= 0.0.4", "~> 0.0"]) - s.add_dependency(%q, ["~> 1.0"]) + s.add_dependency(%q, ["~> 0.1"]) + s.add_dependency(%q, ["~> 1.1"]) s.add_dependency(%q, ["~> 1.1"]) s.add_dependency(%q, ["~> 0.0"]) s.add_dependency(%q, ["~> 0.4"]) s.add_dependency(%q, ["~> 1.2"]) s.add_dependency(%q, ["~> 1.3"]) - s.add_dependency(%q, [">= 0"]) + s.add_dependency(%q, [">= 0.8.1", "~> 0.8"]) s.add_dependency(%q, [">= 0"]) - s.add_dependency(%q, [">= 0"]) + s.add_dependency(%q, [">= 0"]) end else - s.add_dependency(%q, [">= 0.0.4", "~> 0.0"]) - s.add_dependency(%q, ["~> 1.0"]) + s.add_dependency(%q, ["~> 0.1"]) + s.add_dependency(%q, ["~> 1.1"]) s.add_dependency(%q, ["~> 1.1"]) s.add_dependency(%q, ["~> 0.0"]) s.add_dependency(%q, ["~> 0.4"]) s.add_dependency(%q, ["~> 1.2"]) s.add_dependency(%q, ["~> 1.3"]) - s.add_dependency(%q, [">= 0"]) + s.add_dependency(%q, [">= 0.8.1", "~> 0.8"]) s.add_dependency(%q, [">= 0"]) - s.add_dependency(%q, [">= 0"]) + s.add_dependency(%q, [">= 0"]) end end