diff options
Diffstat (limited to 'lib')
-rw-r--r-- | lib/Ninka.pm | 26 | ||||
-rw-r--r-- | lib/Ninka/CommentExtractor.pm | 24 | ||||
-rw-r--r-- | lib/Ninka/Copyright.SCOWL | 230 | ||||
-rw-r--r-- | lib/Ninka/FileCleaner.pm | 24 | ||||
-rw-r--r-- | lib/Ninka/LicenseMatcher.pm | 22 | ||||
-rw-r--r-- | lib/Ninka/LicenseRules.pm | 22 | ||||
-rw-r--r-- | lib/Ninka/README.txt | 9 | ||||
-rw-r--r-- | lib/Ninka/SentenceExtractor.pm | 15 |
8 files changed, 73 insertions, 299 deletions
diff --git a/lib/Ninka.pm b/lib/Ninka.pm index dc9fbff..8f454cd 100644 --- a/lib/Ninka.pm +++ b/lib/Ninka.pm @@ -68,7 +68,7 @@ __END__ =head1 NAME -Ninka - Find licenses in source files. +Ninka - source file license identification tool =head1 SYNOPSIS @@ -82,23 +82,23 @@ Ninka - Find licenses in source files. =head1 DESCRIPTION -Scans a file and returns the found licenses. +Scans a source file and returns the found licenses. =head1 COPYRIGHT AND LICENSE - Copyright (C) 2009-2014 Yuki Manabe and Daniel M. German +Copyright (C) 2009-2014 Yuki Manabe and Daniel M. German - This program is free software: you can redistribute it and/or modify - it under the terms of the GNU General Public License as - published by the Free Software Foundation; either version 2 of the - License, or (at your option) any later version. +This program is free software: you can redistribute it and/or modify +it under the terms of the GNU General Public License as +published by the Free Software Foundation; either version 2 of the +License, or (at your option) any later version. - This program is distributed in the hope that it will be useful, - but WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - GNU General Public License for more details. +This program is distributed in the hope that it will be useful, +but WITHOUT ANY WARRANTY; without even the implied warranty of +MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +GNU General Public License for more details. - You should have received a copy of the GNU General Public License - along with this program. If not, see <http://www.gnu.org/licenses/>. +You should have received a copy of the GNU General Public License +along with this program. If not, see <http://www.gnu.org/licenses/>. =cut diff --git a/lib/Ninka/CommentExtractor.pm b/lib/Ninka/CommentExtractor.pm index fd62c02..8a2e66f 100644 --- a/lib/Ninka/CommentExtractor.pm +++ b/lib/Ninka/CommentExtractor.pm @@ -93,19 +93,19 @@ If no comment extractor is known for a language, then extracts top lines from so =head1 COPYRIGHT AND LICENSE - Copyright (C) 2009-2014 Yuki Manabe and Daniel M. German +Copyright (C) 2009-2014 Yuki Manabe and Daniel M. German - This program is free software: you can redistribute it and/or modify - it under the terms of the GNU General Public License as - published by the Free Software Foundation; either version 2 of the - License, or (at your option) any later version. +This program is free software: you can redistribute it and/or modify +it under the terms of the GNU General Public License as +published by the Free Software Foundation; either version 2 of the +License, or (at your option) any later version. - This program is distributed in the hope that it will be useful, - but WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - GNU General Public License for more details. +This program is distributed in the hope that it will be useful, +but WITHOUT ANY WARRANTY; without even the implied warranty of +MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +GNU General Public License for more details. - You should have received a copy of the GNU General Public License - along with this program. If not, see <http://www.gnu.org/licenses/>. +You should have received a copy of the GNU General Public License +along with this program. If not, see <http://www.gnu.org/licenses/>. -=cut
\ No newline at end of file +=cut diff --git a/lib/Ninka/Copyright.SCOWL b/lib/Ninka/Copyright.SCOWL deleted file mode 100644 index a4654a3..0000000 --- a/lib/Ninka/Copyright.SCOWL +++ /dev/null @@ -1,230 +0,0 @@ -The collective work is Copyright 2000-2015 by Kevin Atkinson as well -as any of the copyrights mentioned below: - - Copyright 2000-2015 by Kevin Atkinson - - Permission to use, copy, modify, distribute and sell these word - lists, the associated scripts, the output created from the scripts, - and its documentation for any purpose is hereby granted without fee, - provided that the above copyright notice appears in all copies and - that both that copyright notice and this permission notice appear in - supporting documentation. Kevin Atkinson makes no representations - about the suitability of this array for any purpose. It is provided - "as is" without express or implied warranty. - -Alan Beale <biljir@pobox.com> also deserves special credit as he has, -in addition to providing the 12Dicts package and being a major -contributor to the ENABLE word list, given me an incredible amount of -feedback and created a number of special lists (those found in the -Supplement) in order to help improve the overall quality of SCOWL. - -The 10 level includes the 1000 most common English words (according to -the Moby (TM) Words II [MWords] package), a subset of the 1000 most -common words on the Internet (again, according to Moby Words II), and -frequently class 16 from Brian Kelk's "UK English Wordlist -with Frequency Classification". - -The MWords package was explicitly placed in the public domain: - - The Moby lexicon project is complete and has - been place into the public domain. Use, sell, - rework, excerpt and use in any way on any platform. - - Placing this material on internal or public servers is - also encouraged. The compiler is not aware of any - export restrictions so freely distribute world-wide. - - You can verify the public domain status by contacting - - Grady Ward - 3449 Martha Ct. - Arcata, CA 95521-4884 - - grady@netcom.com - grady@northcoast.com - -The "UK English Wordlist With Frequency Classification" is also in the -Public Domain: - - Date: Sat, 08 Jul 2000 20:27:21 +0100 - From: Brian Kelk <Brian.Kelk@cl.cam.ac.uk> - - > I was wondering what the copyright status of your "UK English - > Wordlist With Frequency Classification" word list as it seems to - > be lacking any copyright notice. - - There were many many sources in total, but any text marked - "copyright" was avoided. Locally-written documentation was one - source. An earlier version of the list resided in a filespace called - PUBLIC on the University mainframe, because it was considered public - domain. - - Date: Tue, 11 Jul 2000 19:31:34 +0100 - - > So are you saying your word list is also in the public domain? - - That is the intention. - -The 20 level includes frequency classes 7-15 from Brian's word list. - -The 35 level includes frequency classes 2-6 and words appearing in at -least 11 of 12 dictionaries as indicated in the 12Dicts package. All -words from the 12Dicts package have had likely inflections added via -my inflection database. - -The 12Dicts package and Supplement is in the Public Domain. - -The WordNet database, which was used in the creation of the -Inflections database, is under the following copyright: - - This software and database is being provided to you, the LICENSEE, - by Princeton University under the following license. By obtaining, - using and/or copying this software and database, you agree that you - have read, understood, and will comply with these terms and - conditions.: - - Permission to use, copy, modify and distribute this software and - database and its documentation for any purpose and without fee or - royalty is hereby granted, provided that you agree to comply with - the following copyright notice and statements, including the - disclaimer, and that the same appear on ALL copies of the software, - database and documentation, including modifications that you make - for internal use or for distribution. - - WordNet 1.6 Copyright 1997 by Princeton University. All rights - reserved. - - THIS SOFTWARE AND DATABASE IS PROVIDED "AS IS" AND PRINCETON - UNIVERSITY MAKES NO REPRESENTATIONS OR WARRANTIES, EXPRESS OR - IMPLIED. BY WAY OF EXAMPLE, BUT NOT LIMITATION, PRINCETON - UNIVERSITY MAKES NO REPRESENTATIONS OR WARRANTIES OF MERCHANT- - ABILITY OR FITNESS FOR ANY PARTICULAR PURPOSE OR THAT THE USE OF THE - LICENSED SOFTWARE, DATABASE OR DOCUMENTATION WILL NOT INFRINGE ANY - THIRD PARTY PATENTS, COPYRIGHTS, TRADEMARKS OR OTHER RIGHTS. - - The name of Princeton University or Princeton may not be used in - advertising or publicity pertaining to distribution of the software - and/or database. Title to copyright in this software, database and - any associated documentation shall at all times remain with - Princeton University and LICENSEE agrees to preserve same. - -The 40 level includes words from Alan's 3esl list found in version 4.0 -of his 12dicts package. Like his other stuff the 3esl list is also in the -public domain. - -The 50 level includes Brian's frequency class 1, words appearing -in at least 5 of 12 of the dictionaries as indicated in the 12Dicts -package, and uppercase words in at least 4 of the previous 12 -dictionaries. A decent number of proper names is also included: The -top 1000 male, female, and Last names from the 1990 Census report; a -list of names sent to me by Alan Beale; and a few names that I added -myself. Finally a small list of abbreviations not commonly found in -other word lists is included. - -The name files form the Census report is a government document which I -don't think can be copyrighted. - -The file special-jargon.50 uses common.lst and word.lst from the -"Unofficial Jargon File Word Lists" which is derived from "The Jargon -File". All of which is in the Public Domain. This file also contain -a few extra UNIX terms which are found in the file "unix-terms" in the -special/ directory. - -The 55 level includes words from Alan's 2of4brif list found in version -4.0 of his 12dicts package. Like his other stuff the 2of4brif is also -in the public domain. - -The 60 level includes all words appearing in at least 2 of the 12 -dictionaries as indicated by the 12Dicts package. - -The 70 level includes Brian's frequency class 0 and the 74,550 common -dictionary words from the MWords package. The common dictionary words, -like those from the 12Dicts package, have had all likely inflections -added. The 70 level also included the 5desk list from version 4.0 of -the 12Dics package which is in the public domain. - -The 80 level includes the ENABLE word list, all the lists in the -ENABLE supplement package (except for ABLE), the "UK Advanced Cryptics -Dictionary" (UKACD), the list of signature words from the YAWL package, -and the 10,196 places list from the MWords package. - -The ENABLE package, mainted by M\Cooper <thegrendel@theriver.com>, -is in the Public Domain: - - The ENABLE master word list, WORD.LST, is herewith formally released - into the Public Domain. Anyone is free to use it or distribute it in - any manner they see fit. No fee or registration is required for its - use nor are "contributions" solicited (if you feel you absolutely - must contribute something for your own peace of mind, the authors of - the ENABLE list ask that you make a donation on their behalf to your - favorite charity). This word list is our gift to the Scrabble - community, as an alternate to "official" word lists. Game designers - may feel free to incorporate the WORD.LST into their games. Please - mention the source and credit us as originators of the list. Note - that if you, as a game designer, use the WORD.LST in your product, - you may still copyright and protect your product, but you may *not* - legally copyright or in any way restrict redistribution of the - WORD.LST portion of your product. This *may* under law restrict your - rights to restrict your users' rights, but that is only fair. - -UKACD, by J Ross Beresford <ross@bryson.demon.co.uk>, is under the -following copyright: - - Copyright (c) J Ross Beresford 1993-1999. All Rights Reserved. - - The following restriction is placed on the use of this publication: - if The UK Advanced Cryptics Dictionary is used in a software package - or redistributed in any form, the copyright notice must be - prominently displayed and the text of this document must be included - verbatim. - - There are no other restrictions: I would like to see the list - distributed as widely as possible. - -The 95 level includes the 354,984 single words, 256,772 compound -words, 4,946 female names and the 3,897 male names, and 21,986 names -from the MWords package, ABLE.LST from the ENABLE Supplement, and some -additional words found in my part-of-speech database that were not -found anywhere else. - -Accent information was taken from UKACD. - -My VARCON package was used to create the American, British, and -Canadian word list. - -Since the original word lists used in the VARCON package came -from the Ispell distribution they are under the Ispell copyright: - - Copyright 1993, Geoff Kuenning, Granada Hills, CA - All rights reserved. - - Redistribution and use in source and binary forms, with or without - modification, are permitted provided that the following conditions - are met: - - 1. Redistributions of source code must retain the above copyright - notice, this list of conditions and the following disclaimer. - 2. Redistributions in binary form must reproduce the above copyright - notice, this list of conditions and the following disclaimer in the - documentation and/or other materials provided with the distribution. - 3. All modifications to the source code must be clearly marked as - such. Binary redistributions based on modified source code - must be clearly marked as modified versions in the documentation - and/or other materials provided with the distribution. - (clause 4 removed with permission from Geoff Kuenning) - 5. The name of Geoff Kuenning may not be used to endorse or promote - products derived from this software without specific prior - written permission. - - THIS SOFTWARE IS PROVIDED BY GEOFF KUENNING AND CONTRIBUTORS ``AS - IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT - LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS - FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL GEOFF - KUENNING OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, - INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, - BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; - LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER - CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT - LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN - ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE - POSSIBILITY OF SUCH DAMAGE. diff --git a/lib/Ninka/FileCleaner.pm b/lib/Ninka/FileCleaner.pm index c3dd912..825b1fb 100644 --- a/lib/Ninka/FileCleaner.pm +++ b/lib/Ninka/FileCleaner.pm @@ -49,19 +49,19 @@ Escapes apostrophes and other potentially disturbing characters =head1 COPYRIGHT AND LICENSE - Copyright (C) 2009-2014 Yuki Manabe and Daniel M. German, 2015 Daniele Fognini and Johannes Najjar +Copyright (C) 2009-2014 Yuki Manabe and Daniel M. German, 2015 Daniele Fognini and Johannes Najjar - This program is free software: you can redistribute it and/or modify - it under the terms of the GNU General Public License as - published by the Free Software Foundation; either version 2 of the - License, or (at your option) any later version. +This program is free software: you can redistribute it and/or modify +it under the terms of the GNU General Public License as +published by the Free Software Foundation; either version 2 of the +License, or (at your option) any later version. - This program is distributed in the hope that it will be useful, - but WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - GNU General Public License for more details. +This program is distributed in the hope that it will be useful, +but WITHOUT ANY WARRANTY; without even the implied warranty of +MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +GNU General Public License for more details. - You should have received a copy of the GNU General Public License - along with this program. If not, see <http://www.gnu.org/licenses/>. +You should have received a copy of the GNU General Public License +along with this program. If not, see <http://www.gnu.org/licenses/>. -=cut
\ No newline at end of file +=cut diff --git a/lib/Ninka/LicenseMatcher.pm b/lib/Ninka/LicenseMatcher.pm index 1cb402a..ba73b26 100644 --- a/lib/Ninka/LicenseMatcher.pm +++ b/lib/Ninka/LicenseMatcher.pm @@ -261,19 +261,19 @@ Uses a set of license sentence names as input and outputs license names correspo =head1 COPYRIGHT AND LICENSE - Copyright (C) 2009-2014 Yuki Manabe and Daniel M. German +Copyright (C) 2009-2014 Yuki Manabe and Daniel M. German - This program is free software: you can redistribute it and/or modify - it under the terms of the GNU General Public License as - published by the Free Software Foundation; either version 2 of the - License, or (at your option) any later version. +This program is free software: you can redistribute it and/or modify +it under the terms of the GNU General Public License as +published by the Free Software Foundation; either version 2 of the +License, or (at your option) any later version. - This program is distributed in the hope that it will be useful, - but WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - GNU General Public License for more details. +This program is distributed in the hope that it will be useful, +but WITHOUT ANY WARRANTY; without even the implied warranty of +MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +GNU General Public License for more details. - You should have received a copy of the GNU General Public License - along with this program. If not, see <http://www.gnu.org/licenses/>. +You should have received a copy of the GNU General Public License +along with this program. If not, see <http://www.gnu.org/licenses/>. =cut diff --git a/lib/Ninka/LicenseRules.pm b/lib/Ninka/LicenseRules.pm index c7810c8..ee5af4b 100644 --- a/lib/Ninka/LicenseRules.pm +++ b/lib/Ninka/LicenseRules.pm @@ -96,19 +96,19 @@ Contains rules used by Ninka::LicenseMatcher. =head1 COPYRIGHT AND LICENSE - Copyright (C) 2009-2014 Yuki Manabe and Daniel M. German +Copyright (C) 2009-2014 Yuki Manabe and Daniel M. German - This program is free software: you can redistribute it and/or modify - it under the terms of the GNU General Public License as - published by the Free Software Foundation; either version 2 of the - License, or (at your option) any later version. +This program is free software: you can redistribute it and/or modify +it under the terms of the GNU General Public License as +published by the Free Software Foundation; either version 2 of the +License, or (at your option) any later version. - This program is distributed in the hope that it will be useful, - but WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - GNU General Public License for more details. +This program is distributed in the hope that it will be useful, +but WITHOUT ANY WARRANTY; without even the implied warranty of +MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +GNU General Public License for more details. - You should have received a copy of the GNU General Public License - along with this program. If not, see <http://www.gnu.org/licenses/>. +You should have received a copy of the GNU General Public License +along with this program. If not, see <http://www.gnu.org/licenses/>. =cut diff --git a/lib/Ninka/README.txt b/lib/Ninka/README.txt deleted file mode 100644 index 2ca7f46..0000000 --- a/lib/Ninka/README.txt +++ /dev/null @@ -1,9 +0,0 @@ -This list of abbreviations was extracted from SCOWL (Spell Checker Oriented Word Lists) by by Kevin Atkinson (kevina@gnu.org) version 2015.04.24. - -Specifically it was created from scowl-2015.04.24.tar.gz. by running: - -cat *abbrev* | sort -u > abbreviations.dict - -It also contains some additions by D.M German. - -See Copyright.scowl for license. diff --git a/lib/Ninka/SentenceExtractor.pm b/lib/Ninka/SentenceExtractor.pm index c27d199..6aeee4e 100644 --- a/lib/Ninka/SentenceExtractor.pm +++ b/lib/Ninka/SentenceExtractor.pm @@ -93,7 +93,7 @@ sub execute { $count2++ if ($c ge 'A' && $c le 'z'); } my $clean_sentence = clean_sentence($sentence); - push @clean_sentences, $clean_sentence if $clean_sentence, + push @clean_sentences, $clean_sentence if $clean_sentence; } if ($count1 != $count2) { @@ -251,6 +251,19 @@ Ninka::SentenceExtractor Breaks comments into sentences. +=head1 NOTES + +This list of abbreviations was extracted from SCOWL (Spell Checker Oriented Word Lists) +by Kevin Atkinson (kevina@gnu.org) version 2015.04.24. + +Specifically it was created from scowl-2015.04.24.tar.gz. by running: + + cat *abbrev* | sort -u > abbreviations.dict + +It also contains some additions by D.M German. + +See Copyright.SCOWL for license. + =head1 COPYRIGHT AND LICENSE Author: Paul Clough |