python source code of porter

Project: razzy-spinner (GitHub Link)

razzy-spinner-master
- demo
  - index.php
  - proccess_spin.php
  - assets
    - img
    - fonts
      - roboto
        Roboto-Bold.eot
        Roboto-Regular.ttf
        Roboto-Medium.ttf
        Roboto-Bold.woff
        Roboto-Light.woff
        Roboto-Thin.woff
        Roboto-Light.ttf
        Roboto-Light.eot
        Roboto-Medium.woff2
        Roboto-Thin.eot
        Roboto-Thin.ttf
        Roboto-Medium.woff
        Roboto-Regular.woff2
        Roboto-Regular.woff
        Roboto-Bold.woff2
        Roboto-Regular.eot
        Roboto-Bold.ttf
        Roboto-Medium.eot
        Roboto-Thin.woff2
        Roboto-Light.woff2
    - js
      - inputTags.jquery.min.js
      - inputTags.jquery.js
      - LICENSE
      - materialize.min.js
      - app.js
      - jquery.blockUI.js
      - README.md
      - sweetalert2.min.js
    - font
      - material-design-icons
        Material-Design-Icons.woff
        Material-Design-Icons.woff2
        Material-Design-Icons.ttf
        Material-Design-Icons.eot
        LICENSE.txt
      - roboto
        Roboto-Bold.eot
        Roboto-Regular.ttf
        Roboto-Medium.ttf
        Roboto-Bold.woff
        Roboto-Light.woff
        Roboto-Thin.woff
        Roboto-Light.ttf
        Roboto-Light.eot
        Roboto-Medium.woff2
        Roboto-Thin.eot
        Roboto-Thin.ttf
        Roboto-Medium.woff
        Roboto-Regular.woff2
        Roboto-Regular.woff
        Roboto-Bold.woff2
        Roboto-Regular.eot
        Roboto-Bold.ttf
        Roboto-Medium.eot
        Roboto-Thin.woff2
        Roboto-Light.woff2
    - css
      - inputTags.min.css
      - inputTags.css
      - materialize.min.css
      - materialize.css
      - inputTags.less
      - sweetalert2.min.css
- LICENSE
- autoload.php
- README.md
- core
  - resources
    - lang
  - libs
    - razzy
      - therausus.php
  - classes
    - pos_tagger.class.php
    - cache.class.php
    - spinner.class.php
    - lang.class.php
    - functions.class.php
  - composer.lock
  - snippets
    - countries.php
    - stopwords.php
  - vendor
    - icanboogie
      - inflector
        LICENSE
        lib
        inflector.php
        inflections.php
        inflections
        tr.php
        nb.php
        fr.php
        es.php
        en.php
        pt.php
        helpers.php
        composer.json
        README.md
    - composer
      - autoload_classmap.php
      - LICENSE
      - ClassLoader.php
      - autoload_psr4.php
      - autoload_files.php
      - autoload_real.php
      - autoload_namespaces.php
      - installed.json
    - autoload.php
    - fire015
      - flintstone
        src
        Exception.php
        Cache
        CacheInterface.php
        ArrayCache.php
        Flintstone.php
        Database.php
        Formatter
        SerializeFormatter.php
        JsonFormatter.php
        FormatterInterface.php
        Config.php
        phpunit.xml.dist
        UPGRADE.md
        CHANGELOG.md
        composer.json
        LICENSE.md
        .travis.yml
        README.md
        tests
        ConfigTest.php
        FlintstoneTest.php
        DatabaseTest.php
        .gitignore
  - composer.json
  - bin
    - python
      - en
        numeral.pyc
        commonsense.pyc
        commonsense.py
        rid.py
        quantify.py
        ogden
        __init__.pyc
        __init__.py
        ogden_2000.txt
        tags.pyc
        ordinal.pyc
        article.py
        singular.pyc
        __init__.pyc
        rid.pyc
        article.pyc
        quantify.pyc
        verb
        __init__.pyc
        __init__.py
        singular.py
        tags.py
        __init__.py
        wordnet
        wntools.py
        wordnet2
        compile
        src
        tkAppInit.c
        Makefile.in
        wnb
        stubs.c
        wn.c
        Makefile.am
        ChangeLog
        AUTHORS
        NEWS
        Makefile.in
        include
        wngrind.h
        Makefile
        Makefile.in
        Makefile.am
        wn.h
        acinclude.m4
        INSTALL
        README
        lib
        Makefile.in
        wnhelp.c
        binsrch.c
        wnrtl.c
        search.c
        morph.c
        wnutil.c
        wnres
        license.txt
        Makefile.in
        wngloss.man
        Makefile.am
        wnb.man
        wn.xbm
        Makefile.am
        wnglobal.c
        configure
        COPYING
        configure.ac
        aclocal.m4
        missing
        Makefile.am
        config.h.in
        dict
        adj.exc
        Makefile
        index.adv
        Makefile.in
        noun.exc
        sentidx.vrb
        adv.exc
        sents.vrb
        frames.vrb
        verb.Framestext
        lexnames
        Makefile.am
        verb.exc
        log.grind.2.1
        install-sh
        depcomp
        doc
        pdf
        Makefile
        Makefile.in
        Makefile.am
        Makefile
        Makefile.in
        html
        binsrch.3WN.html
        wnintro.1WN.html
        wnsearch.3WN.html
        wnintro.3WN.html
        Makefile
        wndb.5WN.html
        Makefile.in
        wnlicens.7WN.html
        grind.1WN.html
        lexnames.5WN.html
        wnpkgs.7WN.html
        cntlist.5WN.html
        senseidx.5WN.html
        wn.1WN.html
        wnintro.7WN.html
        morphy.7WN.html
        wnutil.3WN.html
        wngroups.7WN.html
        wnstats.7WN.html
        uniqbeg.7WN.html
        Makefile.am
        wnb.1WN.html
        wninput.5WN.html
        wnintro.5WN.html
        morph.3WN.html
        wngloss.7WN.html
        Makefile.am
        man
        wninput.5
        wnintro.5
        grind.1
        Makefile
        wnlicens.7
        Makefile.in
        morphy.7
        wnutil.3
        wn.1
        wnstats.7
        wnintro.1
        wnintro.7
        senseidx.5
        wndb.5
        wnintro.3
        binsrch.3
        wngloss.7
        lexnames.5
        wnpkgs.7
        Makefile.am
        morph.3
        wnb.1
        wnsearch.3
        wngroups.7
        uniqbeg.7
        cntlist.5
        ps
        wnstats.7.ps
        cntlist.5.ps
        Makefile
        wnlicens.7.ps
        Makefile.in
        uniqbeg.7.ps
        wnintro.1.ps
        grind.1.ps
        wndb.5.ps
        wngroups.7.ps
        wnutil.3.ps
        wnpkgs.7.ps
        wnintro.5.ps
        wngloss.7.ps
        wn.1.ps
        wnintro.7.ps
        wnb.1.ps
        Makefile.am
        morph.3.ps
        wninput.5.ps
        wnsearch.3.ps
        senseidx.5.ps
        lexnames.5.ps
        wnintro.3.ps
        binsrch.3.ps
        morphy.7.ps
        concordance.py
        __init__.pyc
        README.txt
        wordnet.pyc
        docsrc
        index.xml
        build.xml
        download.xml
        styles.in.css
        release-notes.xml
        contributors.xml
        requirements.xml
        publish.xsl
        contributors-src.xml
        format-contributors.xsl
        schemas.xml
        install.xml
        license.xml
        make-navigation.xsl
        examples.xml
        make-css-prefix.xsl
        setup.py
        PKG-INFO
        wntools.pyc
        __init__.py
        docs
        installation.html
        contents.html
        styles.css
        nav.html.inc
        contributors.html
        styles.css.prefix
        release-notes.html
        index.html
        examples.html
        license.html
        download.html
        LICENSE.txt
        wordnet.py
        spelling
        __init__.pyc
        __init__.py
        plural.py
        ordinal.py
        numeral.py
        _en-test.py
        LICENSE.txt
        plural.pyc
        parser
        __init__.pyc
        __init__.py
        nltk_lite
        draw
        srparser.py
        rdparser.py
        plot.py
        chart.py
        __init__.py
        tree.py
        cfg.py
        dispersion.py
        probability.pyc
        utilities.py
        semantics
        utilities.py
        evaluate.py
        logic.py
        __init__.py
        evaluate.py
        corpora
        toolbox.py
        ieer.py
        words.py
        ppattach.py
        timit.py
        conll2000.py
        ycoe.py
        state_union.py
        inaugural.py
        treebank.py
        stopwords.py
        senseval.py
        brown.py
        cmudict.py
        __init__.py
        genesis.py
        names.py
        gutenberg.py
        sinica_treebank.py
        chat
        zen.py
        eliza.py
        rude.py
        iesha.py
        __init__.py
        tag
        hmm.py
        unigram.py
        brill.py
        ngram.py
        __init__.py
        test
        doctest_driver.py
        __init__.py
        probability.py
        stem
        regexp.py
        __init__.py
        porter.py
        parse
        treetransforms.py
        rd.pyc
        featurestructure.pyc
        chunk.pyc
        grammarfile.py
        viterbi.py
        viterbi.pyc
        pchart.py
        cfg.pyc
        chart.pyc
        category.py
        chunk.py
        sr.pyc
        sr.py
        featurechart.py
        __init__.pyc
        tree.pyc
        generate.py
        chart.py
        rd.py
        featurestructure.py
        __init__.py
        tree.py
        pcfg.py
        pcfg.pyc
        cfg.py
        __init__.pyc
        README.txt
        etree
        ElementPath.py
        __init__.py
        ElementInclude.py
        ElementTree.py
        misc
        wordfinder.py
        __init__.py
        sort.py
        LICENSE.TXT
        setup.py
        PKG-INFO
        __init__.py
        wordnet
        wntools.py
        concordance.py
        __init__.py
        wordnet.py
        tokenize
        regexp.py
        simple.pyc
        simple.py
        __init__.pyc
        regexp.pyc
        __init__.py
        model
        __init__.py
        cluster
        gaac.py
        em.py
        __init__.py
        kmeans.py
        contrib
        paradigmquery.py
        hole.py
        combined.py
        featurelite.py
        toolbox
        data.py
        utilities.py
        text.py
        lexicon.py
        __init__.py
        settings.py
        errors.py
        kimmo.py
        __init__.py
        lambda.py
        fsa.py
        featuredemo.py
        marshal.py
        paradigm.py
        marshalbrill.py
        concord.py
        INSTALL.TXT
        Brill_license.txt
      - nltk_core.pyc
      - convert_tense.py
      - __pycache__
        nltk_core.cpython-34.pyc
      - pos_tagger.py
      - nltk
        classify
        util.py
        svm.pyc
        weka.pyc
        rte_classify.py
        decisiontree.py
        __pycache__
        senna.cpython-34.pyc
        tadm.cpython-34.pyc
        maxent.cpython-34.pyc
        textcat.cpython-34.pyc
        megam.cpython-34.pyc
        rte_classify.cpython-34.pyc
        decisiontree.cpython-34.pyc
        weka.cpython-34.pyc
        positivenaivebayes.cpython-34.pyc
        naivebayes.cpython-34.pyc
        scikitlearn.cpython-34.pyc
        api.cpython-34.pyc
        util.cpython-34.pyc
        __init__.cpython-34.pyc
        senna.pyc
        weka.py
        naivebayes.pyc
        positivenaivebayes.pyc
        util.pyc
        __init__.pyc
        textcat.py
        senna.py
        textcat.pyc
        scikitlearn.pyc
        maxent.py
        tadm.pyc
        maxent.pyc
        naivebayes.py
        api.py
        api.pyc
        rte_classify.pyc
        megam.py
        __init__.py
        tadm.py
        svm.py
        decisiontree.pyc
        megam.pyc
        positivenaivebayes.py
        scikitlearn.py
        data.py
        treetransforms.py
        draw
        util.py
        __pycache__
        dispersion.cpython-34.pyc
        tree.cpython-34.pyc
        cfg.cpython-34.pyc
        table.cpython-34.pyc
        util.cpython-34.pyc
        __init__.cpython-34.pyc
        cfg.pyc
        table.py
        util.pyc
        __init__.pyc
        tree.pyc
        __init__.py
        tree.py
        cfg.py
        dispersion.pyc
        dispersion.py
        table.pyc
        toolbox.py
        probability.pyc
        decorators.py
        tgrep.py
        util.py
        decorators.pyc
        lazyimport.py
        featstruct.py
        book.py
        help.pyc
        text.py
        __pycache__
        featstruct.cpython-34.pyc
        decorators.cpython-34.pyc
        grammar.cpython-34.pyc
        tree.cpython-34.pyc
        probability.cpython-34.pyc
        help.cpython-34.pyc
        text.cpython-34.pyc
        compat.cpython-34.pyc
        internals.cpython-34.pyc
        jsontags.cpython-34.pyc
        treetransforms.cpython-34.pyc
        data.cpython-34.pyc
        downloader.cpython-34.pyc
        wsd.cpython-34.pyc
        toolbox.cpython-34.pyc
        util.cpython-34.pyc
        six.cpython-34.pyc
        lazyimport.cpython-34.pyc
        __init__.cpython-34.pyc
        collocations.cpython-34.pyc
        internals.py
        jsontags.py
        collocations.py
        wsd.pyc
        twitter
        util.py
        twitterclient.pyc
        util.pyc
        __init__.pyc
        twitter_demo.py
        api.py
        api.pyc
        twitterclient.py
        common.py
        __init__.py
        common.pyc
        twitter_demo.pyc
        six.py
        translate
        ibm5.pyc
        gdfa.py
        ibm_model.pyc
        gdfa.pyc
        ibm5.py
        stack_decoder.py
        __pycache__
        ibm1.cpython-34.pyc
        ibm_model.cpython-34.pyc
        ibm4.cpython-34.pyc
        ibm5.cpython-34.pyc
        ibm2.cpython-34.pyc
        bleu_score.cpython-34.pyc
        metrics.cpython-34.pyc
        api.cpython-34.pyc
        stack_decoder.cpython-34.pyc
        ibm3.cpython-34.pyc
        __init__.cpython-34.pyc
        ibm1.pyc
        ibm3.py
        phrase_based.pyc
        metrics.py
        ibm_model.py
        ibm2.py
        ibm3.pyc
        gale_church.pyc
        ibm1.py
        __init__.pyc
        ibm4.py
        api.py
        api.pyc
        ibm2.pyc
        gale_church.py
        __init__.py
        metrics.pyc
        bleu_score.pyc
        phrase_based.py
        ibm4.pyc
        stack_decoder.pyc
        bleu_score.py
        corpus
        util.py
        __pycache__
        util.cpython-34.pyc
        __init__.cpython-34.pyc
        util.pyc
        __init__.pyc
        europarl_raw.py
        europarl_raw.pyc
        __init__.py
        reader
        wordlist.py
        toolbox.py
        opinion_lexicon.py
        ieer.py
        tagged.pyc
        chasen.py
        util.py
        indian.pyc
        lin.pyc
        cmudict.pyc
        ppattach.py
        timit.py
        nps_chat.py
        pl196x.pyc
        verbnet.py
        udhr.pyc
        ycoe.py
        nps_chat.pyc
        __pycache__
        conll.cpython-34.pyc
        xmldocs.cpython-34.pyc
        semcor.cpython-34.pyc
        timit.cpython-34.pyc
        verbnet.cpython-34.pyc
        sinica_treebank.cpython-34.pyc
        plaintext.cpython-34.pyc
        senseval.cpython-34.pyc
        nps_chat.cpython-34.pyc
        sentiwordnet.cpython-34.pyc
        nkjp.cpython-34.pyc
        rte.cpython-34.pyc
        comparative_sents.cpython-34.pyc
        bracket_parse.cpython-34.pyc
        categorized_sents.cpython-34.pyc
        childes.cpython-34.pyc
        twitter.cpython-34.pyc
        cmudict.cpython-34.pyc
        knbc.cpython-34.pyc
        chunked.cpython-34.pyc
        ieer.cpython-34.pyc
        opinion_lexicon.cpython-34.pyc
        mte.cpython-34.pyc
        propbank.cpython-34.pyc
        crubadan.cpython-34.pyc
        pl196x.cpython-34.pyc
        wordnet.cpython-34.pyc
        ppattach.cpython-34.pyc
        ycoe.cpython-34.pyc
        nombank.cpython-34.pyc
        udhr.cpython-34.pyc
        indian.cpython-34.pyc
        switchboard.cpython-34.pyc
        tagged.cpython-34.pyc
        chasen.cpython-34.pyc
        string_category.cpython-34.pyc
        ipipan.cpython-34.pyc
        wordlist.cpython-34.pyc
        bnc.cpython-34.pyc
        toolbox.cpython-34.pyc
        pros_cons.cpython-34.pyc
        aligned.cpython-34.pyc
        api.cpython-34.pyc
        util.cpython-34.pyc
        reviews.cpython-34.pyc
        lin.cpython-34.pyc
        framenet.cpython-34.pyc
        __init__.cpython-34.pyc
        dependency.cpython-34.pyc
        string_category.py
        plaintext.pyc
        lin.py
        comparative_sents.pyc
        ieer.pyc
        bnc.py
        semcor.py
        framenet.py
        rte.pyc
        xmldocs.py
        switchboard.pyc
        ipipan.py
        indian.py
        toolbox.pyc
        mte.py
        util.pyc
        propbank.pyc
        __init__.pyc
        wordnet.pyc
        wordlist.pyc
        sinica_treebank.pyc
        chunked.py
        rte.py
        dependency.pyc
        mte.pyc
        switchboard.py
        conll.py
        bracket_parse.pyc
        bnc.pyc
        categorized_sents.py
        nombank.py
        childes.py
        senseval.py
        crubadan.pyc
        bracket_parse.py
        api.py
        reviews.py
        knbc.py
        plaintext.py
        api.pyc
        timit.pyc
        string_category.pyc
        nkjp.pyc
        cmudict.py
        twitter.py
        opinion_lexicon.pyc
        crubadan.py
        __init__.py
        chasen.pyc
        verbnet.pyc
        knbc.pyc
        nombank.pyc
        ppattach.pyc
        sentiwordnet.pyc
        conll.pyc
        pros_cons.py
        sinica_treebank.py
        pros_cons.pyc
        comparative_sents.py
        nkjp.py
        aligned.py
        ipipan.pyc
        senseval.pyc
        sentiwordnet.py
        childes.pyc
        semcor.pyc
        propbank.py
        reviews.pyc
        framenet.pyc
        aligned.pyc
        udhr.py
        dependency.py
        pl196x.py
        tagged.py
        chunked.pyc
        twitter.pyc
        ycoe.pyc
        xmldocs.pyc
        wordnet.py
        categorized_sents.pyc
        chat
        zen.py
        zen.pyc
        util.py
        suntsu.py
        eliza.py
        rude.py
        util.pyc
        __init__.pyc
        suntsu.pyc
        iesha.py
        iesha.pyc
        rude.pyc
        __init__.py
        eliza.pyc
        tag
        crf.py
        perceptron.py
        brill_trainer.py
        hmm.pyc
        hunpos.pyc
        hmm.py
        util.py
        sequential.py
        __pycache__
        stanford.cpython-34.pyc
        senna.cpython-34.pyc
        crf.cpython-34.pyc
        perceptron.cpython-34.pyc
        brill.cpython-34.pyc
        brill_trainer.cpython-34.pyc
        tnt.cpython-34.pyc
        mapping.cpython-34.pyc
        sequential.cpython-34.pyc
        api.cpython-34.pyc
        util.cpython-34.pyc
        hunpos.cpython-34.pyc
        hmm.cpython-34.pyc
        __init__.cpython-34.pyc
        mapping.py
        senna.pyc
        crf.pyc
        util.pyc
        __init__.pyc
        stanford.pyc
        senna.py
        mapping.pyc
        api.py
        api.pyc
        brill.py
        tnt.py
        __init__.py
        hunpos.py
        tnt.pyc
        stanford.py
        sequential.pyc
        brill_trainer.pyc
        perceptron.pyc
        brill.pyc
        test
        childes_fixt.py
        gluesemantics_malt_fixt.pyc
        parse.doctest
        util.doctest
        compat_fixt.pyc
        childes_fixt.pyc
        classify_fixt.pyc
        bleu.doctest
        semantics_fixt.py
        dependency.doctest
        tree.doctest
        sentiwordnet.doctest
        nonmonotonic_fixt.pyc
        wordnet_fixt.py
        gluesemantics_malt.doctest
        discourse.doctest
        portuguese_en.doctest
        generate.doctest
        grammartestsuites.doctest
        translate.doctest
        resolution.doctest
        stem.doctest
        probability.doctest
        wsd.doctest
        paice.doctest
        ccg.doctest
        childes.doctest
        inference.doctest
        tag.doctest
        metrics.doctest
        gluesemantics_malt_fixt.py
        collocations.doctest
        index.doctest
        bnc.doctest
        segmentation_fixt.pyc
        semantics.doctest
        portuguese_en_fixt.pyc
        nonmonotonic.doctest
        __init__.pyc
        toolbox.doctest
        tokenize.doctest
        wordnet_fixt.pyc
        featgram.doctest
        sentiment.doctest
        grammar.doctest
        portuguese_en_fixt.py
        classify_fixt.py
        chunk.doctest
        compat_fixt.py
        treetransforms.doctest
        segmentation_fixt.py
        gensim_fixt.py
        drt.doctest
        japanese.doctest
        framenet.doctest
        gensim.doctest
        crubadan.doctest
        discourse_fixt.pyc
        inference_fixt.pyc
        translate_fixt.pyc
        runtests.py
        doctest_nose_plugin.py
        discourse_fixt.py
        compat.doctest
        __init__.py
        chat80.doctest
        probability_fixt.py
        propbank.doctest
        corpus.doctest
        translate_fixt.py
        semantics_fixt.pyc
        relextract.doctest
        wordnet.doctest
        runtests.pyc
        probability_fixt.pyc
        corpus_fixt.pyc
        gensim_fixt.pyc
        inference_fixt.py
        wordnet_lch.doctest
        corpus_fixt.py
        nonmonotonic_fixt.py
        unit
        test_tgrep.pyc
        test_seekable_unicode_stream_reader.py
        test_json2csv_corpus.py
        test_hmm.pyc
        test_collocations.pyc
        test_stem.py
        test_hmm.py
        test_corpus_views.pyc
        translate
        test_ibm1.pyc
        test_ibm4.pyc
        test_bleu.py
        test_ibm5.pyc
        test_ibm2.pyc
        test_ibm3.py
        __init__.pyc
        test_ibm4.py
        test_stack_decoder.pyc
        test_ibm3.pyc
        test_ibm1.py
        test_ibm_model.py
        test_stack_decoder.py
        test_bleu.pyc
        test_ibm5.py
        __init__.py
        test_ibm_model.pyc
        test_ibm2.py
        test_seekable_unicode_stream_reader.pyc
        test_tag.pyc
        test_stem.pyc
        test_twitter_auth.pyc
        __init__.pyc
        test_tgrep.py
        test_classify.py
        test_2x_compat.py
        test_classify.pyc
        test_naivebayes.pyc
        __init__.py
        utils.py
        test_naivebayes.py
        test_corpus_views.py
        test_corpora.pyc
        test_2x_compat.pyc
        test_twitter_auth.py
        utils.pyc
        test_tag.py
        test_corpora.py
        test_json2csv_corpus.pyc
        test_collocations.py
        all.py
        data.doctest
        logic.doctest
        treeprettyprinter.doctest
        simple.doctest
        classify.doctest
        all.pyc
        featstruct.doctest
        internals.doctest
        misc.doctest
        gluesemantics.doctest
        doctest_nose_plugin.pyc
        probability.py
        stem
        snowball.py
        regexp.py
        util.py
        __pycache__
        lancaster.cpython-34.pyc
        snowball.cpython-34.pyc
        rslp.cpython-34.pyc
        porter.cpython-34.pyc
        regexp.cpython-34.pyc
        wordnet.cpython-34.pyc
        isri.cpython-34.pyc
        api.cpython-34.pyc
        util.cpython-34.pyc
        __init__.cpython-34.pyc
        rslp.py
        lancaster.pyc
        util.pyc
        __init__.pyc
        wordnet.pyc
        snowball.pyc
        porter.pyc
        isri.pyc
        api.py
        api.pyc
        rslp.pyc
        regexp.pyc
        __init__.py
        lancaster.py
        isri.py
        porter.py
        wordnet.py
        parse
        projectivedependencyparser.pyc
        earleychart.py
        util.py
        viterbi.py
        viterbi.pyc
        shiftreduce.py
        pchart.py
        recursivedescent.pyc
        __pycache__
        shiftreduce.cpython-34.pyc
        dependencygraph.cpython-34.pyc
        pchart.cpython-34.pyc
        transitionparser.cpython-34.pyc
        earleychart.cpython-34.pyc
        bllip.cpython-34.pyc
        projectivedependencyparser.cpython-34.pyc
        viterbi.cpython-34.pyc
        malt.cpython-34.pyc
        nonprojectivedependencyparser.cpython-34.pyc
        recursivedescent.cpython-34.pyc
        chart.cpython-34.pyc
        featurechart.cpython-34.pyc
        api.cpython-34.pyc
        util.cpython-34.pyc
        evaluate.cpython-34.pyc
        __init__.cpython-34.pyc
        evaluate.py
        dependencygraph.py
        nonprojectivedependencyparser.py
        nonprojectivedependencyparser.pyc
        bllip.py
        transitionparser.py
        chart.pyc
        evaluate.pyc
        generate.pyc
        earleychart.pyc
        featurechart.py
        util.pyc
        recursivedescent.py
        __init__.pyc
        projectivedependencyparser.py
        stanford.pyc
        shiftreduce.pyc
        generate.py
        chart.py
        api.py
        transitionparser.pyc
        api.pyc
        bllip.pyc
        dependencygraph.pyc
        __init__.py
        malt.py
        stanford.py
        pchart.pyc
        featurechart.pyc
        malt.pyc
        six.pyc
        toolbox.pyc
        treeprettyprinter.py
        util.pyc
        __init__.pyc
        tree.pyc
        misc
        minimalset.py
        wordfinder.py
        __pycache__
        minimalset.cpython-34.pyc
        chomsky.cpython-34.pyc
        babelfish.cpython-34.pyc
        wordfinder.cpython-34.pyc
        __init__.cpython-34.pyc
        chomsky.pyc
        sort.pyc
        babelfish.py
        minimalset.pyc
        babelfish.pyc
        __init__.pyc
        chomsky.py
        __init__.py
        wordfinder.pyc
        sort.py
        data.pyc
        featstruct.pyc
        treetransforms.pyc
        sem
        linearlogic.pyc
        drt_glue_demo.py
        util.py
        glue.py
        cooper_storage.py
        __pycache__
        glue.cpython-34.pyc
        linearlogic.cpython-34.pyc
        boxer.cpython-34.pyc
        lfg.cpython-34.pyc
        drt.cpython-34.pyc
        relextract.cpython-34.pyc
        skolemize.cpython-34.pyc
        logic.cpython-34.pyc
        util.cpython-34.pyc
        evaluate.cpython-34.pyc
        __init__.cpython-34.pyc
        evaluate.py
        glue.pyc
        logic.py
        chat80.py
        logic.pyc
        relextract.py
        linearlogic.py
        evaluate.pyc
        hole.py
        hole.pyc
        drt_glue_demo.pyc
        util.pyc
        boxer.pyc
        __init__.pyc
        lfg.py
        lfg.pyc
        skolemize.py
        __init__.py
        cooper_storage.pyc
        drt.py
        drt.pyc
        skolemize.pyc
        boxer.py
        chat80.pyc
        relextract.pyc
        downloader.py
        grammar.pyc
        jsontags.pyc
        text.pyc
        tbl
        rule.pyc
        erroranalysis.py
        erroranalysis.pyc
        __pycache__
        template.cpython-34.pyc
        feature.cpython-34.pyc
        erroranalysis.cpython-34.pyc
        rule.cpython-34.pyc
        __init__.cpython-34.pyc
        template.pyc
        demo.py
        __init__.pyc
        demo.pyc
        template.py
        rule.py
        api.py
        api.pyc
        feature.pyc
        __init__.py
        feature.py
        sentiment
        sentiment_analyzer.pyc
        util.py
        util.pyc
        sentiment_analyzer.py
        __init__.pyc
        vader.pyc
        __init__.py
        vader.py
        internals.pyc
        collocations.pyc
        lazyimport.pyc
        grammar.py
        VERSION
        tgrep.pyc
        __init__.py
        wsd.py
        chunk
        regexp.py
        util.py
        named_entity.pyc
        __pycache__
        regexp.cpython-34.pyc
        api.cpython-34.pyc
        util.cpython-34.pyc
        __init__.cpython-34.pyc
        named_entity.py
        util.pyc
        __init__.pyc
        api.py
        api.pyc
        regexp.pyc
        __init__.py
        tokenize
        punkt.py
        regexp.py
        util.py
        simple.pyc
        simple.py
        punkt.pyc
        treebank.pyc
        sexpr.pyc
        __pycache__
        stanford.cpython-34.pyc
        mwe.cpython-34.pyc
        simple.cpython-34.pyc
        texttiling.cpython-34.pyc
        regexp.cpython-34.pyc
        treebank.cpython-34.pyc
        punkt.cpython-34.pyc
        sexpr.cpython-34.pyc
        casual.cpython-34.pyc
        api.cpython-34.pyc
        util.cpython-34.pyc
        __init__.cpython-34.pyc
        util.pyc
        __init__.pyc
        stanford.pyc
        mwe.pyc
        treebank.py
        api.py
        api.pyc
        regexp.pyc
        texttiling.py
        __init__.py
        mwe.py
        stanford.py
        texttiling.pyc
        casual.py
        casual.pyc
        sexpr.py
        help.py
        tree.py
        compat.pyc
        book.pyc
        inference
        resolution.pyc
        nonmonotonic.py
        __pycache__
        tableau.cpython-34.pyc
        prover9.cpython-34.pyc
        resolution.cpython-34.pyc
        mace.cpython-34.pyc
        discourse.cpython-34.pyc
        api.cpython-34.pyc
        __init__.cpython-34.pyc
        nonmonotonic.pyc
        tableau.pyc
        prover9.pyc
        discourse.pyc
        __init__.pyc
        api.py
        api.pyc
        mace.pyc
        mace.py
        __init__.py
        discourse.py
        prover9.py
        resolution.py
        tableau.py
        app
        rdparser_app.py
        concordance_app.pyc
        chunkparser_app.pyc
        collocations_app.pyc
        rdparser_app.pyc
        wordnet_app.py
        chartparser_app.pyc
        srparser_app.py
        nemo_app.py
        chunkparser_app.py
        __init__.pyc
        wordfreq_app.pyc
        nemo_app.pyc
        wordfreq_app.py
        chartparser_app.py
        srparser_app.pyc
        __init__.py
        concordance_app.py
        wordnet_app.pyc
        collocations_app.py
        metrics
        distance.pyc
        spearman.py
        __pycache__
        scores.cpython-34.pyc
        spearman.cpython-34.pyc
        paice.cpython-34.pyc
        confusionmatrix.cpython-34.pyc
        segmentation.cpython-34.pyc
        association.cpython-34.pyc
        distance.cpython-34.pyc
        agreement.cpython-34.pyc
        __init__.cpython-34.pyc
        scores.py
        agreement.pyc
        spearman.pyc
        paice.pyc
        agreement.py
        association.py
        __init__.pyc
        scores.pyc
        confusionmatrix.pyc
        segmentation.pyc
        association.pyc
        __init__.py
        segmentation.py
        distance.py
        paice.py
        confusionmatrix.py
        compat.py
        cluster
        util.py
        em.pyc
        gaac.py
        util.pyc
        __init__.pyc
        gaac.pyc
        em.py
        api.py
        api.pyc
        __init__.py
        kmeans.py
        kmeans.pyc
        downloader.pyc
        treeprettyprinter.pyc
        ccg
        __pycache__
        lexicon.cpython-34.pyc
        chart.cpython-34.pyc
        api.cpython-34.pyc
        combinator.cpython-34.pyc
        __init__.cpython-34.pyc
        chart.pyc
        combinator.py
        __init__.pyc
        chart.py
        lexicon.py
        api.py
        api.pyc
        __init__.py
        combinator.pyc
        lexicon.pyc
      - nltk_core.py
      - numeric_to_spoken.py
      - lemmatize.py

# Copyright (c) 2002 Vivake Gupta (vivakeATomniscia.org).  All rights reserved.
#
# This program is free software; you can redistribute it and/or
# modify it under the terms of the GNU General Public License as
# published by the Free Software Foundation; either version 2 of the
# License, or (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307
# USA
#
# This software is maintained by Vivake (vivakeATomniscia.org) and is available at:
#     http://www.omniscia.org/~vivake/python/PorterStemmer.py
#
# Additional modifications were made to incorporate this module into
# NLTK.  All such modifications are marked with "--NLTK--".  The NLTK
# version of this module is maintained by NLTK developers,
# and is available via http://nltk.org/
#
# GNU Linking Exception:
# Using this module statically or dynamically with other modules is
# making a combined work based on this module. Thus, the terms and
# conditions of the GNU General Public License cover the whole combination.
# As a special exception, the copyright holders of this module give
# you permission to combine this module with independent modules to
# produce an executable program, regardless of the license terms of these
# independent modules, and to copy and distribute the resulting
# program under terms of your choice, provided that you also meet,
# for each linked independent module, the terms and conditions of
# the license of that module. An independent module is a module which
# is not derived from or based on this module. If you modify this module,
# you may extend this exception to your version of the module, but you
# are not obliged to do so. If you do not wish to do so, delete this
# exception statement from your version.

"""
Porter Stemmer

This is the Porter stemming algorithm, ported to Python from the
version coded up in ANSI C by the author. It follows the algorithm
presented in

Porter, M. "An algorithm for suffix stripping." Program 14.3 (1980): 130-137.

only differing from it at the points marked --DEPARTURE-- and --NEW--
below.

For a more faithful version of the Porter algorithm, see

    http://www.tartarus.org/~martin/PorterStemmer/

Later additions:

   June 2000

   The 'l' of the 'logi' -> 'log' rule is put with the stem, so that
   short stems like 'geo' 'theo' etc work like 'archaeo' 'philo' etc.

   This follows a suggestion of Barry Wilkins, research student at
   Birmingham.


   February 2000

   the cvc test for not dropping final -e now looks after vc at the
   beginning of a word, so are, eve, ice, ore, use keep final -e. In this
   test c is any consonant, including w, x and y. This extension was
   suggested by Chris Emerson.

   -fully    -> -ful   treated like  -fulness -> -ful, and
   -tionally -> -tion  treated like  -tional  -> -tion

   both in Step 2. These were suggested by Hiranmay Ghosh, of New Delhi.

   Invariants proceed, succeed, exceed. Also suggested by Hiranmay Ghosh.

Additional modifications were made to incorporate this module into
nltk.  All such modifications are marked with \"--NLTK--\".
"""

from __future__ import print_function, unicode_literals

## --NLTK--
## Declare this module's documentation format.
__docformat__ = 'plaintext'

import re

from nltk.stem.api import StemmerI
from nltk.compat import python_2_unicode_compatible

@python_2_unicode_compatible
class PorterStemmer(StemmerI):

    ## --NLTK--
    ## Add a class docstring
    """
    A word stemmer based on the Porter stemming algorithm.

        Porter, M. \"An algorithm for suffix stripping.\"
        Program 14.3 (1980): 130-137.

    A few minor modifications have been made to Porter's basic
    algorithm.  See the source code of this module for more
    information.

    The Porter Stemmer requires that all tokens have string types.
    """

    # The main part of the stemming algorithm starts here.
    # Note that only lower case sequences are stemmed. Forcing to lower case
    # should be done before stem(...) is called.

    def __init__(self):

        ## --NEW--
        ## This is a table of irregular forms. It is quite short, but still
        ## reflects the errors actually drawn to Martin Porter's attention over
        ## a 20 year period!
        ##
        ## Extend it as necessary.
        ##
        ## The form of the table is:
        ##  {
        ##  "p1" : ["s11","s12","s13", ... ],
        ##  "p2" : ["s21","s22","s23", ... ],
        ##  ...
        ##  "pn" : ["sn1","sn2","sn3", ... ]
        ##  }
        ##
        ## String sij is mapped to paradigm form pi, and the main stemming
        ## process is then bypassed.

        irregular_forms = {
            "sky" :     ["sky", "skies"],
            "die" :     ["dying"],
            "lie" :     ["lying"],
            "tie" :     ["tying"],
            "news" :    ["news"],
            "inning" :  ["innings", "inning"],
            "outing" :  ["outings", "outing"],
            "canning" : ["cannings", "canning"],
            "howe" :    ["howe"],

            # --NEW--
            "proceed" : ["proceed"],
            "exceed"  : ["exceed"],
            "succeed" : ["succeed"], # Hiranmay Ghosh
            }

        self.pool = {}
        for key in irregular_forms:
            for val in irregular_forms[key]:
                self.pool[val] = key

        self.vowels = frozenset(['a', 'e', 'i', 'o', 'u'])

    def _cons(self, word, i):
        """cons(i) is TRUE <=> b[i] is a consonant."""
        if word[i] in self.vowels:
            return False
        if word[i] == 'y':
            if i == 0:
                return True
            else:
                return (not self._cons(word, i - 1))
        return True

    def _m(self, word, j):
        """m() measures the number of consonant sequences between k0 and j.
        if c is a consonant sequence and v a vowel sequence, and <..>
        indicates arbitrary presence,

           <c><v>       gives 0
           <c>vc<v>     gives 1
           <c>vcvc<v>   gives 2
           <c>vcvcvc<v> gives 3
           ....
        """
        n = 0
        i = 0
        while True:
            if i > j:
                return n
            if not self._cons(word, i):
                break
            i = i + 1
        i = i + 1

        while True:
            while True:
                if i > j:
                    return n
                if self._cons(word, i):
                    break
                i = i + 1
            i = i + 1
            n = n + 1

            while True:
                if i > j:
                    return n
                if not self._cons(word, i):
                    break
                i = i + 1
            i = i + 1

    def _vowelinstem(self, stem):
        """vowelinstem(stem) is TRUE <=> stem contains a vowel"""
        for i in range(len(stem)):
            if not self._cons(stem, i):
                return True
        return False

    def _doublec(self, word):
        """doublec(word) is TRUE <=> word ends with a double consonant"""
        if len(word) < 2:
            return False
        if (word[-1] != word[-2]):
            return False
        return self._cons(word, len(word)-1)

    def _cvc(self, word, i):
        """cvc(i) is TRUE <=>

        a) ( --NEW--) i == 1, and word[0] word[1] is vowel consonant, or

        b) word[i - 2], word[i - 1], word[i] has the form consonant -
           vowel - consonant and also if the second c is not w, x or y. this
           is used when trying to restore an e at the end of a short word.
           e.g.

               cav(e), lov(e), hop(e), crim(e), but
               snow, box, tray.
        """
        if i == 0: return False  # i == 0 never happens perhaps
        if i == 1: return (not self._cons(word, 0) and self._cons(word, 1))
        if not self._cons(word, i) or self._cons(word, i-1) or not self._cons(word, i-2): return False

        ch = word[i]
        if ch == 'w' or ch == 'x' or ch == 'y':
            return False

        return True

    def _step1ab(self, word):
        """step1ab() gets rid of plurals and -ed or -ing. e.g.

           caresses  ->  caress
           ponies    ->  poni
           sties     ->  sti
           tie       ->  tie        (--NEW--: see below)
           caress    ->  caress
           cats      ->  cat

           feed      ->  feed
           agreed    ->  agree
           disabled  ->  disable

           matting   ->  mat
           mating    ->  mate
           meeting   ->  meet
           milling   ->  mill
           messing   ->  mess

           meetings  ->  meet
        """
        if word[-1] == 's':
            if word.endswith("sses"):
                word = word[:-2]
            elif word.endswith("ies"):
                if len(word) == 4:
                    word = word[:-1]
                # this line extends the original algorithm, so that
                # 'flies'->'fli' but 'dies'->'die' etc
                else:
                    word = word[:-2]
            elif word[-2] != 's':
                word = word[:-1]

        ed_or_ing_trimmed = False
        if word.endswith("ied"):
            if len(word) == 4:
                word = word[:-1]
            else:
                word = word[:-2]
        # this line extends the original algorithm, so that
        # 'spied'->'spi' but 'died'->'die' etc

        elif word.endswith("eed"):
            if self._m(word, len(word)-4) > 0:
                word = word[:-1]


        elif word.endswith("ed") and self._vowelinstem(word[:-2]):
            word = word[:-2]
            ed_or_ing_trimmed = True
        elif word.endswith("ing") and self._vowelinstem(word[:-3]):
            word = word[:-3]
            ed_or_ing_trimmed = True

        if ed_or_ing_trimmed:
            if word.endswith("at") or word.endswith("bl") or word.endswith("iz"):
                word += 'e'
            elif self._doublec(word):
                if word[-1] not in ['l', 's', 'z']:
                    word = word[:-1]
            elif (self._m(word, len(word)-1) == 1 and self._cvc(word, len(word)-1)):
                word += 'e'

        return word

    def _step1c(self, word):
        """step1c() turns terminal y to i when there is another vowel in the stem.
        --NEW--: This has been modified from the original Porter algorithm so that y->i
        is only done when y is preceded by a consonant, but not if the stem
        is only a single consonant, i.e.

           (*c and not c) Y -> I

        So 'happy' -> 'happi', but
          'enjoy' -> 'enjoy'  etc

        This is a much better rule. Formerly 'enjoy'->'enjoi' and 'enjoyment'->
        'enjoy'. Step 1c is perhaps done too soon; but with this modification that
        no longer really matters.

        Also, the removal of the vowelinstem(z) condition means that 'spy', 'fly',
        'try' ... stem to 'spi', 'fli', 'tri' and conflate with 'spied', 'tried',
        'flies' ...
        """
        if word[-1] == 'y' and len(word) > 2 and self._cons(word, len(word) - 2):
            return word[:-1] + 'i'
        else:
            return word

    def _step2(self, word):
        """step2() maps double suffices to single ones.
        so -ization ( = -ize plus -ation) maps to -ize etc. note that the
        string before the suffix must give m() > 0.
        """
        if len(word) <= 1: # Only possible at this stage given unusual inputs to stem_word like 'oed'
            return word

        ch = word[-2]

        if ch == 'a':
            if word.endswith("ational"):
                return word[:-7] + "ate" if self._m(word, len(word)-8) > 0 else word
            elif word.endswith("tional"):
                return word[:-2] if self._m(word, len(word)-7) > 0 else word
            else:
                return word
        elif ch == 'c':
            if word.endswith("enci"):
                return word[:-4] + "ence" if self._m(word, len(word)-5) > 0 else word
            elif word.endswith("anci"):
                return word[:-4] + "ance" if self._m(word, len(word)-5) > 0 else word
            else:
                return word
        elif ch == 'e':
            if word.endswith("izer"):
                return word[:-1] if self._m(word, len(word)-5) > 0 else word
            else:
                return word
        elif ch == 'l':
            if word.endswith("bli"):
                return word[:-3] + "ble" if self._m(word, len(word)-4) > 0 else word # --DEPARTURE--
            # To match the published algorithm, replace "bli" with "abli" and "ble" with "able"
            elif word.endswith("alli"):
                # --NEW--
                if self._m(word, len(word)-5) > 0:
                    word = word[:-2]
                    return self._step2(word)
                else:
                    return word
            elif word.endswith("fulli"):
                return word[:-2] if self._m(word, len(word)-6) else word # --NEW--
            elif word.endswith("entli"):
                return word[:-2] if self._m(word, len(word)-6) else word
            elif word.endswith("eli"):
                return word[:-2] if self._m(word, len(word)-4) else word
            elif word.endswith("ousli"):
                return word[:-2] if self._m(word, len(word)-6) else word
            else:
                return word
        elif ch == 'o':
            if word.endswith("ization"):
                return word[:-7] + "ize" if self._m(word, len(word)-8) else word
            elif word.endswith("ation"):
                return word[:-5] + "ate" if self._m(word, len(word)-6) else word
            elif word.endswith("ator"):
                return word[:-4] + "ate" if self._m(word, len(word)-5) else word
            else:
                return word
        elif ch == 's':
            if word.endswith("alism"):
                return word[:-3] if self._m(word, len(word)-6) else word
            elif word.endswith("ness"):
                if word.endswith("iveness"):
                    return word[:-4] if self._m(word, len(word)-8) else word
                elif word.endswith("fulness"):
                    return word[:-4] if self._m(word, len(word)-8) else word
                elif word.endswith("ousness"):
                    return word[:-4] if self._m(word, len(word)-8) else word
                else:
                    return word
            else:
                return word
        elif ch == 't':
            if word.endswith("aliti"):
                return word[:-3] if self._m(word, len(word)-6) else word
            elif word.endswith("iviti"):
                return word[:-5] + "ive" if self._m(word, len(word)-6) else word
            elif word.endswith("biliti"):
                return word[:-6] + "ble" if self._m(word, len(word)-7) else word
            else:
                return word
        elif ch == 'g': # --DEPARTURE--
            if word.endswith("logi"):
                return word[:-1] if self._m(word, len(word) - 4) else word # --NEW-- (Barry Wilkins)
            # To match the published algorithm, pass len(word)-5 to _m instead of len(word)-4
            else:
                return word

        else:
            return word

    def _step3(self, word):
        """step3() deals with -ic-, -full, -ness etc. similar strategy to step2."""

        ch = word[-1]

        if ch == 'e':
            if word.endswith("icate"):
                return word[:-3] if self._m(word, len(word)-6) else word
            elif word.endswith("ative"):
                return word[:-5] if self._m(word, len(word)-6) else word
            elif word.endswith("alize"):
                return word[:-3] if self._m(word, len(word)-6) else word
            else:
                return word
        elif ch == 'i':
            if word.endswith("iciti"):
                return word[:-3] if self._m(word, len(word)-6) else word
            else:
                return word
        elif ch == 'l':
            if word.endswith("ical"):
                return word[:-2] if self._m(word, len(word)-5) else word
            elif word.endswith("ful"):
                return word[:-3] if self._m(word, len(word)-4) else word
            else:
                return word
        elif ch == 's':
            if word.endswith("ness"):
                return word[:-4] if self._m(word, len(word)-5) else word
            else:
                return word

        else:
            return word

    def _step4(self, word):
        """step4() takes off -ant, -ence etc., in context <c>vcvc<v>."""

        if len(word) <= 1: # Only possible at this stage given unusual inputs to stem_word like 'oed'
            return word

        ch = word[-2]

        if ch == 'a':
            if word.endswith("al"):
                return word[:-2] if self._m(word, len(word)-3) > 1 else word
            else:
                return word
        elif ch == 'c':
            if word.endswith("ance"):
                return word[:-4] if self._m(word, len(word)-5) > 1 else word
            elif word.endswith("ence"):
                return word[:-4] if self._m(word, len(word)-5) > 1 else word
            else:
                return word
        elif ch == 'e':
            if word.endswith("er"):
                return word[:-2] if self._m(word, len(word)-3) > 1 else word
            else:
                return word
        elif ch == 'i':
            if word.endswith("ic"):
                return word[:-2] if self._m(word, len(word)-3) > 1 else word
            else:
                return word
        elif ch == 'l':
            if word.endswith("able"):
                return word[:-4] if self._m(word, len(word)-5) > 1 else word
            elif word.endswith("ible"):
                return word[:-4] if self._m(word, len(word)-5) > 1 else word
            else:
                return word
        elif ch == 'n':
            if word.endswith("ant"):
                return word[:-3] if self._m(word, len(word)-4) > 1 else word
            elif word.endswith("ement"):
                return word[:-5] if self._m(word, len(word)-6) > 1 else word
            elif word.endswith("ment"):
                return word[:-4] if self._m(word, len(word)-5) > 1 else word
            elif word.endswith("ent"):
                return word[:-3] if self._m(word, len(word)-4) > 1 else word
            else:
                return word
        elif ch == 'o':
            if word.endswith("sion") or word.endswith("tion"): # slightly different logic to all the other cases
                return word[:-3] if self._m(word, len(word)-4) > 1 else word
            elif word.endswith("ou"):
                return word[:-2] if self._m(word, len(word)-3) > 1 else word
            else:
                return word
        elif ch == 's':
            if word.endswith("ism"):
                return word[:-3] if self._m(word, len(word)-4) > 1 else word
            else:
                return word
        elif ch == 't':
            if word.endswith("ate"):
                return word[:-3] if self._m(word, len(word)-4) > 1 else word
            elif word.endswith("iti"):
                return word[:-3] if self._m(word, len(word)-4) > 1 else word
            else:
                return word
        elif ch == 'u':
            if word.endswith("ous"):
                return word[:-3] if self._m(word, len(word)-4) > 1 else word
            else:
                return word
        elif ch == 'v':
            if word.endswith("ive"):
                return word[:-3] if self._m(word, len(word)-4) > 1 else word
            else:
                return word
        elif ch == 'z':
            if word.endswith("ize"):
                return word[:-3] if self._m(word, len(word)-4) > 1 else word
            else:
                return word
        else:
            return word

    def _step5(self, word):
        """step5() removes a final -e if m() > 1, and changes -ll to -l if
        m() > 1.
        """
        if word[-1] == 'e':
            a = self._m(word, len(word)-1)
            if a > 1 or (a == 1 and not self._cvc(word, len(word)-2)):
                word = word[:-1]
        if word.endswith('ll') and self._m(word, len(word)-1) > 1:
            word = word[:-1]

        return word

    def stem_word(self, p, i=0, j=None):
        """
        Returns the stem of p, or, if i and j are given, the stem of p[i:j+1].
        """
        ## --NLTK--
        if j is None and i == 0:
            word = p
        else:
            if j is None:
                j = len(p) - 1
            word = p[i:j+1]

        if word in self.pool:
            return self.pool[word]

        if len(word) <= 2:
            return word # --DEPARTURE--
        # With this line, strings of length 1 or 2 don't go through the
        # stemming process, although no mention is made of this in the
        # published algorithm. Remove the line to match the published
        # algorithm.

        word = self._step1ab(word)
        word = self._step1c(word)
        word = self._step2(word)
        word = self._step3(word)
        word = self._step4(word)
        word = self._step5(word)
        return word

    def _adjust_case(self, word, stem):
        lower = word.lower()

        ret = ""
        for x in range(len(stem)):
            if lower[x] == stem[x]:
                ret += word[x]
            else:
                ret += stem[x]

        return ret

    ## --NLTK--
    ## Don't use this procedure; we want to work with individual
    ## tokens, instead.  (commented out the following procedure)
    #def stem(self, text):
    #    parts = re.split("(\W+)", text)
    #    numWords = (len(parts) + 1)/2
    #
    #    ret = ""
    #    for i in xrange(numWords):
    #        word = parts[2 * i]
    #        separator = ""
    #        if ((2 * i) + 1) < len(parts):
    #            separator = parts[(2 * i) + 1]
    #
    #        stem = self.stem_word(string.lower(word), 0, len(word) - 1)
    #        ret = ret + self.adjust_case(word, stem)
    #        ret = ret + separator
    #    return ret

    ## --NLTK--
    ## Define a stem() method that implements the StemmerI interface.
    def stem(self, word):
        stem = self.stem_word(word.lower(), 0, len(word) - 1)
        return self._adjust_case(word, stem)

    ## --NLTK--
    ## Add a string representation function
    def __repr__(self):
        """Return the fixed tag '<PorterStemmer>' as this object's representation."""
        return '<PorterStemmer>'

## --NLTK--
## This test procedure isn't applicable.
#if __name__ == '__main__':
#    p = PorterStemmer()
#    if len(sys.argv) > 1:
#        for f in sys.argv[1:]:
#            with open(f, 'r') as infile:
#                while 1:
#                    w = infile.readline()
#                    if w == '':
#                        break
#                    w = w[:-1]
#                    print(p.stem(w))

##--NLTK--
## Added a demo() function

def demo():
    """
    A demonstration of the porter stemmer on a sample from
    the Penn Treebank corpus.

    Stems every word of the first three treebank files and prints the
    original and the stemmed text, each wrapped at about 70 columns.
    """

    from nltk.corpus import treebank
    from nltk import stem

    stemmer = stem.PorterStemmer()

    orig = []
    stemmed = []
    # Corpus readers expose their file list as fileids(); the older
    # files() accessor is not available in NLTK 3.
    for item in treebank.fileids()[:3]:
        for (word, _tag) in treebank.tagged_words(item):
            orig.append(word)
            stemmed.append(stemmer.stem(word))

    def wrap(words):
        # Join the words into one string and word-wrap it.
        text = ' '.join(words)
        return re.sub(r"(.{,70})\s", r'\1\n', text+' ').rstrip()

    results = wrap(stemmed)
    original = wrap(orig)

    # Print the results.
    print('-Original-'.center(70).replace(' ', '*').replace('-', ' '))
    print(original)
    print('-Results-'.center(70).replace(' ', '*').replace('-', ' '))
    print(results)
    print('*'*70)

##--NLTK--