# path: root/sample/testapp.py
# blob: 15661344299e813f200d7474c1d87518bc6f76dd (plain)
import sys
import re
import snowballstemmer


def usage():
    """Print the one-line command synopsis to standard output."""
    synopsis = 'testapp.py <algorithm> "sentence"...'
    print(synopsis)

def main():
    """Stem every word of the command-line sentences and print the results.

    Arguments are read from ``sys.argv``. When two or more arguments follow
    the script name, the first one is taken as the stemming algorithm and
    the rest as sentences; with a single argument the algorithm defaults
    to ``'english'`` and that argument is the sentence. With no arguments
    the usage text is printed and nothing else happens.

    Each sentence is split on whitespace, ``.`` and ``-``; every non-empty
    piece is lower-cased and printed as ``word -> stem``.
    """
    argv = sys.argv
    # sys.argv[0] is the script name, so fewer than two entries means the
    # user supplied no arguments at all.
    if len(argv) < 2:
        usage()
        return
    algorithm = 'english'
    if len(argv) > 2:
        # First user argument names the algorithm; the rest are sentences.
        algorithm = argv[1]
        argv = argv[2:]
    else:
        argv = argv[1:]
    stemmer = snowballstemmer.stemmer(algorithm)
    splitter = re.compile(r"[\s\.-]")
    for arg in argv:
        for word in splitter.split(arg):
            # Adjacent separators produce empty pieces; skip them.
            if word == '':
                continue
            original = word.lower()
            print(original + " -> " + stemmer.stemWord(original))
# Run the demo only when executed as a script, so that importing this
# module does not parse arguments or print anything.
if __name__ == "__main__":
    main()