# Patch adding four stand-alone example scripts under test/ that drive the
# `grew` Python module: corpus_svg.py, search_corpus.py, set_gender.py and
# test_corpus_count.py.
# NOTE(review): line breaks and indentation below were reconstructed from a
# whitespace-collapsed copy of this patch; verify whitespace-sensitive content
# (the graph/GRS string literals in set_gender.py) against the original.
# NOTE(review): set_gender.py declares nodes with `cat=...` while the rule
# matches `upos=NOUN` -- confirm the rule is expected to fire on this graph.
diff --git a/test/corpus_svg.py b/test/corpus_svg.py
new file mode 100644
index 0000000000000000000000000000000000000000..46b1956b9fea8d344310cbcc69112b6f76e98297
--- /dev/null
+++ b/test/corpus_svg.py
@@ -0,0 +1,23 @@
+import sys
+import grew
+
+grew.init(True) # local usage --> run grewpy_dev
+
+gsd = grew.corpus (["UD_French-GSD/fr_gsd-ud-dev.conllu", "UD_French-GSD/fr_gsd-ud-test.conllu", ])
+
+# graph = grew.corpus_get (gsd, "fr-ud-dev_00002")
+# print(graph)
+
+print (grew.corpus_size (gsd))
+
+ids = grew.corpus_sent_ids(gsd)
+print (ids[10:20])
+
+try:
+    graph = grew.corpus_get ("fr-ud-dev_00002", gsd)
+    svg = grew.graph_svg(graph)
+    print(svg)
+except grew.utils.GrewError as err:
+    print ("ERROR: %s" % err)
+
+
diff --git a/test/search_corpus.py b/test/search_corpus.py
new file mode 100644
index 0000000000000000000000000000000000000000..3ac1be6f8e8d326187416bc8968a613fbaecbcb2
--- /dev/null
+++ b/test/search_corpus.py
@@ -0,0 +1,13 @@
+
+# Import the library
+import grew
+
+# Run the grew tool in background
+grew.init()
+
+# Load the corpus file (of course, you will have to update the filename for your system)
+c = grew.corpus ("/users/guillaum/gitlab/deep-sequoia/trunk/sequoia.deep_and_surf.conll")
+
+# Search for an empty pattern and print the number of occurrences
+r = grew.corpus_search ("pattern {}", c)
+print (len (r))
\ No newline at end of file
diff --git a/test/set_gender.py b/test/set_gender.py
new file mode 100644
index 0000000000000000000000000000000000000000..3edc39129afd942ca14e4811067647a1daa283e5
--- /dev/null
+++ b/test/set_gender.py
@@ -0,0 +1,27 @@
+import grew
+grew.init(True)
+
+g = grew.graph('''graph {
+  W1 [form="le", lemma="le", cat=DET];
+  W2 [form="garçon", lemma="garçon", cat=NOUN];
+  W3 [form="voit", lemma="voir", cat=VERB];
+  W4 [form="la", lemma="le", cat=DET];
+  W5 [form="maison", lemma="maison", cat=NOUN];
+  }''')
+
+r = grew.grs('''
+rule set_gender {
+  pattern { N [upos=NOUN, !Gender, lemma=lex.noun] }
+  commands { N.Gender = lex.Gender }
+}
+#BEGIN lex
+noun Gender
+%-------------
+garçon Masc
+maison Fem
+#END
+''')
+
+out = grew.run(r, g, 'Iter(set_gender)')
+
+print (out)
diff --git a/test/test_corpus_count.py b/test/test_corpus_count.py
new file mode 100644
index 0000000000000000000000000000000000000000..07e2e49b0c0817829d0fc45d2659a137b5f2f68b
--- /dev/null
+++ b/test/test_corpus_count.py
@@ -0,0 +1,13 @@
+import grew
+import sys
+import json
+
+grew.init(True) # local usage --> run grewpy_dev
+
+seq = grew.corpus(["UD_French-GSD/fr_gsd-ud-test.conllu", "UD_French-GSD/fr_gsd-ud-dev.conllu", "UD_French-GSD/fr_gsd-ud-train.conllu"])
+
+
+print ("|NOUN| = " + json.dumps (grew.corpus_count("pattern { N[upos=NOUN] }", seq)))
+print ("|NOUN| -[cop]-> = " + json.dumps (grew.corpus_count("pattern { N[upos=NOUN]; N -[cop]-> * }", seq)))
+print (" -[nsubj]-> |NOUN| = " + json.dumps (grew.corpus_count("pattern { * -[nsubj]-> N; N[upos=NOUN]; }", seq)))
+