Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
GUILLAUME Bruno
libcaml-conll
Commits
67c4375c
Commit
67c4375c
authored
Oct 31, 2020
by
Bruno Guillaume
Browse files
update UD feature list
parent
1fb9c6bf
Changes
2
Hide whitespace changes
Inline
Side-by-side
src/conllx.ml
View file @
67c4375c
...
...
@@ -206,21 +206,25 @@ module Conllx_config = struct
(* ---------------------------------------------------------------------------------------------------- *)
(* Names of the UD (Universal Dependencies) morphological features known to
   this configuration, followed by the SUD-specific additions.
   Each name is listed exactly once and the UD part is kept in sorted order,
   so a new feature can be inserted at its place without risking a
   duplicate entry. *)
let ud_features = [
  (* UD features collected from data folder on 2020/10/27 *)
  "Abbr";
  "AdjType";
  "AdpType";
  "AdvType";
  "Agent";
  "Agglutination";
  "Analyt";
  "Animacy";
  "Animacy[gram]";
  "Animacy[obj]";
  "Aspect";
  "Case";
  "Clitic";
  "Clusivity";
  "Clusivity[obj]";
  "Clusivity[psor]";
  "Clusivity[subj]";
  "Compound";
  "ConjType";
  "Connegative";
  "Contrast";
  "Copula";
  "Definite";
  "Definite[obj]";
  "Degree";
  "Deixis";
  "DeixisRef";
  "Deriv";
  "Derivation";
  "Dialect";
  "Distance";
  "Echo";
  "Emphatic";
  "Evident";
  "Focus";
  "FocusType";
  "Foreign";
  "Form";
  "Gender";
  "Gender[abs]";
  "Gender[acc]";
  "Gender[ben]";
  "Gender[dat]";
  "Gender[erg]";
  "Gender[obj]";
  "Gender[psor]";
  "Gender[subj]";
  "HebBinyan";
  "HebExistential";
  "HebSource";
  "Hyph";
  "InfForm";
  "Link";
  "Mood";
  "Morph";
  "Mutation";
  "NameType";
  "NegationType";
  "Nomzr";
  "Noun";
  "NounClass";
  "NounClass[obj]";
  "NounClass[subj]";
  "NounForm";
  "NounType";
  "NumForm";
  "NumType";
  "NumValue";
  "Number";
  "Number[abs]";
  "Number[acc]";
  "Number[dat]";
  "Number[erg]";
  "Number[obj]";
  "Number[psed]";
  "Number[psor]";
  "Number[subj]";
  "Orth";
  "PartForm";
  "PartType";
  "Person";
  "Person12Pl";
  "Person12Sg";
  "Person[abs]";
  "Person[acc]";
  "Person[dat]";
  "Person[erg]";
  "Person[obj]";
  "Person[psor]";
  "Person[sdat]";
  "Person[subj]";
  "Polarity";
  "Polite";
  "Polite[abs]";
  "Polite[dat]";
  "Polite[erg]";
  "Position";
  "Poss";
  "PossNumber";
  "PossPerson";
  "Possessed";
  "Prefix";
  "PrepCase";
  "PrepForm";
  "Preverb";
  "PronClass";
  "PronGend";
  "PronNum";
  "PronPers";
  "PronType";
  "Proper";
  "Pun";
  "PunctSide";
  "PunctType";
  "Red";
  "RefRole";
  "Reflex";
  "Register";
  (* "Rel"; declared for Tupinamba but unused *)
  "Relative";
  "Strength";
  "Style";
  "SubGender";
  "Subcat";
  "Tense";
  "Topic";
  "Typo";
  "Uninflect";
  "Valency";
  "Variant";
  "VerbClass";
  "VerbForm";
  "VerbType";
  "Voice";
  "Xtra";

  (* SUD features *)
  "Shared";
]
...
...
@@ -283,6 +287,10 @@ module Conllx_config = struct
|
s
->
Error
.
error
"Unknown config `%s` (available values are: `basic`, `ud`, `sud`, `sequoia`, `orfeo`)"
s
(* [get_name t] gives back the [name] field stored in the configuration [t]. *)
let get_name { name; _ } = name
(* [remove_from_feats feature_name config] builds a new configuration equal
   to [config] except that [feature_name] has been taken out of its [feats]
   list. [config] itself is left untouched. *)
let remove_from_feats feature_name config =
  let feats = CCList.remove ~eq:( = ) ~key:feature_name config.feats in
  { config with feats }
end
...
...
src/conllx.mli
View file @
67c4375c
...
...
@@ -29,6 +29,8 @@ module Conllx_config: sig
(** [build s] returns a configuration built from the string [s].
    NOTE(review): presumably [s] is a configuration name such as [basic],
    [ud], [sud], [sequoia] or [orfeo] (the names listed by the
    "Unknown config" error in the implementation) -- confirm that this error
    is raised by [build] itself. *)
val
build
:
string
->
t
(** [get_name t] returns the [name] field of the configuration [t]. *)
val
get_name
:
t
->
string
(** [remove_from_feats feature_name config] returns a copy of [config] in
    which [feature_name] has been removed from the [feats] list (using
    [CCList.remove] with structural equality); the other fields are
    unchanged. *)
val
remove_from_feats
:
string
->
t
->
t
end
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment