0001-added-part-of-speech-tag-to-word.patch

D. Hamann, 09/24/2017 07:17 PM

Download (2.87 KB)

View differences:

proto/stable/rst/dialog/SpeechHypothesis.proto
32 32
         */
33 33
        optional timing.Interval timestamps = 2;
34 34

  
35
        /**
36
         * Enumeration of part-of-speech tags as defined by the NEGRA corpus.
37
         * See <a href="http://www.coli.uni-saarland.de/projects/sfb378/negra-corpus/negra-corpus.html">here</a>.
38
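         * Differences from the NEGRA corpus: the punctuation tags "$,", "$." and "$(" are named KOMM, END and IPNCT respectively, because "$" and punctuation characters are not allowed in protobuf identifiers.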
39
         */
40
        enum PosTag { // Values are numbered consecutively from 1; no 0 value is declared.
41
                ADJA = 1;
42
                ADJD = 2;
43
                ADV = 3;
44
                APPR = 4;
45
                APPRART = 5;
46
                APPO = 6;
47
                APZR = 7;
48
                ART = 8;
49
                CARD = 9;
50
                FM = 10;
51
                ITJ = 11;
52
                ORD = 12;
53
                KOUI = 13;
54
                KOUS = 14;
55
                KON = 15;
56
                KOKOM = 16;
57
                NN = 17;
58
                NE = 18;
59
                PDS = 19;
60
                PDAT = 20;
61
                PIS = 21;
62
                PIAT = 22;
63
                PIDAT = 23;
64
                PPER = 24;
65
                PPOSS = 25;
66
                PPOSAT = 26;
67
                PRELS = 27;
68
                PRELAT = 28;
69
                PRF = 29;
70
                PWS = 30;
71
                PWAT = 31;
72
                PWAV = 32;
73
                PAV = 33;
74
                PTKZU = 34;
75
                PTKNEG = 35;
76
                PTKVZ = 36;
77
                PTKANT = 37;
78
                PTKA = 38;
79
                SGML = 39;
80
                SPELL = 40;
81
                TRUNC = 41;
82
                VVFIN = 42;
83
                VVIMP = 43;
84
                VVINF = 44;
85
                VVIZU = 45;
86
                VVPP = 46;
87
                VAFIN = 47;
88
                VAIMP = 48;
89
                VAINF = 49;
90
                VAPP = 50;
91
                VMFIN = 51;
92
                VMINF = 52;
93
                VMPP = 53;
94
                XY = 54;
95
                KOMM = 55; // Replaces the NEGRA tag "$,".
96
                END = 56; // Replaces the NEGRA tag "$.".
97
                IPNCT = 57; // Replaces the NEGRA tag "$(".
98
        }
99

  
100
        /**
101
         * Part-of-speech tag for this word.
102
         * See <a href="http://www.coli.uni-saarland.de/projects/sfb378/negra-corpus/stts.asc">here</a>
103
         * for more information.
104
         */
105
        optional PosTag part_of_speech_tag = 3;
106

  
35 107
    }
36 108

  
37 109
    /**
38
-