-
Notifications
You must be signed in to change notification settings - Fork 0
/
verb.cc
138 lines (124 loc) · 3.97 KB
/
verb.cc
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
// Copyright (C) 2011 Petr Machata
//
// This program is free software: you can redistribute it and/or modify
// it under the terms of the GNU Affero General Public License as
// published by the Free Software Foundation, either version 3 of the
// License, or (at your option) any later version.
//
// This program is distributed in the hope that it will be useful, but
// WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
// Affero General Public License for more details.
//
// You should have received a copy of the GNU Affero General Public
// License along with this program. If not, see
// <http://www.gnu.org/licenses/>.
#include "verb.hh"
#include "forms.hh"
#include "rus_gramtab.hh"
#include "format.hh"
#include "adjective.hh"
#include <boost/format.hpp>
#include <iostream>
// Construct a verb handler.  PARENT and the literal name "verb" are
// forwarded unchanged to the pos_handler base class; the constructor
// body itself does nothing.
verb_handler::verb_handler (id_allocator &parent)
  : pos_handler (parent, "verb")
{}
// Walk every form returned by IT.forms (), derive a dotted key from the
// grammemes attached to that form, and append the pair
// (*form, form.accent ()) to DATA[key].
//
// Key shapes produced below:
//   adj_participle.<voice>.<tense>.<adjective form key>
//   <imperative>.<number>.<person>
//   infinitive
//   adv_participle.<tense>
//   <tense>.<number>.<person>   (tense is gm_future or gm_present)
//   <tense>.<gender>            (any other tense, number is gm_singular)
//   <tense>.<number>            (any other tense, any other number)
//
// Every gm_colloquial grammeme of a form is additionally recorded under
// "<key>.<index>.extra", paired with -1, where <index> is the position
// in DATA[key] of the entry that was just appended.  Grammemes that no
// branch recognises are reported on std::cerr and otherwise ignored.
//
// AGRAMTAB is not referenced by this function.
void
verb_handler::fill_hdf (CAgramtab *agramtab,
                        lemmatize::const_iterator const &it,
                        hdf_data_map &data) const
{
  typedef std::vector<grammeme>::const_iterator grammeme_iter;
  typedef std::vector<gram_code_t>::const_iterator code_iter;

  lemmatize::forms all_forms = it.forms ();
  for (lemmatize::forms::const_iterator form = all_forms.begin ();
       form != all_forms.end (); ++form)
    {
      // Per-form state; each category stays gm__invalid until one of
      // the extract_rus_* helpers accepts a grammeme for it.
      gram_code_t number = gm__invalid;
      gram_code_t voice = gm__invalid;
      gram_code_t gender = gm__invalid;
      gram_code_t tense = gm__invalid;
      gram_code_t person = gm__invalid;
      gram_code_t gcase = gm__invalid;
      bool imperative = false;
      bool animate = false;
      bool inanimate = false;
      std::vector<gram_code_t> extra;

      std::vector<grammeme> grammemes = form.ancode ().grammemes ();
      for (grammeme_iter g = grammemes.begin (); g != grammemes.end (); ++g)
        {
          gram_code_t code = g->value_as<gram_code_t> ();

          // The helpers are tried in this fixed order; the first one
          // that accepts CODE ends the processing of this grammeme.
          if (extract_rus_number (number, code)
              || extract_rus_voice (voice, code)
              || extract_rus_gender (gender, code)
              || extract_rus_tense (tense, code)
              || extract_rus_person (person, code)
              || extract_rus_case (gcase, code))
            continue;

          if (code == gm_imperative)
            imperative = true;
          else if (code == gm_animate)
            animate = true;
          else if (code == gm_inanimate)
            inanimate = true;
          else if (code == gm_colloquial)
            extra.push_back (code);
          else
            {
              boost::format complaint ("Unhandled grammeme %s\n");
              complaint % format_rus (code);
              std::cerr << complaint;
            }
        }

      std::string key;
      if (animate || inanimate)
        {
          // Forms with animate and/or inanimate attributes are
          // adjectival participles.
          std::string adjective_key = adjective_handler::format_form_key
            (gm_positive, gcase, number, gender, animate, inanimate, false);
          key = str (boost::format ("adj_participle.%s.%s.%s")
                     % format_rus (voice)
                     % format_rus (tense)
                     % adjective_key);
        }
      else if (tense == gm__invalid)
        {
          // No tense at all: either an imperative or the infinitive.
          if (!imperative)
            key = "infinitive";
          else
            key = str (boost::format ("%s.%s.%s")
                       % format_rus (gm_imperative)
                       % format_rus (number)
                       % format_rus (person));
        }
      else if (number == gm__invalid)
        {
          // These are adverbial participles.
          key = str (boost::format ("adv_participle.%s")
                     % format_rus (tense));
        }
      else if (tense == gm_future || tense == gm_present)
        {
          key = str (boost::format ("%s.%s.%s")
                     % format_rus (tense)
                     % format_rus (number)
                     % format_rus (person));
        }
      else
        {
          // past tense: keyed by gender in the singular, by number
          // otherwise.
          gram_code_t qualifier = (number == gm_singular) ? gender : number;
          key = str (boost::format ("%s.%s")
                     % format_rus (tense)
                     % format_rus (qualifier));
        }

      data[key].push_back (std::make_pair (*form, form.accent ()));

      if (extra.empty ())
        continue;

      // Index of the entry appended just above.
      std::string extra_key = str (boost::format ("%s.%d.extra")
                                   % key % (data[key].size () - 1));
      for (code_iter c = extra.begin (); c != extra.end (); ++c)
        data[extra_key].push_back (std::make_pair (format_rus (*c), -1));
    }
}