about | summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
-rw-r--r-- data/dbverb.struct 17
-rw-r--r-- src/ellinika/elmorph.c 217
-rw-r--r-- src/ellinika/elmorph.scm 430
3 files changed, 137 insertions, 127 deletions
diff --git a/data/dbverb.struct b/data/dbverb.struct
index 4ab6a37..af9d236 100644
--- a/data/dbverb.struct
+++ b/data/dbverb.struct
@@ -1,2 +1,19 @@
1-- This file is part of Ellinika
2-- Copyright (C) 2004, 2005, 2007 Sergey Poznyakoff
3--
4-- Ellinika is free software; you can redistribute it and/or modify
5-- it under the terms of the GNU General Public License as published by
6-- the Free Software Foundation; either version 3 of the License, or
7-- (at your option) any later version.
8--
9-- Ellinika is distributed in the hope that it will be useful,
10-- but WITHOUT ANY WARRANTY; without even the implied warranty of
11-- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12-- GNU General Public License for more details.
13--
14-- You should have received a copy of the GNU General Public License
15-- along with this program. If not, see <http://www.gnu.org/licenses/>.
16--
1set names utf8; 17set names utf8;
18
2DROP TABLE IF EXISTS verbflect; 19DROP TABLE IF EXISTS verbflect;
diff --git a/src/ellinika/elmorph.c b/src/ellinika/elmorph.c
index 5785f8d..f55e010 100644
--- a/src/ellinika/elmorph.c
+++ b/src/ellinika/elmorph.c
@@ -104,5 +104,8 @@ _elstr_alloc(const char *instr, int syl)
104 elstr->sylmap = NULL; 104 elstr->sylmap = NULL;
105 elstr->nsyl = 0;
106 elstr->acc_syl = 0;
107 elstr->acc_pos = 0;
105 if (syl) 108 if (syl)
106 _elstr_syllabize(elstr); 109 _elstr_syllabize(elstr);
107 110
108 SCM_RETURN_NEWSMOB(_elstr_tag, elstr); 111 SCM_RETURN_NEWSMOB(_elstr_tag, elstr);
@@ -142,2 +145,4 @@ _elstr_concat(struct elstr *dest, struct elstr *src, const char *func_name)
142 145
146 if (src->len == 0)
147 return;
143 wp = realloc(dest->str, 148 wp = realloc(dest->str,
@@ -221,2 +226,31 @@ _elstr_init()
221 226
227static SCM
228force_elstr(struct elstr **ep, SCM scm, int sylopt,
229 int arg, const char *func_name)
230{
231 struct elstr *elstr;
232
233 if (scm_is_elstr(scm)) {
234 elstr = (struct elstr*) SCM_CDR(scm);
235 } else {
236 SCM newscm;
237 char *str;
238
239 SCM_ASSERT(scm_is_string(scm), scm, arg, func_name);
240 str = scm_to_locale_string(scm);
241 newscm = _elstr_alloc(str, sylopt);
242 free(str);
243 if (newscm == SCM_EOL)
244 scm_misc_error(func_name,
245 "Invalid input string: ~S",
246 scm_list_1(scm));
247 scm = newscm;
248 elstr = (struct elstr*) SCM_CDR(newscm);
249 }
250 if (ep)
251 *ep = elstr;
252 return scm;
253}
254
255
222SCM_DEFINE_PUBLIC(scm_elstr_p, "elstr?", 1, 0, 0, 256SCM_DEFINE_PUBLIC(scm_elstr_p, "elstr?", 1, 0, 0,
@@ -239,10 +273,3 @@ SCM_DEFINE_PUBLIC(scm_string__elstr, "string->elstr", 1, 0, 0,
239 SCM_ASSERT(scm_is_string(string), string, SCM_ARG1, FUNC_NAME); 273 SCM_ASSERT(scm_is_string(string), string, SCM_ARG1, FUNC_NAME);
240 str = scm_to_locale_string(string); 274 return force_elstr(NULL, string, 1, SCM_ARG1, FUNC_NAME);
241 scm = _elstr_alloc(str, 1);
242 free(str);
243 if (scm == SCM_EOL)
244 scm_misc_error(FUNC_NAME,
245 "Invalid input string: ~S",
246 scm_list_1(string));
247 return scm;
248} 275}
@@ -277,5 +304,3 @@ SCM_DEFINE_PUBLIC(scm_elstr_length, "elstr-length", 1, 0, 0,
277 struct elstr *elstr; 304 struct elstr *elstr;
278 305 force_elstr(&elstr, el, 0, SCM_ARG1, FUNC_NAME);
279 SCM_ASSERT(scm_is_elstr(el), el, SCM_ARG1, FUNC_NAME);
280 elstr = (struct elstr*) SCM_CDR(el);
281 return scm_from_uint(elstr->len); 306 return scm_from_uint(elstr->len);
@@ -291,5 +316,3 @@ SCM_DEFINE_PUBLIC(scm_elstr_number_of_syllables, "elstr-number-of-syllables",
291 struct elstr *elstr; 316 struct elstr *elstr;
292 317 force_elstr(&elstr, el, 1, SCM_ARG1, FUNC_NAME);
293 SCM_ASSERT(scm_is_elstr(el), el, SCM_ARG1, FUNC_NAME);
294 elstr = (struct elstr*) SCM_CDR(el);
295 return scm_from_uint(elstr->nsyl); 318 return scm_from_uint(elstr->nsyl);
@@ -307,4 +330,3 @@ SCM_DEFINE_PUBLIC(scm_elstr_syllable_prop, "elstr-syllable-prop",
307 330
308 SCM_ASSERT(scm_is_elstr(el), el, SCM_ARG1, FUNC_NAME); 331 force_elstr(&elstr, el, 1, SCM_ARG1, FUNC_NAME);
309 elstr = (struct elstr*) SCM_CDR(el);
310 SCM_ASSERT(scm_is_integer(n), n, SCM_ARG2, FUNC_NAME); 332 SCM_ASSERT(scm_is_integer(n), n, SCM_ARG2, FUNC_NAME);
@@ -332,5 +354,3 @@ SCM_DEFINE_PUBLIC(scm_elstr_accent_position, "elstr-accent-position", 1, 0, 0,
332 struct elstr *elstr; 354 struct elstr *elstr;
333 355 force_elstr(&elstr, el, 0, SCM_ARG1, FUNC_NAME);
334 SCM_ASSERT(scm_is_elstr(el), el, SCM_ARG1, FUNC_NAME);
335 elstr = (struct elstr*) SCM_CDR(el);
336 return scm_from_uint(elstr->acc_pos); 356 return scm_from_uint(elstr->acc_pos);
@@ -346,5 +366,3 @@ SCM_DEFINE_PUBLIC(scm_elstr_accented_syllable, "elstr-accented-syllable",
346 struct elstr *elstr; 366 struct elstr *elstr;
347 367 force_elstr(&elstr, el, 1, SCM_ARG1, FUNC_NAME);
348 SCM_ASSERT(scm_is_elstr(el), el, SCM_ARG1, FUNC_NAME);
349 elstr = (struct elstr*) SCM_CDR(el);
350 return scm_from_uint(elstr->acc_syl); 368 return scm_from_uint(elstr->acc_syl);
@@ -364,4 +382,3 @@ SCM_DEFINE_PUBLIC(scm_elstr_syllable, "elstr-syllable",
364 382
365 SCM_ASSERT(scm_is_elstr(el), el, SCM_ARG1, FUNC_NAME); 383 force_elstr(&elstr, el, 1, SCM_ARG1, FUNC_NAME);
366 elstr = (struct elstr*) SCM_CDR(el);
367 SCM_ASSERT(scm_is_integer(n), n, SCM_ARG2, FUNC_NAME); 384 SCM_ASSERT(scm_is_integer(n), n, SCM_ARG2, FUNC_NAME);
@@ -400,4 +417,3 @@ SCM_DEFINE_PUBLIC(scm_elstr_character, "elstr-character",
400 417
401 SCM_ASSERT(scm_is_elstr(el), el, SCM_ARG1, FUNC_NAME); 418 force_elstr(&elstr, el, 0, SCM_ARG1, FUNC_NAME);
402 elstr = (struct elstr*) SCM_CDR(el);
403 SCM_ASSERT(scm_is_integer(n), n, SCM_ARG2, FUNC_NAME); 419 SCM_ASSERT(scm_is_integer(n), n, SCM_ARG2, FUNC_NAME);
@@ -425,9 +441,12 @@ _elstr_chgcase(SCM el, void (*chgfun)(unsigned *, size_t),
425 441
426 SCM_ASSERT(scm_is_elstr(el), el, SCM_ARG1, func_name); 442 if (destructive) {
427 elstr = (struct elstr*) SCM_CDR(el); 443 SCM_ASSERT(scm_is_elstr(el), el, SCM_ARG1, func_name);
428 if (destructive) 444 elstr = (struct elstr*) SCM_CDR(el);
429 scm = SCM_UNSPECIFIED; 445 scm = SCM_UNSPECIFIED;
430 else { 446 } else {
431 scm = _elstr_dup(elstr); 447 scm = force_elstr(&elstr, el, 1, SCM_ARG1, func_name);
432 elstr = (struct elstr*) SCM_CDR(scm); 448 if (scm == el) {
449 scm = _elstr_dup(elstr);
450 elstr = (struct elstr*) SCM_CDR(scm);
451 }
433 } 452 }
@@ -484,9 +503,12 @@ _elstr_deaccent(SCM el, int destructive, const char *func_name)
484 503
485 SCM_ASSERT(scm_is_elstr(el), el, SCM_ARG1, func_name); 504 if (destructive) {
486 elstr = (struct elstr*) SCM_CDR(el); 505 SCM_ASSERT(scm_is_elstr(el), el, SCM_ARG1, func_name);
487 if (destructive)
488 scm = SCM_UNSPECIFIED; 506 scm = SCM_UNSPECIFIED;
489 else { 507 elstr = (struct elstr*) SCM_CDR(el);
490 scm = _elstr_dup(elstr); 508 } else {
491 elstr = (struct elstr*) SCM_CDR(scm); 509 scm = force_elstr(&elstr, el, 1, SCM_ARG1, func_name);
510 if (scm == el) {
511 scm = _elstr_dup(elstr);
512 elstr = (struct elstr*) SCM_CDR(scm);
513 }
492 } 514 }
@@ -528,5 +550,9 @@ _elstr_set_accent(SCM el, SCM n, int destructive, const char *func_name)
528 550
529 SCM_ASSERT(scm_is_elstr(el), el, SCM_ARG1, func_name); 551 if (destructive) {
552 SCM_ASSERT(scm_is_elstr(el), el, SCM_ARG1, func_name);
553 elstr = (struct elstr*) SCM_CDR(el);
554 } else
555 scm = force_elstr(&elstr, el, 1, SCM_ARG1, func_name);
556
530 SCM_ASSERT(scm_is_integer(n), n, SCM_ARG2, func_name); 557 SCM_ASSERT(scm_is_integer(n), n, SCM_ARG2, func_name);
531 elstr = (struct elstr*) SCM_CDR(el);
532 num = scm_to_uint(n); 558 num = scm_to_uint(n);
@@ -544,3 +570,3 @@ _elstr_set_accent(SCM el, SCM n, int destructive, const char *func_name)
544 scm = SCM_UNSPECIFIED; 570 scm = SCM_UNSPECIFIED;
545 else { 571 else if (scm == el) {
546 scm = _elstr_dup(elstr); 572 scm = _elstr_dup(elstr);
@@ -600,5 +626,4 @@ SCM_DEFINE_PUBLIC(scm_elstr_char_prop_bitmask, "elstr-char-prop-bitmask",
600 626
601 SCM_ASSERT(scm_is_elstr(el), el, SCM_ARG1, FUNC_NAME); 627 force_elstr(&elstr, el, 0, SCM_ARG1, FUNC_NAME);
602 SCM_ASSERT(scm_is_integer(n), n, SCM_ARG2, FUNC_NAME); 628 SCM_ASSERT(scm_is_integer(n), n, SCM_ARG2, FUNC_NAME);
603 elstr = (struct elstr*) SCM_CDR(el);
604 num = scm_to_int(n); 629 num = scm_to_int(n);
@@ -686,9 +711,12 @@ _elstr_thema_aoristoy(SCM el, int destructive, const char *func_name)
686 711
687 SCM_ASSERT(scm_is_elstr(el), el, SCM_ARG1, func_name); 712 if (destructive) {
688 elstr = (struct elstr*) SCM_CDR(el); 713 SCM_ASSERT(scm_is_elstr(el), el, SCM_ARG1, func_name);
689 if (destructive) 714 elstr = (struct elstr*) SCM_CDR(el);
690 scm = SCM_UNSPECIFIED; 715 scm = SCM_UNSPECIFIED;
691 else { 716 } else {
692 scm = _elstr_dup(elstr); 717 scm = force_elstr(&elstr, el, 1, SCM_ARG1, func_name);
693 elstr = (struct elstr*) SCM_CDR(scm); 718 if (scm == el) {
719 scm = _elstr_dup(elstr);
720 elstr = (struct elstr*) SCM_CDR(scm);
721 }
694 } 722 }
@@ -728,6 +756,9 @@ _elstr_slice(SCM el, SCM n, SCM l, int destructive, const char *func_name)
728 756
729 SCM_ASSERT(scm_is_elstr(el), el, SCM_ARG1, func_name); 757 if (destructive) {
758 SCM_ASSERT(scm_is_elstr(el), el, SCM_ARG1, func_name);
759 elstr = (struct elstr*) SCM_CDR(el);
760 } else