Files
neuron/dist/morphology-cop.c
will.anderson 48ecd83421 fix: restore elb build — import paths, morphology deps, C master declarations header
- Fix wrong ELP import paths in soul.el, elp-input.el, studio.el
  (../foundation/elp/src → ../foundation/el/elp/src)
- Add missing import "morphology.el" to all 29 language morphology modules
- Recompile all affected dist/*.c with correct cross-module declarations
- Add dist/elp-c-decls.h: C-level master forward declarations for ELP package
  (enables elb --force-include to resolve undeclared cross-module calls)
2026-05-08 19:43:57 -05:00

557 lines
16 KiB
C

#include <stdint.h>
#include <stdlib.h>
#include "el_runtime.h"
el_val_t str_ends(el_val_t s, el_val_t suf);
el_val_t str_last_char(el_val_t s);
el_val_t str_last2(el_val_t s);
el_val_t str_last3(el_val_t s);
el_val_t str_drop_last(el_val_t s, el_val_t n);
el_val_t is_vowel(el_val_t c);
el_val_t morph_apply_suffix(el_val_t base, el_val_t suffix);
el_val_t en_irregular_plural(el_val_t word);
el_val_t en_irregular_singular(el_val_t word);
el_val_t en_irregular_verb(el_val_t base);
el_val_t en_verb_3sg(el_val_t base);
el_val_t en_should_double_final(el_val_t base);
el_val_t en_verb_past(el_val_t base);
el_val_t en_verb_gerund(el_val_t base);
el_val_t en_pluralize_regular(el_val_t singular);
el_val_t en_verb_form(el_val_t base, el_val_t tense, el_val_t person, el_val_t number);
el_val_t agree_determiner(el_val_t det, el_val_t noun);
el_val_t morph_pluralize(el_val_t noun, el_val_t profile);
el_val_t morph_map_canonical(el_val_t verb, el_val_t code);
el_val_t morph_conjugate(el_val_t verb, el_val_t tense, el_val_t person, el_val_t number, el_val_t profile);
el_val_t morph_inflect(el_val_t word, el_val_t features, el_val_t profile);
el_val_t pluralize(el_val_t singular);
el_val_t singularize(el_val_t plural);
el_val_t verb_form(el_val_t base, el_val_t tense, el_val_t person, el_val_t number);
el_val_t irregular_plural(el_val_t word);
el_val_t irregular_singular(el_val_t word);
el_val_t cop_str_ends(el_val_t s, el_val_t suf);
el_val_t cop_str_len(el_val_t s);
el_val_t cop_drop(el_val_t s, el_val_t n);
el_val_t cop_last_char(el_val_t s);
el_val_t cop_slot(el_val_t person, el_val_t number);
el_val_t cop_subject_prefix(el_val_t person, el_val_t number);
el_val_t cop_subject_prefix_gendered(el_val_t person, el_val_t gender, el_val_t number);
el_val_t cop_copula_particle(el_val_t gender, el_val_t number);
el_val_t cop_shwpe_present(el_val_t prefix);
el_val_t cop_shwpe_perfect(el_val_t prefix);
el_val_t cop_shwpe_future(el_val_t prefix);
el_val_t cop_bwk_present(el_val_t prefix);
el_val_t cop_bwk_perfect(el_val_t prefix);
el_val_t cop_bwk_future(el_val_t prefix);
el_val_t cop_nau_present(el_val_t prefix);
el_val_t cop_nau_perfect(el_val_t prefix);
el_val_t cop_nau_future(el_val_t prefix);
el_val_t cop_jw_present(el_val_t prefix);
el_val_t cop_jw_perfect(el_val_t prefix);
el_val_t cop_jw_future(el_val_t prefix);
el_val_t cop_di_present(el_val_t prefix);
el_val_t cop_di_perfect(el_val_t prefix);
el_val_t cop_di_future(el_val_t prefix);
el_val_t cop_is_copula(el_val_t verb);
el_val_t cop_known_verb_prefixed(el_val_t verb, el_val_t tense, el_val_t prefix);
el_val_t cop_regular_present(el_val_t prefix, el_val_t stem);
el_val_t cop_regular_perfect(el_val_t prefix, el_val_t stem);
el_val_t cop_regular_future(el_val_t prefix, el_val_t stem);
el_val_t cop_conjugate(el_val_t verb, el_val_t tense, el_val_t person, el_val_t number);
el_val_t cop_article(el_val_t gender, el_val_t number, el_val_t definite);
el_val_t cop_decline(el_val_t noun, el_val_t gram_case, el_val_t number);
el_val_t cop_noun_phrase(el_val_t noun, el_val_t gram_case, el_val_t number, el_val_t definite);
el_val_t cop_noun_phrase_gendered(el_val_t noun, el_val_t gram_case, el_val_t number, el_val_t definite, el_val_t gender);
el_val_t cop_map_canonical(el_val_t verb);
el_val_t cop_str_ends(el_val_t s, el_val_t suf) {
return str_ends_with(s, suf);
return 0;
}
el_val_t cop_str_len(el_val_t s) {
return str_len(s);
return 0;
}
el_val_t cop_drop(el_val_t s, el_val_t n) {
el_val_t len = str_len(s);
if (n >= len) {
return EL_STR("");
}
return str_slice(s, 0, (len - n));
return 0;
}
el_val_t cop_last_char(el_val_t s) {
el_val_t n = str_len(s);
if (n == 0) {
return EL_STR("");
}
return str_slice(s, (n - 1), n);
return 0;
}
el_val_t cop_slot(el_val_t person, el_val_t number) {
if (str_eq(person, EL_STR("first"))) {
if (str_eq(number, EL_STR("singular"))) {
return 0;
}
return 3;
}
if (str_eq(person, EL_STR("second"))) {
if (str_eq(number, EL_STR("singular"))) {
return 1;
}
return 4;
}
if (str_eq(number, EL_STR("singular"))) {
return 2;
}
return 5;
return 0;
}
el_val_t cop_subject_prefix(el_val_t person, el_val_t number) {
if (str_eq(person, EL_STR("first"))) {
if (str_eq(number, EL_STR("singular"))) {
return EL_STR("\xe2\xb2\x81");
}
return EL_STR("\xe2\xb2\x9b");
}
if (str_eq(person, EL_STR("second"))) {
if (str_eq(number, EL_STR("singular"))) {
return EL_STR("\xe2\xb2\x95");
}
return EL_STR("\xe2\xb2\xa7\xe2\xb2\x89\xe2\xb2\xa7\xe2\xb2\x89\xe2\xb2\x9b");
}
if (str_eq(number, EL_STR("singular"))) {
return EL_STR("\xcf\xa5");
}
return EL_STR("\xe2\xb2\xa5\xe2\xb2\x89");
return 0;
}
el_val_t cop_subject_prefix_gendered(el_val_t person, el_val_t gender, el_val_t number) {
if (str_eq(person, EL_STR("first"))) {
if (str_eq(number, EL_STR("singular"))) {
return EL_STR("\xe2\xb2\x81");
}
return EL_STR("\xe2\xb2\x9b");
}
if (str_eq(person, EL_STR("second"))) {
if (str_eq(number, EL_STR("singular"))) {
if (str_eq(gender, EL_STR("f"))) {
return EL_STR("\xe2\xb2\xa7\xe2\xb2\x89");
}
return EL_STR("\xe2\xb2\x95");
}
return EL_STR("\xe2\xb2\xa7\xe2\xb2\x89\xe2\xb2\xa7\xe2\xb2\x89\xe2\xb2\x9b");
}
if (str_eq(number, EL_STR("singular"))) {
if (str_eq(gender, EL_STR("f"))) {
return EL_STR("\xe2\xb2\xa5");
}
return EL_STR("\xcf\xa5");
}
return EL_STR("\xe2\xb2\xa5\xe2\xb2\x89");
return 0;
}
el_val_t cop_copula_particle(el_val_t gender, el_val_t number) {
if (str_eq(number, EL_STR("plural"))) {
return EL_STR("\xe2\xb2\x9b\xe2\xb2\x89");
}
if (str_eq(gender, EL_STR("f"))) {
return EL_STR("\xe2\xb2\xa7\xe2\xb2\x89");
}
return EL_STR("\xe2\xb2\xa1\xe2\xb2\x89");
return 0;
}
el_val_t cop_shwpe_present(el_val_t prefix) {
return el_str_concat(prefix, EL_STR("\xcf\xa3\xe2\xb2\x9f\xe2\xb2\x9f\xe2\xb2\xa1"));
return 0;
}
el_val_t cop_shwpe_perfect(el_val_t prefix) {
return el_str_concat(el_str_concat(EL_STR("\xe2\xb2\x81"), prefix), EL_STR("\xcf\xa3\xe2\xb2\xb1\xe2\xb2\xa1\xe2\xb2\x89"));
return 0;
}
el_val_t cop_shwpe_future(el_val_t prefix) {
return el_str_concat(prefix, EL_STR("\xe2\xb2\x9b\xe2\xb2\x81\xcf\xa3\xe2\xb2\xb1\xe2\xb2\xa1\xe2\xb2\x89"));
return 0;
}
el_val_t cop_bwk_present(el_val_t prefix) {
return el_str_concat(prefix, EL_STR("\xe2\xb2\x83\xe2\xb2\xb1\xe2\xb2\x95"));
return 0;
}
el_val_t cop_bwk_perfect(el_val_t prefix) {
return el_str_concat(el_str_concat(EL_STR("\xe2\xb2\x81"), prefix), EL_STR("\xe2\xb2\x83\xe2\xb2\xb1\xe2\xb2\x95"));
return 0;
}
el_val_t cop_bwk_future(el_val_t prefix) {
return el_str_concat(prefix, EL_STR("\xe2\xb2\x9b\xe2\xb2\x81\xe2\xb2\x83\xe2\xb2\xb1\xe2\xb2\x95"));
return 0;
}
el_val_t cop_nau_present(el_val_t prefix) {
return el_str_concat(prefix, EL_STR("\xe2\xb2\x9b\xe2\xb2\x81\xe2\xb2\xa9"));
return 0;
}
el_val_t cop_nau_perfect(el_val_t prefix) {
return el_str_concat(el_str_concat(EL_STR("\xe2\xb2\x81"), prefix), EL_STR("\xe2\xb2\x9b\xe2\xb2\x81\xe2\xb2\xa9"));
return 0;
}
el_val_t cop_nau_future(el_val_t prefix) {
return el_str_concat(prefix, EL_STR("\xe2\xb2\x9b\xe2\xb2\x81\xe2\xb2\x9b\xe2\xb2\x81\xe2\xb2\xa9"));
return 0;
}
el_val_t cop_jw_present(el_val_t prefix) {
return el_str_concat(prefix, EL_STR("\xcf\xab\xe2\xb2\xb1"));
return 0;
}
el_val_t cop_jw_perfect(el_val_t prefix) {
return el_str_concat(el_str_concat(EL_STR("\xe2\xb2\x81"), prefix), EL_STR("\xcf\xab\xe2\xb2\xb1"));
return 0;
}
el_val_t cop_jw_future(el_val_t prefix) {
return el_str_concat(prefix, EL_STR("\xe2\xb2\x9b\xe2\xb2\x81\xcf\xab\xe2\xb2\xb1"));
return 0;
}
el_val_t cop_di_present(el_val_t prefix) {
return el_str_concat(prefix, EL_STR("\xcf\xaf"));
return 0;
}
el_val_t cop_di_perfect(el_val_t prefix) {
return el_str_concat(el_str_concat(EL_STR("\xe2\xb2\x81"), prefix), EL_STR("\xcf\xaf"));
return 0;
}
el_val_t cop_di_future(el_val_t prefix) {
return el_str_concat(prefix, EL_STR("\xe2\xb2\x9b\xe2\xb2\x81\xcf\xaf"));
return 0;
}
el_val_t cop_is_copula(el_val_t verb) {
if (str_eq(verb, EL_STR("\xcf\xa3\xcf\x89\xcf\x80\xce\xb5"))) {
return 1;
}
if (str_eq(verb, EL_STR("shwpe"))) {
return 1;
}
if (str_eq(verb, EL_STR("be"))) {
return 1;
}
return 0;
return 0;
}
el_val_t cop_known_verb_prefixed(el_val_t verb, el_val_t tense, el_val_t prefix) {
if (str_eq(verb, EL_STR("\xcf\xa3\xcf\x89\xcf\x80\xce\xb5"))) {
if (str_eq(tense, EL_STR("present"))) {
return cop_shwpe_present(prefix);
}
if (str_eq(tense, EL_STR("past"))) {
return cop_shwpe_perfect(prefix);
}
if (str_eq(tense, EL_STR("future"))) {
return cop_shwpe_future(prefix);
}
return cop_shwpe_present(prefix);
}
if (str_eq(verb, EL_STR("shwpe"))) {
if (str_eq(tense, EL_STR("present"))) {
return cop_shwpe_present(prefix);
}
if (str_eq(tense, EL_STR("past"))) {
return cop_shwpe_perfect(prefix);
}
if (str_eq(tense, EL_STR("future"))) {
return cop_shwpe_future(prefix);
}
return cop_shwpe_present(prefix);
}
if (str_eq(verb, EL_STR("bwk"))) {
if (str_eq(tense, EL_STR("present"))) {
return cop_bwk_present(prefix);
}
if (str_eq(tense, EL_STR("past"))) {
return cop_bwk_perfect(prefix);
}
if (str_eq(tense, EL_STR("future"))) {
return cop_bwk_future(prefix);
}
return cop_bwk_present(prefix);
}
if (str_eq(verb, EL_STR("\xe2\xb2\x83\xe2\xb2\xb1\xe2\xb2\x95"))) {
if (str_eq(tense, EL_STR("present"))) {
return cop_bwk_present(prefix);
}
if (str_eq(tense, EL_STR("past"))) {
return cop_bwk_perfect(prefix);
}
if (str_eq(tense, EL_STR("future"))) {
return cop_bwk_future(prefix);
}
return cop_bwk_present(prefix);
}
if (str_eq(verb, EL_STR("go"))) {
if (str_eq(tense, EL_STR("present"))) {
return cop_bwk_present(prefix);
}
if (str_eq(tense, EL_STR("past"))) {
return cop_bwk_perfect(prefix);
}
if (str_eq(tense, EL_STR("future"))) {
return cop_bwk_future(prefix);
}
return cop_bwk_present(prefix);
}
if (str_eq(verb, EL_STR("nau"))) {
if (str_eq(tense, EL_STR("present"))) {
return cop_nau_present(prefix);
}
if (str_eq(tense, EL_STR("past"))) {
return cop_nau_perfect(prefix);
}
if (str_eq(tense, EL_STR("future"))) {
return cop_nau_future(prefix);
}
return cop_nau_present(prefix);
}
if (str_eq(verb, EL_STR("\xe2\xb2\x9b\xe2\xb2\x81\xe2\xb2\xa9"))) {
if (str_eq(tense, EL_STR("present"))) {
return cop_nau_present(prefix);
}
if (str_eq(tense, EL_STR("past"))) {
return cop_nau_perfect(prefix);
}
if (str_eq(tense, EL_STR("future"))) {
return cop_nau_future(prefix);
}
return cop_nau_present(prefix);
}
if (str_eq(verb, EL_STR("see"))) {
if (str_eq(tense, EL_STR("present"))) {
return cop_nau_present(prefix);
}
if (str_eq(tense, EL_STR("past"))) {
return cop_nau_perfect(prefix);
}
if (str_eq(tense, EL_STR("future"))) {
return cop_nau_future(prefix);
}
return cop_nau_present(prefix);
}
if (str_eq(verb, EL_STR("jw"))) {
if (str_eq(tense, EL_STR("present"))) {
return cop_jw_present(prefix);
}
if (str_eq(tense, EL_STR("past"))) {
return cop_jw_perfect(prefix);
}
if (str_eq(tense, EL_STR("future"))) {
return cop_jw_future(prefix);
}
return cop_jw_present(prefix);
}
if (str_eq(verb, EL_STR("\xcf\xab\xe2\xb2\xb1"))) {
if (str_eq(tense, EL_STR("present"))) {
return cop_jw_present(prefix);
}
if (str_eq(tense, EL_STR("past"))) {
return cop_jw_perfect(prefix);
}
if (str_eq(tense, EL_STR("future"))) {
return cop_jw_future(prefix);
}
return cop_jw_present(prefix);
}
if (str_eq(verb, EL_STR("say"))) {
if (str_eq(tense, EL_STR("present"))) {
return cop_jw_present(prefix);
}
if (str_eq(tense, EL_STR("past"))) {
return cop_jw_perfect(prefix);
}
if (str_eq(tense, EL_STR("future"))) {
return cop_jw_future(prefix);
}
return cop_jw_present(prefix);
}
if (str_eq(verb, EL_STR("di"))) {
if (str_eq(tense, EL_STR("present"))) {
return cop_di_present(prefix);
}
if (str_eq(tense, EL_STR("past"))) {
return cop_di_perfect(prefix);
}
if (str_eq(tense, EL_STR("future"))) {
return cop_di_future(prefix);
}
return cop_di_present(prefix);
}
if (str_eq(verb, EL_STR("\xcf\xaf"))) {
if (str_eq(tense, EL_STR("present"))) {
return cop_di_present(prefix);
}
if (str_eq(tense, EL_STR("past"))) {
return cop_di_perfect(prefix);
}
if (str_eq(tense, EL_STR("future"))) {
return cop_di_future(prefix);
}
return cop_di_present(prefix);
}
if (str_eq(verb, EL_STR("give"))) {
if (str_eq(tense, EL_STR("present"))) {
return cop_di_present(prefix);
}
if (str_eq(tense, EL_STR("past"))) {
return cop_di_perfect(prefix);
}
if (str_eq(tense, EL_STR("future"))) {
return cop_di_future(prefix);
}
return cop_di_present(prefix);
}
return EL_STR("");
return 0;
}
el_val_t cop_regular_present(el_val_t prefix, el_val_t stem) {
return el_str_concat(prefix, stem);
return 0;
}
el_val_t cop_regular_perfect(el_val_t prefix, el_val_t stem) {
return el_str_concat(el_str_concat(EL_STR("\xe2\xb2\x81"), prefix), stem);
return 0;
}
el_val_t cop_regular_future(el_val_t prefix, el_val_t stem) {
return el_str_concat(el_str_concat(prefix, EL_STR("\xe2\xb2\x9b\xe2\xb2\x81")), stem);
return 0;
}
el_val_t cop_conjugate(el_val_t verb, el_val_t tense, el_val_t person, el_val_t number) {
el_val_t prefix = cop_subject_prefix(person, number);
if (str_eq(verb, EL_STR("be"))) {
if (str_eq(tense, EL_STR("present"))) {
return EL_STR("");
}
if (str_eq(tense, EL_STR("past"))) {
return cop_shwpe_perfect(prefix);
}
if (str_eq(tense, EL_STR("future"))) {
return cop_shwpe_future(prefix);
}
return EL_STR("");
}
el_val_t known = cop_known_verb_prefixed(verb, tense, prefix);
if (!str_eq(known, EL_STR(""))) {
return known;
}
if (str_eq(tense, EL_STR("present"))) {
return cop_regular_present(prefix, verb);
}
if (str_eq(tense, EL_STR("past"))) {
return cop_regular_perfect(prefix, verb);
}
if (str_eq(tense, EL_STR("future"))) {
return cop_regular_future(prefix, verb);
}
return verb;
return 0;
}
el_val_t cop_article(el_val_t gender, el_val_t number, el_val_t definite) {
if (str_eq(definite, EL_STR("true"))) {
if (str_eq(number, EL_STR("plural"))) {
return EL_STR("\xe2\xb2\x9b");
}
if (str_eq(gender, EL_STR("f"))) {
return EL_STR("\xe2\xb2\xa7");
}
return EL_STR("\xe2\xb2\xa1");
}
if (str_eq(number, EL_STR("plural"))) {
return EL_STR("\xcf\xa9\xe2\xb2\x89\xe2\xb2\x9b");
}
return EL_STR("\xe2\xb2\x9f\xe2\xb2\xa9");
return 0;
}
el_val_t cop_decline(el_val_t noun, el_val_t gram_case, el_val_t number) {
if (str_eq(number, EL_STR("singular"))) {
return noun;
}
if (cop_str_ends(noun, EL_STR("\xe2\xb2\x89"))) {
el_val_t stem = cop_drop(noun, 1);
return el_str_concat(stem, EL_STR("\xe2\xb2\x9f\xe2\xb2\x9f\xe2\xb2\xa9\xe2\xb2\x89"));
}
return noun;
return 0;
}
el_val_t cop_noun_phrase(el_val_t noun, el_val_t gram_case, el_val_t number, el_val_t definite) {
el_val_t form = cop_decline(noun, gram_case, number);
el_val_t art = cop_article(EL_STR("m"), number, definite);
if (str_eq(definite, EL_STR("true"))) {
return el_str_concat(art, form);
}
if (str_eq(definite, EL_STR("false"))) {
return el_str_concat(art, form);
}
return form;
return 0;
}
el_val_t cop_noun_phrase_gendered(el_val_t noun, el_val_t gram_case, el_val_t number, el_val_t definite, el_val_t gender) {
el_val_t form = cop_decline(noun, gram_case, number);
el_val_t art = cop_article(gender, number, definite);
if (str_eq(definite, EL_STR("true"))) {
return el_str_concat(art, form);
}
if (str_eq(definite, EL_STR("false"))) {
return el_str_concat(art, form);
}
return form;
return 0;
}
el_val_t cop_map_canonical(el_val_t verb) {
if (str_eq(verb, EL_STR("be"))) {
return EL_STR("be");
}
if (str_eq(verb, EL_STR("go"))) {
return EL_STR("bwk");
}
if (str_eq(verb, EL_STR("see"))) {
return EL_STR("nau");
}
if (str_eq(verb, EL_STR("say"))) {
return EL_STR("jw");
}
if (str_eq(verb, EL_STR("speak"))) {
return EL_STR("jw");
}
if (str_eq(verb, EL_STR("give"))) {
return EL_STR("di");
}
return verb;
return 0;
}