#include #include #include #include #include "test_macros.h" #include #include #include static int test_lm_vals(ngram_model_t *model) { int32 n_used; TEST_ASSERT(model); TEST_EQUAL(ngram_wid(model, ""), 0); TEST_EQUAL(strcmp(ngram_word(model, 0), ""), 0); TEST_EQUAL(ngram_wid(model, "absolute"), 13); TEST_EQUAL(strcmp(ngram_word(model, 13), "absolute"), 0); /* Test unigrams. */ TEST_EQUAL_LOG(ngram_score(model, "", NULL), -75346); TEST_EQUAL_LOG(ngram_bg_score(model, ngram_wid(model, ""), NGRAM_INVALID_WID, &n_used), -75346); TEST_EQUAL(n_used, 1); TEST_EQUAL_LOG(ngram_score(model, "sphinxtrain", NULL), -64208); TEST_EQUAL_LOG(ngram_bg_score(model, ngram_wid(model, "sphinxtrain"), NGRAM_INVALID_WID, &n_used), -64208); TEST_EQUAL(n_used, 1); printf("FOO %d\n", ngram_score(model, "huggins", "david", NULL)); printf("FOO %d\n", ngram_score(model, "daines", "huggins", "david", NULL)); /* Test bigrams. */ TEST_EQUAL_LOG(ngram_score(model, "huggins", "david", NULL), -831); /* Test trigrams. */ TEST_EQUAL_LOG(ngram_score(model, "daines", "huggins", "david", NULL), -9450); return 0; } int main(int argc, char *argv[]) { logmath_t *lmath; ngram_model_t *model; /* Initialize a logmath object to pass to ngram_read */ lmath = logmath_init(1.0001, 0, 0); E_INFO("Converting ARPA to BIN\n"); model = ngram_model_read(NULL, LMDIR "/100.lm.bz2", NGRAM_ARPA, lmath); test_lm_vals(model); TEST_EQUAL(0, ngram_model_write(model, "100.tmp.lm.bin", NGRAM_BIN)); ngram_model_free(model); E_INFO("Converting BIN to ARPA\n"); model = ngram_model_read(NULL, LMDIR "/100.lm.bin", NGRAM_BIN, lmath); test_lm_vals(model); TEST_EQUAL(0, ngram_model_write(model, "100.tmp.lm", NGRAM_ARPA)); ngram_model_free(model); E_INFO("Testing converted BIN\n"); model = ngram_model_read(NULL, "100.tmp.lm.bin", NGRAM_BIN, lmath); test_lm_vals(model); ngram_model_free(model); E_INFO("Testing converted ARPA\n"); model = ngram_model_read(NULL, "100.tmp.lm", NGRAM_ARPA, lmath); test_lm_vals(model); ngram_model_free(model); E_INFO("Converting ARPA back to BIN\n"); model = ngram_model_read(NULL, "100.tmp.lm", NGRAM_ARPA, lmath); test_lm_vals(model); TEST_EQUAL(0, ngram_model_write(model, "100.tmp.lm.bin", NGRAM_BIN)); ngram_model_free(model); E_INFO("Converting BIN back to ARPA\n"); model = ngram_model_read(NULL, "100.tmp.lm.bin", NGRAM_BIN, lmath); test_lm_vals(model); TEST_EQUAL(0, ngram_model_write(model, "100.tmp.lm", NGRAM_ARPA)); ngram_model_free(model); E_INFO("Converting unigram ARPA to BIN\n"); model = ngram_model_read(NULL, LMDIR "/turtle.ug.lm", NGRAM_ARPA, lmath); TEST_EQUAL(0, ngram_model_write(model, "turtle.ug.tmp.lm.bin", NGRAM_BIN)); ngram_model_free(model); logmath_free(lmath); return 0; }