summaryrefslogtreecommitdiffstats
path: root/app/HyphTool.cpp
blob: 730abadcbaf2b9658fdc896359b38314e46eb822 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
#include <stdio.h>
#include <sys/stat.h>
#include <string.h>

#include "utils/Log.h"

#include <vector>
#include <minikin/Hyphenator.h>

using android::Hyphenator;

Hyphenator* loadHybFile(const char* fn) {
    struct stat statbuf;
    int status = stat(fn, &statbuf);
    if (status < 0) {
        fprintf(stderr, "error opening %s\n", fn);
        return nullptr;
    }
    size_t size = statbuf.st_size;
    FILE* f = fopen(fn, "rb");
    if (f == NULL) {
        fprintf(stderr, "error opening %s\n", fn);
        return nullptr;
    }
    uint8_t* buf = new uint8_t[size];
    size_t read_size = fread(buf, 1, size, f);
    if (read_size < size) {
        fprintf(stderr, "error reading %s\n", fn);
        delete[] buf;
        return nullptr;
    }
    return Hyphenator::loadBinary(buf);
}

int main(int argc, char** argv) {
    Hyphenator* hyph = loadHybFile("/tmp/en.hyb");  // should also be configurable
    std::vector<uint8_t> result;
    std::vector<uint16_t> word;
    if (argc < 2) {
        fprintf(stderr, "usage: hyphtool word\n");
        return 1;
    }
    char* asciiword = argv[1];
    size_t len = strlen(asciiword);
    for (size_t i = 0; i < len; i++) {
        uint32_t c = asciiword[i];
        if (c == '-') {
            c = 0x00AD;
        }
        // ASCII (or possibly ISO Latin 1), but kinda painful to do utf conversion :(
        word.push_back(c);
    }
    hyph->hyphenate(&result, word.data(), word.size());
    for (size_t i = 0; i < len; i++) {
        if (result[i] != 0) {
            printf("-");
        }
        printf("%c", word[i]);
    }
    printf("\n");
    return 0;
}