nlsplit

split natural language text into chunks at reasonable language boundaries
git clone https://a3nm.net/git/nlsplit/
Log | Files | Refs | README

commit 13ceb6bcc1c89f533d9ab3ccb19de9a060870e2a
parent 209fe4f6ff1c99fe5476f09581e50fa3bd2f8eae
Author: Antoine Amarilli <a3nm@a3nm.net>
Date:   Mon, 10 Oct 2011 00:09:02 +0200

change format

Diffstat:
nlsplit.c | 2+-
nlsplit_read.c | 2+-
2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/nlsplit.c b/nlsplit.c
@@ -207,7 +207,7 @@ int split() {
       points[hd].position = offset + pos;
     }
     //printf("== %d %d\n", offset, pos);
-    printf("-- piece %d length %ld confidence %f\n",
+    printf("-- chunk %d length %ld confidence %f\n",
         npiece, points[hd].position - offset, points[hd].confidence);
     /* output the data */
     for (i = offset; i < points[hd].position ; i++)
diff --git a/nlsplit_read.c b/nlsplit_read.c
@@ -42,7 +42,7 @@ int main(int argc, char **argv) {
     return E_MEMORY;
   }
 
-  while (scanf("-- piece %d length %d confidence %f",
+  while (scanf("-- chunk %d length %d confidence %f",
         &piece, &length, &confidence) == 3) {
     assert(piece == last_piece + 1);
     assert(length > 0);