From e2b81ba87a27aa0e68a8971f8627dc91a4e77551 Mon Sep 17 00:00:00 2001 From: Bradley Skaggs Date: Sat, 6 Oct 2018 18:42:34 -0400 Subject: [PATCH] Fix file format documentation - document count and sizes are actually int64_t --- preprocess/dump_binary.cpp | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/preprocess/dump_binary.cpp b/preprocess/dump_binary.cpp index 89d172a..d626fbb 100755 --- a/preprocess/dump_binary.cpp +++ b/preprocess/dump_binary.cpp @@ -19,8 +19,8 @@ namespace lightlda { /* * Output file format: - * 1, the first 4 byte indicates the number of docs in this block - * 2, the 4 * (doc_num + 1) bytes indicate the offset of reach doc + * 1, the first 8 bytes indicate the number of docs in this block + * 2, the 8 * (doc_num + 1) bytes indicate the offset of each doc * an example * 3 // there are 3 docs in this block * 0 // the offset of the 1-st doc