// Issue 521 attachment: text-extract.cc (618 bytes)

#include "fpdf_text.h"
#include "fpdfview.h"

int main(int argc, char **argv) {
FPDF_InitLibrary();
FPDF_DOCUMENT doc = FPDF_LoadDocument(argv[1], NULL);
for (int i = 0; i < FPDF_GetPageCount(doc); i++) {
FPDF_PAGE page = FPDF_LoadPage(doc, i);
FPDF_TEXTPAGE textpage = FPDFText_LoadPage(page);
for (int j = 0; j <= FPDFText_CountChars(textpage); j++) {
unsigned int c = FPDFText_GetUnicode(textpage, j);
LOG(INFO) << "XXX character extracted: " << c;
}
FPDFText_ClosePage(textpage);
FPDF_ClosePage(page);
}
FPDF_CloseDocument(doc);
FPDF_DestroyLibrary();
return 0;
}