commit - 653c9a034fe0f81fd93cc7a1fb1bb385490de085
commit + 6844db842719f3b3d1405a7295b0f8ab84c44094
blob - 4ad6403751a877d20ad880618d6cc3fc93c6c61a
blob + b98e7c5c1f4ac347c52696e83aae56e2865c1994
--- TODO
+++ TODO
+ - use p_textobj to produce the input for act_txtobj() in pdf.c, which
+ implements the big text extraction algorithm. I don't want to replace that
+ yet; just touch it up enough to work with these new parsers.
+ - make sure that the content operators have all their appropriate semantic
+ actions and validations attached.
+ - make a test case out of the example at the end of 8.7.9 (A85 with a leading
+ comment) to test just that strange "leading comment/whitespace" rule.
+
- fix the object stream parser to split input at logical boundaries, as
provided by the object index ("N pairs of integers") at the beginning of the
stream data.
blob - 5b8edc168b34b51da9769b8fcbc23fddd03de632
blob + f570c5bccfbd8bb726e3c0933616ad1775ad437d
--- content.c
+++ content.c
/*
 * OP(SYM, PA, PN): declare the rule op_<SYM> via H_RULE. Its parser is
 * SEQ(PA, PN) wrapped in h_action, with act_op as the action and the
 * constant OP_<SYM> cast to (void *) as h_action's third argument.
 * NOTE(review): PA and PN look like the operand parser and the operator
 * keyword parser respectively -- confirm against the OP() uses.
 */
#define OP(SYM, PA, PN) \
H_RULE(op_ ## SYM, h_action(SEQ(PA, PN), act_op, (void *)OP_ ## SYM))
+ // XXX make sure that the operators below have all their appropriate
+ // semantic actions and validations attached.
+
/* compatibility operators (table 33) */
/* NOTE(review): eps is passed as PA here, presumably because BX and EX
 * take no operands -- confirm that eps matches empty input. */
OP(BX, eps, KWD("BX"));
OP(EX, eps, KWD("EX"));