commit 6844db842719f3b3d1405a7295b0f8ab84c44094
from: Sven M. Hallberg
date: Sun Jul 02 15:51:55 2023 UTC

content stream todos

commit - 653c9a034fe0f81fd93cc7a1fb1bb385490de085
commit + 6844db842719f3b3d1405a7295b0f8ab84c44094
blob - 4ad6403751a877d20ad880618d6cc3fc93c6c61a
blob + b98e7c5c1f4ac347c52696e83aae56e2865c1994
--- TODO
+++ TODO
@@ -1,3 +1,11 @@
+ - use p_textobj to produce the input for act_txtobj() in pdf.c which
+   implements the big text extraction algorithm. i don't want to replace that,
+   yet, just touch it up enough to work with these new parsers.
+ - make sure that the content operators have all their appropriate semantic
+   actions and validations attached.
+ - make a test case out of the example at the end of 8.7.9 (A85 with a leading
+   comment) to test just that strange "leading comment/whitespace" rule.
+
  - fix the object stream parser to split input at logical boundaries, as
    provided by the object index ("N pairs of integers") at the beginning of the
    stream data.
blob - 5b8edc168b34b51da9769b8fcbc23fddd03de632
blob + f570c5bccfbd8bb726e3c0933616ad1775ad437d
--- content.c
+++ content.c
@@ -286,6 +286,9 @@ init_content_parser(void)
 	#define OP(SYM, PA, PN) \
 		H_RULE(op_ ## SYM, h_action(SEQ(PA, PN), act_op, (void *)OP_ ## SYM))
 
+	// XXX make sure that the operators below have all their appropriate
+	// semantic actions and validations attached.
+
 	/* compatibility operators (table 33) */
 	OP(BX, eps, KWD("BX"));
 	OP(EX, eps, KWD("EX"));