From 5a3b58d9dc997ef5ed1dfc5d41f1fe288c9c2765 Mon Sep 17 00:00:00 2001 From: Pompolic <pompolic@special-circumstanc.es> Date: Thu, 20 Feb 2020 22:09:27 +0100 Subject: [PATCH] Return HBytes Also a fix for a bug causing only one run to be parsed --- pdf.c | 37 +++++++++++++++++++++++++++++++++---- 1 file changed, 33 insertions(+), 4 deletions(-) diff --git a/pdf.c b/pdf.c index 06f920b..e053d85 100644 --- a/pdf.c +++ b/pdf.c @@ -456,7 +456,17 @@ act_dict_(const HParseResult *p, void *env) #define act_array_ h_act_flatten HParsedToken * -act_longlength(const HParseResult *p, void *env) +act_shortlength(const HParseResult *p, void *u) +{ + uint8_t length = H_CAST_UINT(p->ast); + /* Length can range from 0-127, corresponding to the range 1-128, inclusive */ + uint8_t finallength = length+1; + + return H_MAKE_UINT(finallength); +} + +HParsedToken * +act_longlength(const HParseResult *p, void *u) { uint8_t length = H_CAST_UINT(p->ast); uint8_t finallength = 257-length; @@ -465,7 +475,7 @@ act_longlength(const HParseResult *p, void *env) } HParsedToken * -act_longrun(const HParseResult *p, void *env) +act_longrun(const HParseResult *p, void *u) { HCountedArray *seq = H_CAST_SEQ(p->ast); HParsedToken **elements = h_seq_elements(p->ast); @@ -482,6 +492,25 @@ act_longrun(const HParseResult *p, void *env) return res; } +HParsedToken * +act_rldstring(const HParseResult *p, void *u) +{ + HCountedArray *seq = H_CAST_SEQ(p->ast); + const HCountedArray *flattened_seq = h_seq_flatten(p->arena, p->ast); + uint8_t bytes_required; + uint8_t *result_bytes; + + bytes_required = flattened_seq->used - 1; + result_bytes = h_arena_malloc(p->arena, sizeof(uint8_t) * bytes_required); + + for (size_t i = 0; i < flattened_seq->used-1; ++i) + { + result_bytes[i] = H_CAST_UINT(flattened_seq->elements[i]); + } + + return H_MAKE_BYTES(result_bytes, bytes_required); +} + /* * input grammar */ @@ -503,7 +532,7 @@ init_runlengthdecode_parser(struct Env *aux) { H_RULE(rldeod, h_ch(0x80)); H_ARULE(longlength, h_ch_range(0x81, 0xFF)); - H_RULE(shortlength, h_ch_range(0x1, 0x7F)); + H_ARULE(shortlength, h_ch_range(0x0, 0x7F)); H_RULE(shortdata, h_uint8()); H_RULE(longdata, h_uint8()); @@ -511,7 +540,7 @@ init_runlengthdecode_parser(struct Env *aux) H_RULE(shortrun, h_length_value(shortlength, shortdata)); H_ARULE(longrun, SEQ(longlength, longdata)); - H_RULE(rldstring, SEQ(CHX(shortrun, longrun), IGN(rldeod))); + H_ARULE(rldstring, SEQ(h_many(CHX(shortrun, longrun)), IGN(rldeod))); p_rldstring = rldstring; } -- GitLab