clamav/libclamav/pdfdecode.c

/*
 *  Copyright (C) 2016 Cisco and/or its affiliates. All rights reserved.
 *
 *  Author: Kevin Lin
 *
 *  This program is free software; you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License version 2 as
 *  published by the Free Software Foundation.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU General Public License for more details.
 *
 *  You should have received a copy of the GNU General Public License
 *  along with this program; if not, write to the Free Software
 *  Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
 *  MA 02110-1301, USA.
 *
 *  In addition, as a special exception, the copyright holders give
 *  permission to link the code of portions of this program with the
 *  OpenSSL library under certain conditions as described in each
 *  individual source file, and distribute linked combinations
 *  including the two.
 *  
 *  You must obey the GNU General Public License in all respects
 *  for all of the code used other than OpenSSL.  If you modify
 *  file(s) with this exception, you may extend this exception to your
 *  version of the file(s), but you are not obligated to do so.  If you
 *  do not wish to do so, delete this exception statement from your
 *  version.  If you delete this exception statement from all source
 *  files in the program, then also delete it here.
 */

#if HAVE_CONFIG_H
#include "clamav-config.h"
#endif

#include <stdio.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <ctype.h>
#include <string.h>
#include <fcntl.h>
#include <stdlib.h>
#include <errno.h>
#ifdef	HAVE_LIMITS_H
#include <limits.h>
#endif
#ifdef	HAVE_UNISTD_H
#include <unistd.h>
#endif
#include <zlib.h>

#if HAVE_ICONV
#include <iconv.h>
#endif

#include "clamav.h"
#include "others.h"
#include "pdf.h"
#include "str.h"
#include "bytecode.h"
#include "bytecode_api.h"

struct pdf_token {
    uint32_t length;
    uint8_t *content;
};

static  int filter_ascii85decode(struct pdf_token *token);
//static  int filter_rldecode(struct pdf_token *token)
static  int filter_flatedecode(struct pdf_struct *pdf, struct pdf_obj *obj, struct pdf_token *token);
static  int filter_asciihexdecode(struct pdf_token *token);

static  int pdf_decodestream_internal(struct pdf_struct *pdf, struct pdf_obj *obj, struct pdf_token *token);

int pdf_decodestream(struct pdf_struct *pdf, struct pdf_obj *obj, const char *stream, uint32_t streamlen, int fout)
{
    struct pdf_token *token;
    int rc;

    if (!stream || fout < 0 || !obj->numfilters) {
        cli_dbgmsg("nothing to decode\n");
        return CL_ENULLARG;
    }

    token = cli_malloc(sizeof(struct pdf_token));
    if (!token)
        return CL_EMEM;

    token->content = cli_malloc(streamlen);
    if (!token->content) {
        free(token);
        return CL_EMEM;
    }
    memcpy(token->content, stream, streamlen);
    token->length = streamlen;

    rc = pdf_decodestream_internal(pdf, obj, token);

    if (rc == CL_SUCCESS) {
        cli_dbgmsg("cli_pdf: decoding SUCCESS!\n");

        if (!cli_checklimits("pdf", pdf->ctx, token->length, 0, 0))
            rc = cli_writen(fout, token->content, token->length);
    }

    free(token->content);
    free(token);
    return rc;
}

static int pdf_decodestream_internal(struct pdf_struct *pdf, struct pdf_obj *obj, struct pdf_token *token)
{
    int i, rc;

    cli_dbgmsg("cli_pdf: detected %lu filters applied\n", (long unsigned)(obj->numfilters));

    /* TODO - MAY BE SUBJECT TO CHANGE */
    for (i = 0; i < obj->numfilters; i++) {
        switch(obj->filterlist[i]) {
        case OBJ_FILTER_A85:
            cli_dbgmsg("cli_pdf: decoding [%d] => ASCII85DECODE\n", obj->filterlist[i]);
            rc = filter_ascii85decode(token);
            break;

        case OBJ_FILTER_FLATE:
            cli_dbgmsg("cli_pdf: decoding [%d] => FLATEDECODE\n", obj->filterlist[i]);
            rc = filter_flatedecode(pdf, obj, token);
            break;

        case OBJ_FILTER_AH:
            cli_dbgmsg("cli_pdf: decoding [%d] => ASCIIHEXDECODE\n", obj->filterlist[i]);
            rc = filter_asciihexdecode(token);
            break;

        case OBJ_FILTER_RL:
        case OBJ_FILTER_JPX:
        case OBJ_FILTER_DCT: //OBJ_FILTER_JBIG2
        case OBJ_FILTER_LZW:
        case OBJ_FILTER_FAX:
        case OBJ_FILTER_CRYPT:

        default:
            cli_warnmsg("cli_pdf: unknown filter type [%d].\n", obj->filterlist[i]);
            break;
        }

        /*TODO: check rc value*/
        /*TODO: check content field*/
        /*TODO: check length value*/
        /*IF INTERMEDIATE DUMPING - PUT HERE*/
    }

    return CL_SUCCESS;
}

static int filter_ascii85decode(struct pdf_token *token)
{
    uint8_t *decoded;
    uint32_t declen = 0;

    const uint8_t *ptr = (uint8_t *)token->content;
    uint32_t remaining = token->length;
    int quintet = 0, rc = CL_SUCCESS;
    uint64_t sum = 0;

    /* 5:4 decoding ratio - (5*length), ((length/5+1)*4), (((x+4)/5)*4) */
    if (!(decoded = (uint8_t *)cli_malloc(((remaining+4)/5)*4))) {
        cli_errmsg("cli_pdf: cannot allocate memory for decoded output\n");
        return CL_EMEM;
    }

    if(cli_memstr(ptr, remaining, "~>", 2) == NULL)
        cli_dbgmsg("cli_pdf: no EOF marker found\n");

    cli_dbgmsg("cli_pdf: %lu bytes remaining\n", (unsigned long)remaining);

    while (remaining > 0) {
        int byte = (remaining--) ? (int)*ptr++ : EOF;

        if((byte == '~') && (remaining > 0) && (*ptr == '>'))
            byte = EOF;

        if(byte >= '!' && byte <= 'u') {
            sum = (sum * 85) + ((uint32_t)byte - '!');
            if(++quintet == 5) {
                *decoded++ = (unsigned char)(sum >> 24);
                *decoded++ = (unsigned char)((sum >> 16) & 0xFF);
                *decoded++ = (unsigned char)((sum >> 8) & 0xFF);
                *decoded++ = (unsigned char)(sum & 0xFF);

                declen += 4;
                quintet = 0;
                sum = 0;
            }
        } else if(byte == 'z') {
            if(quintet) {
                cli_dbgmsg("cli_pdf: unexpected 'z'\n");
                rc = CL_EFORMAT;
                break;
            }

            *decoded++ = '\0';
            *decoded++ = '\0';
            *decoded++ = '\0';
            *decoded++ = '\0';

            declen += 4;
        } else if(byte == EOF) {
            cli_dbgmsg("cli_pdf: %d bytes remaining in last quintet\n", quintet);
            if(quintet) {
                int i;

                if(quintet == 1) {
                    cli_dbgmsg("cli_pdf: only 1 byte in last quintet\n");
                    rc = CL_EFORMAT;
                    break;
                }

                for(i = quintet; i < 5; i++)
                    sum *= 85;

                if(quintet > 1)
                    sum += (0xFFFFFF >> ((quintet - 2) * 8));

                for(i = 0; i < quintet - 1; i++)
                    *decoded++ = (uint8_t)((sum >> (24 - 8 * i)) & 0xFF);
                declen += quintet-1;
            }

            break;
        } else if(!isspace(byte)) {
            cli_dbgmsg("cli_pdf: invalid character 0x%x @ %lu\n",
                       byte & 0xFF, (unsigned long)(token->length-remaining));

            rc = CL_EFORMAT;
            break;
        }
    }

    if (rc == CL_SUCCESS) {
        free(token->content);

        cli_dbgmsg("cli_pdf: deflated %lu bytes from %lu total bytes\n",
                   (unsigned long)declen, (unsigned long)(token->length));

        token->content = decoded;
        token->length = declen;
    } else {
        cli_errmsg("cli_pdf: error occurred parsing byte %lu of %lu\n",
                   (unsigned long)(token->length-remaining), (unsigned long)(token->length));
        free(decoded);
    }
    return rc;
}

/*
static int filter_rldecode(struct pdf_token *token)
{
}
*/

static uint8_t *decode_nextlinestart(uint8_t *content, uint32_t length)
{
    uint8_t *pt = content;
    uint32_t r;
    int toggle = 0;

    for (r = 0; r < length; r++, pt++) {
        if (*pt == '\n' || *pt == '\r')
            toggle = 1;
        else if (toggle)
            break;
    }

    return pt;
}

static int filter_flatedecode(struct pdf_struct *pdf, struct pdf_obj *obj, struct pdf_token *token)
{
    uint8_t *decoded, *temp;
    uint32_t declen = 0, capacity = 0;

    uint8_t *content = (uint8_t *)token->content;
    uint32_t length = token->length;
    z_stream stream;
    int zstat, skip = 0, rc = CL_SUCCESS;

    if (length == 0)
        return CL_CLEAN;

    if (*content == '\r') {
        content++;
        length--;
        //pdfobj_flag(pdf, obj, BAD_STREAMSTART);
        /* PDF spec says stream is followed by \r\n or \n, but not \r alone.
         * Sample 0015315109, it has \r followed by zlib header.
         * Flag pdf as suspicious, and attempt to extract by skipping the \r.
         */
        if (!length)
            return CL_CLEAN;
    }

    if (!(decoded = (uint8_t *)cli_calloc(BUFSIZ, sizeof(uint8_t)))) {
        cli_errmsg("cli_pdf: cannot allocate memory for decoded output\n");
        return CL_EMEM;
    }
    capacity = BUFSIZ;

    memset(&stream, 0, sizeof(stream));
    stream.next_in = (Bytef *)content;
    stream.avail_in = length;
    stream.next_out = (Bytef *)decoded;
    stream.avail_out = BUFSIZ;

    zstat = inflateInit(&stream);
    if(zstat != Z_OK) {
        cli_warnmsg("cli_pdf: inflateInit failed\n");
        free(decoded);
        return CL_EMEM;
    }

    /* initial inflate */
    zstat = inflate(&stream, Z_NO_FLUSH);
    /* check if nothing written whatsoever */
    if ((zstat != Z_OK) && (stream.avail_out == BUFSIZ)) {
        /* skip till EOL, and try inflating from there, sometimes
         * PDFs contain extra whitespace */
        uint8_t *q = decode_nextlinestart(content, length);
        if (q) {
            (void)inflateEnd(&stream);
            length -= q - content;
            content = q;

            stream.next_in = (Bytef *)content;
            stream.avail_in = length;
            stream.next_out = (Bytef *)decoded;
            stream.avail_out = capacity;

            zstat = inflateInit(&stream);
            if(zstat != Z_OK) {
                cli_warnmsg("cli_pdf: inflateInit failed\n");
                free(decoded);
                return CL_EMEM;
            }

            //pdfobj_flag(pdf, obj, BAD_FLATESTART);
        }

        zstat = inflate(&stream, Z_NO_FLUSH);
    }

    while (zstat == Z_OK && stream.avail_in) {
        /* extend output capacity if needed, TODO - limit check */
        if(stream.avail_out == 0) {
            if(stream.avail_out == 0) {
                if (!(temp = cli_realloc(decoded, capacity + BUFSIZ))) {
                    cli_errmsg("cli_pdf: cannot reallocate memory for decoded output\n");
                    rc = CL_EMEM;
                    break;
                }
                decoded = temp;
                stream.next_out = decoded + capacity;
                stream.avail_out = BUFSIZ;
                declen += BUFSIZ;
                capacity += BUFSIZ;
            }
        }

        /* continue inflation */
        zstat = inflate(&stream, Z_NO_FLUSH);
    }

    /* add stream end fragment to decoded length */
    declen += (BUFSIZ - stream.avail_out);

    /* error handling */
    switch(zstat) {
    case Z_OK:
        cli_dbgmsg("cli_pdf: Z_OK on stream inflation completion\n");
        /* intentional fall-through */
    case Z_STREAM_END:
        cli_dbgmsg("cli_pdf: inflated %lu bytes from %lu total bytes (%lu bytes remaining)\n",
                   (unsigned long)declen, (unsigned long)(token->length), (unsigned long)(stream.avail_in));
        break;

    /* potentially fatal - *mostly* ignored as per older version */
    case Z_STREAM_ERROR:
    case Z_NEED_DICT:
    case Z_DATA_ERROR:
    case Z_MEM_ERROR:
    default:
        if(stream.msg)
            cli_dbgmsg("cli_pdf: after writing %lu bytes, got error \"%s\" inflating PDF stream in %u %u obj\n",
                       (unsigned long)declen, stream.msg, obj->id>>8, obj->id&0xff);
        else
            cli_dbgmsg("cli_pdf: after writing %lu bytes, got error %d inflating PDF stream in %u %u obj\n",
                       (unsigned long)declen, zstat, obj->id>>8, obj->id&0xff);

        if (declen == 0) {
            //pdfobj_flag(pdf, obj, BAD_FLATESTART);
            cli_dbgmsg("cli_pdf: no bytes were inflated.\n");

            rc = CL_EFORMAT;
        } else {
            //pdfobj_flag(pdf, obj, BAD_FLATE);
        }
        break;
    }

    (void)inflateEnd(&stream);

    if (rc == CL_SUCCESS) {
        free(token->content);

        token->content = decoded;
        token->length = declen;
    } else {
        cli_errmsg("cli_pdf: error occurred parsing byte %lu of %lu\n",
                   (unsigned long)(length-stream.avail_in), (unsigned long)(token->length));
        free(decoded);
    }

    return rc;
}

static int filter_asciihexdecode(struct pdf_token *token)
{
    uint8_t *decoded;

    const uint8_t *content = (uint8_t *)token->content;
    uint32_t length = token->length;
    uint32_t i, j;
    int rc = CL_SUCCESS;

    if (!(decoded = (uint8_t *)cli_calloc(length/2 + 1, sizeof(uint8_t)))) {
        cli_errmsg("cli_pdf: cannot allocate memory for decoded output\n");
        return CL_EMEM;
    }

    for (i = 0, j = 0; i+1 < length; i++) {
        if (content[i] == ' ')
            continue;

        if (content[i] == '>')
            break;

        if (cli_hex2str_to(content+i, decoded+j, 2) == -1) {
            if (length - i < 4)
                continue;

            rc = CL_EFORMAT;
            break;
        }

        i++;
        j++;
    }

    if (rc == CL_SUCCESS) {
        free(token->content);

        cli_dbgmsg("cli_pdf: deflated %lu bytes from %lu total bytes\n",
                   (unsigned long)j, (unsigned long)(token->length));

        token->content = decoded;
        token->length = j;
    } else {
        cli_errmsg("cli_pdf: error occurred parsing byte %lu of %lu\n",
                   (unsigned long)i, (unsigned long)(token->length));
        free(decoded);
    }
    return rc;
}
pdfdecode: add new source for stream decoding (ascii85, asciihex, flate) 2016-03-28 11:53:40 -04:00			`/*`
			`* Copyright (C) 2016 Cisco and/or its affiliates. All rights reserved.`
			`*`
			`* Author: Kevin Lin`
			`*`
			`* This program is free software; you can redistribute it and/or modify`
			`* it under the terms of the GNU General Public License version 2 as`
			`* published by the Free Software Foundation.`
			`*`
			`* This program is distributed in the hope that it will be useful,`
			`* but WITHOUT ANY WARRANTY; without even the implied warranty of`
			`* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the`
			`* GNU General Public License for more details.`
			`*`
			`* You should have received a copy of the GNU General Public License`
			`* along with this program; if not, write to the Free Software`
			`* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,`
			`* MA 02110-1301, USA.`
			`*`
			`* In addition, as a special exception, the copyright holders give`
			`* permission to link the code of portions of this program with the`
			`* OpenSSL library under certain conditions as described in each`
			`* individual source file, and distribute linked combinations`
			`* including the two.`
			`*`
			`* You must obey the GNU General Public License in all respects`
			`* for all of the code used other than OpenSSL. If you modify`
			`* file(s) with this exception, you may extend this exception to your`
			`* version of the file(s), but you are not obligated to do so. If you`
			`* do not wish to do so, delete this exception statement from your`
			`* version. If you delete this exception statement from all source`
			`* files in the program, then also delete it here.`
			`*/`

			`#if HAVE_CONFIG_H`
			`#include "clamav-config.h"`
			`#endif`

			`#include <stdio.h>`
			`#include <sys/types.h>`
			`#include <sys/stat.h>`
			`#include <ctype.h>`
			`#include <string.h>`
			`#include <fcntl.h>`
			`#include <stdlib.h>`
			`#include <errno.h>`
			`#ifdef HAVE_LIMITS_H`
			`#include <limits.h>`
			`#endif`
			`#ifdef HAVE_UNISTD_H`
			`#include <unistd.h>`
			`#endif`
			`#include <zlib.h>`

			`#if HAVE_ICONV`
			`#include <iconv.h>`
			`#endif`

			`#include "clamav.h"`
			`#include "others.h"`
			`#include "pdf.h"`
			`#include "str.h"`
			`#include "bytecode.h"`
			`#include "bytecode_api.h"`

			`struct pdf_token {`
			`uint32_t length;`
			`uint8_t *content;`
			`};`

			`static int filter_ascii85decode(struct pdf_token *token);`
			`//static int filter_rldecode(struct pdf_token *token)`
			`static int filter_flatedecode(struct pdf_struct pdf, struct pdf_obj obj, struct pdf_token *token);`
			`static int filter_asciihexdecode(struct pdf_token *token);`

			`static int pdf_decodestream_internal(struct pdf_struct pdf, struct pdf_obj obj, struct pdf_token *token);`

			`int pdf_decodestream(struct pdf_struct pdf, struct pdf_obj obj, const char *stream, uint32_t streamlen, int fout)`
			`{`
			`struct pdf_token *token;`
			`int rc;`

			`if (!stream \|\| fout < 0 \|\| !obj->numfilters) {`
			`cli_dbgmsg("nothing to decode\n");`
			`return CL_ENULLARG;`
			`}`

			`token = cli_malloc(sizeof(struct pdf_token));`
			`if (!token)`
			`return CL_EMEM;`

			`token->content = cli_malloc(streamlen);`
			`if (!token->content) {`
			`free(token);`
			`return CL_EMEM;`
			`}`
			`memcpy(token->content, stream, streamlen);`
			`token->length = streamlen;`

			`rc = pdf_decodestream_internal(pdf, obj, token);`

			`if (rc == CL_SUCCESS) {`
			`cli_dbgmsg("cli_pdf: decoding SUCCESS!\n");`

			`if (!cli_checklimits("pdf", pdf->ctx, token->length, 0, 0))`
			`rc = cli_writen(fout, token->content, token->length);`
			`}`

			`free(token->content);`
			`free(token);`
			`return rc;`
			`}`

			`static int pdf_decodestream_internal(struct pdf_struct pdf, struct pdf_obj obj, struct pdf_token *token)`
			`{`
			`int i, rc;`

			`cli_dbgmsg("cli_pdf: detected %lu filters applied\n", (long unsigned)(obj->numfilters));`

			`/* TODO - MAY BE SUBJECT TO CHANGE */`
			`for (i = 0; i < obj->numfilters; i++) {`
			`switch(obj->filterlist[i]) {`
			`case OBJ_FILTER_A85:`
			`cli_dbgmsg("cli_pdf: decoding [%d] => ASCII85DECODE\n", obj->filterlist[i]);`
			`rc = filter_ascii85decode(token);`
			`break;`

			`case OBJ_FILTER_FLATE:`
			`cli_dbgmsg("cli_pdf: decoding [%d] => FLATEDECODE\n", obj->filterlist[i]);`
			`rc = filter_flatedecode(pdf, obj, token);`
			`break;`

			`case OBJ_FILTER_AH:`
			`cli_dbgmsg("cli_pdf: decoding [%d] => ASCIIHEXDECODE\n", obj->filterlist[i]);`
			`rc = filter_asciihexdecode(token);`
			`break;`

			`case OBJ_FILTER_RL:`
			`case OBJ_FILTER_JPX:`
			`case OBJ_FILTER_DCT: //OBJ_FILTER_JBIG2`
			`case OBJ_FILTER_LZW:`
			`case OBJ_FILTER_FAX:`
			`case OBJ_FILTER_CRYPT:`

			`default:`
			`cli_warnmsg("cli_pdf: unknown filter type [%d].\n", obj->filterlist[i]);`
			`break;`
			`}`

			`/TODO: check rc value/`
			`/TODO: check content field/`
			`/TODO: check length value/`
			`/IF INTERMEDIATE DUMPING - PUT HERE/`
			`}`

			`return CL_SUCCESS;`
			`}`

			`static int filter_ascii85decode(struct pdf_token *token)`
			`{`
			`uint8_t *decoded;`
			`uint32_t declen = 0;`

			`const uint8_t ptr = (uint8_t )token->content;`
			`uint32_t remaining = token->length;`
			`int quintet = 0, rc = CL_SUCCESS;`
			`uint64_t sum = 0;`

			`/* 5:4 decoding ratio - (5length), ((length/5+1)4), (((x+4)/5)4) /`
			`if (!(decoded = (uint8_t )cli_malloc(((remaining+4)/5)4))) {`
			`cli_errmsg("cli_pdf: cannot allocate memory for decoded output\n");`
			`return CL_EMEM;`
			`}`

			`if(cli_memstr(ptr, remaining, "~>", 2) == NULL)`
			`cli_dbgmsg("cli_pdf: no EOF marker found\n");`

			`cli_dbgmsg("cli_pdf: %lu bytes remaining\n", (unsigned long)remaining);`

			`while (remaining > 0) {`
			`int byte = (remaining--) ? (int)*ptr++ : EOF;`

			`if((byte == '~') && (remaining > 0) && (*ptr == '>'))`
			`byte = EOF;`

			`if(byte >= '!' && byte <= 'u') {`
			`sum = (sum * 85) + ((uint32_t)byte - '!');`
			`if(++quintet == 5) {`
			`*decoded++ = (unsigned char)(sum >> 24);`
			`*decoded++ = (unsigned char)((sum >> 16) & 0xFF);`
			`*decoded++ = (unsigned char)((sum >> 8) & 0xFF);`
			`*decoded++ = (unsigned char)(sum & 0xFF);`

			`declen += 4;`
			`quintet = 0;`
			`sum = 0;`
			`}`
			`} else if(byte == 'z') {`
			`if(quintet) {`
			`cli_dbgmsg("cli_pdf: unexpected 'z'\n");`
			`rc = CL_EFORMAT;`
			`break;`
			`}`

			`*decoded++ = '\0';`
			`*decoded++ = '\0';`
			`*decoded++ = '\0';`
			`*decoded++ = '\0';`

			`declen += 4;`
			`} else if(byte == EOF) {`
			`cli_dbgmsg("cli_pdf: %d bytes remaining in last quintet\n", quintet);`
			`if(quintet) {`
			`int i;`

			`if(quintet == 1) {`
			`cli_dbgmsg("cli_pdf: only 1 byte in last quintet\n");`
			`rc = CL_EFORMAT;`
			`break;`
			`}`

			`for(i = quintet; i < 5; i++)`
			`sum *= 85;`

			`if(quintet > 1)`
			`sum += (0xFFFFFF >> ((quintet - 2) * 8));`

			`for(i = 0; i < quintet - 1; i++)`
			`decoded++ = (uint8_t)((sum >> (24 - 8 i)) & 0xFF);`
			`declen += quintet-1;`
			`}`

			`break;`
			`} else if(!isspace(byte)) {`
			`cli_dbgmsg("cli_pdf: invalid character 0x%x @ %lu\n",`
			`byte & 0xFF, (unsigned long)(token->length-remaining));`

			`rc = CL_EFORMAT;`
			`break;`
			`}`
			`}`

			`if (rc == CL_SUCCESS) {`
			`free(token->content);`

			`cli_dbgmsg("cli_pdf: deflated %lu bytes from %lu total bytes\n",`
			`(unsigned long)declen, (unsigned long)(token->length));`

			`token->content = decoded;`
			`token->length = declen;`
			`} else {`
			`cli_errmsg("cli_pdf: error occurred parsing byte %lu of %lu\n",`
			`(unsigned long)(token->length-remaining), (unsigned long)(token->length));`
			`free(decoded);`
			`}`
			`return rc;`
			`}`

			`/*`
			`static int filter_rldecode(struct pdf_token *token)`
			`{`
			`}`
			`*/`

			`static uint8_t decode_nextlinestart(uint8_t content, uint32_t length)`
			`{`
			`uint8_t *pt = content;`
			`uint32_t r;`
			`int toggle = 0;`

			`for (r = 0; r < length; r++, pt++) {`
			`if (pt == '\n' \|\| pt == '\r')`
			`toggle = 1;`
			`else if (toggle)`
			`break;`
			`}`

			`return pt;`
			`}`

			`static int filter_flatedecode(struct pdf_struct pdf, struct pdf_obj obj, struct pdf_token *token)`
			`{`
			`uint8_t decoded, temp;`
			`uint32_t declen = 0, capacity = 0;`

			`uint8_t content = (uint8_t )token->content;`
			`uint32_t length = token->length;`
			`z_stream stream;`
			`int zstat, skip = 0, rc = CL_SUCCESS;`

			`if (length == 0)`
			`return CL_CLEAN;`

			`if (*content == '\r') {`
			`content++;`
			`length--;`
			`//pdfobj_flag(pdf, obj, BAD_STREAMSTART);`
			`/* PDF spec says stream is followed by \r\n or \n, but not \r alone.`
			`* Sample 0015315109, it has \r followed by zlib header.`
			`* Flag pdf as suspicious, and attempt to extract by skipping the \r.`
			`*/`
			`if (!length)`
			`return CL_CLEAN;`
			`}`

			`if (!(decoded = (uint8_t *)cli_calloc(BUFSIZ, sizeof(uint8_t)))) {`
			`cli_errmsg("cli_pdf: cannot allocate memory for decoded output\n");`
			`return CL_EMEM;`
			`}`
			`capacity = BUFSIZ;`

			`memset(&stream, 0, sizeof(stream));`
			`stream.next_in = (Bytef *)content;`
			`stream.avail_in = length;`
			`stream.next_out = (Bytef *)decoded;`
			`stream.avail_out = BUFSIZ;`

			`zstat = inflateInit(&stream);`
			`if(zstat != Z_OK) {`
			`cli_warnmsg("cli_pdf: inflateInit failed\n");`
			`free(decoded);`
			`return CL_EMEM;`
			`}`

			`/* initial inflate */`
			`zstat = inflate(&stream, Z_NO_FLUSH);`
			`/* check if nothing written whatsoever */`
			`if ((zstat != Z_OK) && (stream.avail_out == BUFSIZ)) {`
			`/* skip till EOL, and try inflating from there, sometimes`
			`* PDFs contain extra whitespace */`
			`uint8_t *q = decode_nextlinestart(content, length);`
			`if (q) {`
			`(void)inflateEnd(&stream);`
			`length -= q - content;`
			`content = q;`

			`stream.next_in = (Bytef *)content;`
			`stream.avail_in = length;`
			`stream.next_out = (Bytef *)decoded;`
			`stream.avail_out = capacity;`

			`zstat = inflateInit(&stream);`
			`if(zstat != Z_OK) {`
			`cli_warnmsg("cli_pdf: inflateInit failed\n");`
			`free(decoded);`
			`return CL_EMEM;`
			`}`

			`//pdfobj_flag(pdf, obj, BAD_FLATESTART);`
			`}`

			`zstat = inflate(&stream, Z_NO_FLUSH);`
			`}`

			`while (zstat == Z_OK && stream.avail_in) {`
			`/* extend output capacity if needed, TODO - limit check */`
			`if(stream.avail_out == 0) {`
			`if(stream.avail_out == 0) {`
			`if (!(temp = cli_realloc(decoded, capacity + BUFSIZ))) {`
			`cli_errmsg("cli_pdf: cannot reallocate memory for decoded output\n");`
			`rc = CL_EMEM;`
			`break;`
			`}`
			`decoded = temp;`
			`stream.next_out = decoded + capacity;`
			`stream.avail_out = BUFSIZ;`
			`declen += BUFSIZ;`
			`capacity += BUFSIZ;`
			`}`
			`}`

			`/* continue inflation */`
			`zstat = inflate(&stream, Z_NO_FLUSH);`
			`}`

			`/* add stream end fragment to decoded length */`
			`declen += (BUFSIZ - stream.avail_out);`

			`/* error handling */`
			`switch(zstat) {`
			`case Z_OK:`
			`cli_dbgmsg("cli_pdf: Z_OK on stream inflation completion\n");`
			`/* intentional fall-through */`
			`case Z_STREAM_END:`
			`cli_dbgmsg("cli_pdf: inflated %lu bytes from %lu total bytes (%lu bytes remaining)\n",`
			`(unsigned long)declen, (unsigned long)(token->length), (unsigned long)(stream.avail_in));`
			`break;`

			`/* potentially fatal - mostly ignored as per older version */`
			`case Z_STREAM_ERROR:`
			`case Z_NEED_DICT:`
			`case Z_DATA_ERROR:`
			`case Z_MEM_ERROR:`
			`default:`
			`if(stream.msg)`
			`cli_dbgmsg("cli_pdf: after writing %lu bytes, got error \"%s\" inflating PDF stream in %u %u obj\n",`
			`(unsigned long)declen, stream.msg, obj->id>>8, obj->id&0xff);`
			`else`
			`cli_dbgmsg("cli_pdf: after writing %lu bytes, got error %d inflating PDF stream in %u %u obj\n",`
			`(unsigned long)declen, zstat, obj->id>>8, obj->id&0xff);`

			`if (declen == 0) {`
			`//pdfobj_flag(pdf, obj, BAD_FLATESTART);`
			`cli_dbgmsg("cli_pdf: no bytes were inflated.\n");`

			`rc = CL_EFORMAT;`
			`} else {`
			`//pdfobj_flag(pdf, obj, BAD_FLATE);`
			`}`
			`break;`
			`}`

			`(void)inflateEnd(&stream);`

			`if (rc == CL_SUCCESS) {`
			`free(token->content);`

			`token->content = decoded;`
			`token->length = declen;`
			`} else {`
			`cli_errmsg("cli_pdf: error occurred parsing byte %lu of %lu\n",`
			`(unsigned long)(length-stream.avail_in), (unsigned long)(token->length));`
			`free(decoded);`
			`}`

			`return rc;`
			`}`

			`static int filter_asciihexdecode(struct pdf_token *token)`
			`{`
			`uint8_t *decoded;`

			`const uint8_t content = (uint8_t )token->content;`
			`uint32_t length = token->length;`
			`uint32_t i, j;`
			`int rc = CL_SUCCESS;`

			`if (!(decoded = (uint8_t *)cli_calloc(length/2 + 1, sizeof(uint8_t)))) {`
			`cli_errmsg("cli_pdf: cannot allocate memory for decoded output\n");`
			`return CL_EMEM;`
			`}`

			`for (i = 0, j = 0; i+1 < length; i++) {`
			`if (content[i] == ' ')`
			`continue;`

			`if (content[i] == '>')`
			`break;`

			`if (cli_hex2str_to(content+i, decoded+j, 2) == -1) {`
			`if (length - i < 4)`
			`continue;`

			`rc = CL_EFORMAT;`
			`break;`
			`}`

			`i++;`
			`j++;`
			`}`

			`if (rc == CL_SUCCESS) {`
			`free(token->content);`

			`cli_dbgmsg("cli_pdf: deflated %lu bytes from %lu total bytes\n",`
			`(unsigned long)j, (unsigned long)(token->length));`

			`token->content = decoded;`
			`token->length = j;`
			`} else {`
			`cli_errmsg("cli_pdf: error occurred parsing byte %lu of %lu\n",`
			`(unsigned long)i, (unsigned long)(token->length));`
			`free(decoded);`
			`}`
			`return rc;`
			`}`