[Python-modules-commits] [python-sabyenc] 01/02: commmit merge

JCF Ploemen jcfp-guest at moszumanska.debian.org
Tue Jan 2 10:47:40 UTC 2018


This is an automated email from the git hooks/post-receive script.

jcfp-guest pushed a commit to branch upstream
in repository python-sabyenc.

commit 28027d631f3fa4e44bf3e4ccfe0bd9fc1e917d4e
Merge: 1a9c1e3 17bb32d
Author: JCF Ploemen (jcfp) <linux at jcf.pm>
Date:   Tue Jan 2 11:35:17 2018 +0100

    commmit merge

 setup.py      |  122 +++---
 src/sabyenc.c | 1245 +++++++++++++++++++++++++++++----------------------------
 src/sabyenc.h |  100 ++---
 3 files changed, 734 insertions(+), 733 deletions(-)

diff --cc setup.py
index f49e15d,403c594..34cd777
--- a/setup.py
+++ b/setup.py
@@@ -1,61 -1,61 +1,61 @@@
--#!/usr/bin/env python
--# -*- coding: utf-8 -*-
--##=============================================================================
-- #
-- # Copyright (C) 2003, 2011 Alessandro Duca <alessandro.duca at gmail.com>
-- # Modified in 2016 by Safihre <safihre at sabnzbd.org> for use within SABnzbd
-- #
-- # This library is free software; you can redistribute it and/or
-- # modify it under the terms of the GNU Lesser General Public
-- # License as published by the Free Software Foundation; either
-- # version 2.1 of the License, or (at your option) any later version.
-- #
-- # This library is distributed in the hope that it will be useful,
-- # but WITHOUT ANY WARRANTY; without even the implied warranty of
-- # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
-- # Lesser General Public License for more details.
-- #
-- # You should have received a copy of the GNU Lesser General Public
-- # License along with this library; if not, write to the Free Software
-- # Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
-- #=============================================================================
-- #
--##=============================================================================
--
--from setuptools import setup, Extension
--
--setup(
--    name            = "sabyenc",
-     version         = "3.3.2",
 -    version         = "3.3.1",
--    author          = "Safihre",
--    author_email    = "safihre at sabnzbd.org",
--    url             = "https://github.com/sabnzbd/sabnzbd-yenc",
--    license         = "LGPLv3",
--    package_dir     = {'sabyenc': 'src'},
--    ext_modules     = [Extension("sabyenc", ["src/sabyenc.c"])],
--    classifiers     = [
--        "Programming Language :: Python",
--        "Programming Language :: Python :: 2.7",
--        "Programming Language :: C",
--        "License :: OSI Approved :: GNU Lesser General Public License v3 (LGPLv3)",
--        "Operating System :: Unix",
--        "Development Status :: 5 - Production/Stable",
--        "Environment :: Plugins",
--        "Topic :: Software Development :: Libraries :: Python Modules",
--        "Topic :: Communications :: Usenet News"
--    ],
--    description     = "yEnc Module for Python modified for SABnzbd",
--    long_description = """
--yEnc Decoding for Python
-----------------------------------
--
--Mofied the original yenc module by Alessandro Duca for use within SABnzbd.
--
--The module was extended to do header parsing and full yEnc decoding from a Python
--list of chunks, the way in which data is retrieved from usenet.
--
--Currently CRC-checking of decoded data is disabled to allow for increased performance.
--It can only be re-enabled by locally altering 'sabyenc.h' and setting 'CRC_CHECK 1'.
--"""
--)
--
++#!/usr/bin/env python
++# -*- coding: utf-8 -*-
++##=============================================================================
++ #
++ # Copyright (C) 2003, 2011 Alessandro Duca <alessandro.duca at gmail.com>
++ # Modified in 2016 by Safihre <safihre at sabnzbd.org> for use within SABnzbd
++ #
++ # This library is free software; you can redistribute it and/or
++ # modify it under the terms of the GNU Lesser General Public
++ # License as published by the Free Software Foundation; either
++ # version 2.1 of the License, or (at your option) any later version.
++ #
++ # This library is distributed in the hope that it will be useful,
++ # but WITHOUT ANY WARRANTY; without even the implied warranty of
++ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
++ # Lesser General Public License for more details.
++ #
++ # You should have received a copy of the GNU Lesser General Public
++ # License along with this library; if not, write to the Free Software
++ # Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
++ #=============================================================================
++ #
++##=============================================================================
++
++from setuptools import setup, Extension
++
++setup(
++    name            = "sabyenc",
++    version         = "3.3.2",
++    author          = "Safihre",
++    author_email    = "safihre at sabnzbd.org",
++    url             = "https://github.com/sabnzbd/sabnzbd-yenc",
++    license         = "LGPLv3",
++    package_dir     = {'sabyenc': 'src'},
++    ext_modules     = [Extension("sabyenc", ["src/sabyenc.c"])],
++    classifiers     = [
++        "Programming Language :: Python",
++        "Programming Language :: Python :: 2.7",
++        "Programming Language :: C",
++        "License :: OSI Approved :: GNU Lesser General Public License v3 (LGPLv3)",
++        "Operating System :: Unix",
++        "Development Status :: 5 - Production/Stable",
++        "Environment :: Plugins",
++        "Topic :: Software Development :: Libraries :: Python Modules",
++        "Topic :: Communications :: Usenet News"
++    ],
++    description     = "yEnc Module for Python modified for SABnzbd",
++    long_description = """
++yEnc Decoding for Python
++---------------------------------
++
++Mofied the original yenc module by Alessandro Duca for use within SABnzbd.
++
++The module was extended to do header parsing and full yEnc decoding from a Python
++list of chunks, the way in which data is retrieved from usenet.
++
++Currently CRC-checking of decoded data is disabled to allow for increased performance.
++It can only be re-enabled by locally altering 'sabyenc.h' and setting 'CRC_CHECK 1'.
++"""
++)
++
diff --cc src/sabyenc.c
index a0e4f4d,4796a45..6131118
--- a/src/sabyenc.c
+++ b/src/sabyenc.c
@@@ -1,622 -1,612 +1,623 @@@
-- /*=============================================================================
-- *
-- * Copyright (C) 2003, 2011 Alessandro Duca <alessandro.duca at gmail.com>
-- * Modified in 2016 by Safihre <safihre at sabnzbd.org> for use within SABnzbd
-- *
-- * This library is free software; you can redistribute it and/or
-- * modify it under the terms of the GNU Lesser General Public
-- * License as published by the Free Software Foundation; either
-- * version 2.1 of the License, or (at your option) any later version.
-- *
-- * This library is distributed in the hope that it will be useful,
-- * but WITHOUT ANY WARRANTY; without even the implied warranty of
-- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
-- * Lesser General Public License for more details.
-- *
-- * You should have received a copy of the GNU Lesser General Public
-- * License along with this library; if not, write to the Free Software
-- * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
-- *=============================================================================
-- */
--
--#include "sabyenc.h"
--
--/* Typedefs */
--typedef struct {
--    uInt crc;
--    uLong bytes;
--} Crc32;
--
--/* Declarations */
--static uInt crc_tab[256] = {
--    0x00000000, 0x77073096, 0xee0e612c, 0x990951ba, 0x076dc419, 0x706af48f,
--    0xe963a535, 0x9e6495a3, 0x0edb8832, 0x79dcb8a4, 0xe0d5e91e, 0x97d2d988,
--    0x09b64c2b, 0x7eb17cbd, 0xe7b82d07, 0x90bf1d91, 0x1db71064, 0x6ab020f2,
--    0xf3b97148, 0x84be41de, 0x1adad47d, 0x6ddde4eb, 0xf4d4b551, 0x83d385c7,
--    0x136c9856, 0x646ba8c0, 0xfd62f97a, 0x8a65c9ec, 0x14015c4f, 0x63066cd9,
--    0xfa0f3d63, 0x8d080df5, 0x3b6e20c8, 0x4c69105e, 0xd56041e4, 0xa2677172,
--    0x3c03e4d1, 0x4b04d447, 0xd20d85fd, 0xa50ab56b, 0x35b5a8fa, 0x42b2986c,
--    0xdbbbc9d6, 0xacbcf940, 0x32d86ce3, 0x45df5c75, 0xdcd60dcf, 0xabd13d59,
--    0x26d930ac, 0x51de003a, 0xc8d75180, 0xbfd06116, 0x21b4f4b5, 0x56b3c423,
--    0xcfba9599, 0xb8bda50f, 0x2802b89e, 0x5f058808, 0xc60cd9b2, 0xb10be924,
--    0x2f6f7c87, 0x58684c11, 0xc1611dab, 0xb6662d3d, 0x76dc4190, 0x01db7106,
--    0x98d220bc, 0xefd5102a, 0x71b18589, 0x06b6b51f, 0x9fbfe4a5, 0xe8b8d433,
--    0x7807c9a2, 0x0f00f934, 0x9609a88e, 0xe10e9818, 0x7f6a0dbb, 0x086d3d2d,
--    0x91646c97, 0xe6635c01, 0x6b6b51f4, 0x1c6c6162, 0x856530d8, 0xf262004e,
--    0x6c0695ed, 0x1b01a57b, 0x8208f4c1, 0xf50fc457, 0x65b0d9c6, 0x12b7e950,
--    0x8bbeb8ea, 0xfcb9887c, 0x62dd1ddf, 0x15da2d49, 0x8cd37cf3, 0xfbd44c65,
--    0x4db26158, 0x3ab551ce, 0xa3bc0074, 0xd4bb30e2, 0x4adfa541, 0x3dd895d7,
--    0xa4d1c46d, 0xd3d6f4fb, 0x4369e96a, 0x346ed9fc, 0xad678846, 0xda60b8d0,
--    0x44042d73, 0x33031de5, 0xaa0a4c5f, 0xdd0d7cc9, 0x5005713c, 0x270241aa,
--    0xbe0b1010, 0xc90c2086, 0x5768b525, 0x206f85b3, 0xb966d409, 0xce61e49f,
--    0x5edef90e, 0x29d9c998, 0xb0d09822, 0xc7d7a8b4, 0x59b33d17, 0x2eb40d81,
--    0xb7bd5c3b, 0xc0ba6cad, 0xedb88320, 0x9abfb3b6, 0x03b6e20c, 0x74b1d29a,
--    0xead54739, 0x9dd277af, 0x04db2615, 0x73dc1683, 0xe3630b12, 0x94643b84,
--    0x0d6d6a3e, 0x7a6a5aa8, 0xe40ecf0b, 0x9309ff9d, 0x0a00ae27, 0x7d079eb1,
--    0xf00f9344, 0x8708a3d2, 0x1e01f268, 0x6906c2fe, 0xf762575d, 0x806567cb,
--    0x196c3671, 0x6e6b06e7, 0xfed41b76, 0x89d32be0, 0x10da7a5a, 0x67dd4acc,
--    0xf9b9df6f, 0x8ebeeff9, 0x17b7be43, 0x60b08ed5, 0xd6d6a3e8, 0xa1d1937e,
--    0x38d8c2c4, 0x4fdff252, 0xd1bb67f1, 0xa6bc5767, 0x3fb506dd, 0x48b2364b,
--    0xd80d2bda, 0xaf0a1b4c, 0x36034af6, 0x41047a60, 0xdf60efc3, 0xa867df55,
--    0x316e8eef, 0x4669be79, 0xcb61b38c, 0xbc66831a, 0x256fd2a0, 0x5268e236,
--    0xcc0c7795, 0xbb0b4703, 0x220216b9, 0x5505262f, 0xc5ba3bbe, 0xb2bd0b28,
--    0x2bb45a92, 0x5cb36a04, 0xc2d7ffa7, 0xb5d0cf31, 0x2cd99e8b, 0x5bdeae1d,
--    0x9b64c2b0, 0xec63f226, 0x756aa39c, 0x026d930a, 0x9c0906a9, 0xeb0e363f,
--    0x72076785, 0x05005713, 0x95bf4a82, 0xe2b87a14, 0x7bb12bae, 0x0cb61b38,
--    0x92d28e9b, 0xe5d5be0d, 0x7cdcefb7, 0x0bdbdf21, 0x86d3d2d4, 0xf1d4e242,
--    0x68ddb3f8, 0x1fda836e, 0x81be16cd, 0xf6b9265b, 0x6fb077e1, 0x18b74777,
--    0x88085ae6, 0xff0f6a70, 0x66063bca, 0x11010b5c, 0x8f659eff, 0xf862ae69,
--    0x616bffd3, 0x166ccf45, 0xa00ae278, 0xd70dd2ee, 0x4e048354, 0x3903b3c2,
--    0xa7672661, 0xd06016f7, 0x4969474d, 0x3e6e77db, 0xaed16a4a, 0xd9d65adc,
--    0x40df0b66, 0x37d83bf0, 0xa9bcae53, 0xdebb9ec5, 0x47b2cf7f, 0x30b5ffe9,
--    0xbdbdf21c, 0xcabac28a, 0x53b39330, 0x24b4a3a6, 0xbad03605, 0xcdd70693,
--    0x54de5729, 0x23d967bf, 0xb3667a2e, 0xc4614ab8, 0x5d681b02, 0x2a6f2b94,
--    0xb40bbe37, 0xc30c8ea1, 0x5a05df1b, 0x2d02ef8d
--};
--
--/* Function declarations */
--static void crc_init(Crc32 *, uInt);
--static void crc_update(Crc32 *, uInt);
--void initsabyenc(void);
--static int decode_buffer_usenet(PyObject *, char *, int, char **, Crc32 *, uInt *,  Bool *);
--static char * find_text_in_pylist(PyObject *, char *, char **, int *);
--int extract_filename_from_pylist(PyObject *, int *, char **, char **, char **);
--int extract_int_from_pylist(PyObject *, int *, char **, char **, int);
--
--/* Python API requirements */
--static char decode_usenet_chunks_doc[] = "decode_usenet_chunks(list_of_chunks, nr_bytes)";
--
--static PyMethodDef funcs[] = {
--        {"decode_usenet_chunks", (PyCFunction) decode_usenet_chunks, METH_KEYWORDS | METH_VARARGS, decode_usenet_chunks_doc},
--        {NULL, NULL, 0, NULL}
--};
--
--/* Function definitions */
--static void crc_init(Crc32 *crc, uInt value) {
--    crc->crc = value;
--    crc->bytes = 0UL;
--}
--
--static void crc_update(Crc32 *crc, uInt c) {
--    crc->crc = crc_tab[(crc->crc^c)&0xff]^((crc->crc>>8)&0xffffff);
--    crc->bytes++;
--}
--
--static int decode_buffer_usenet(PyObject *Py_input_list, char *output_buffer, int num_bytes_reserved,
--                                char **filename_out,  Crc32 *crc, uInt *crc_yenc, Bool *crc_correct) {
--    // For the list
--    Py_ssize_t num_lines;
--    int list_index = 0;
--
--    // Search variables
--    char *cur_char; // Pointer to search result
--    char *start_loc; // Pointer to current char
--    char *crc_holder = NULL;
--
--    // Other vars
--    int part_begin = 0;
--    int part_size = 0;
--    int decoded_bytes = 0;
--    int safe_nr_bytes = 0;
--    Bool escape_char = 0;
--    int double_point_escape = 0;
--
--    /*
--     ANALYZE HEADER
--     Always in the same format, e.g.:
--
--     =ybegin part=41 line=128 size=49152000 name=90E2Sdvsmds0801dvsmds90E.part06.rar
--     =ypart begin=15360001 end=15744000
--
--     But we only care about the filename and the size
--     For single-part yEnc we need to get size from the first line, for
--     multi-part we need to substract end-begin from second line
--    */
--
--    // Get number of lines
--    num_lines = PyList_Size(Py_input_list);
--
--    // Get first chunk
--    cur_char = PyString_AsString(PyList_GetItem(Py_input_list, 0));
--
--    // Start of header (which doesn't have to be part of first chunk)
--    start_loc = find_text_in_pylist(Py_input_list, "=ybegin", &cur_char, &list_index);
--
--    if(start_loc) {
--        // First we find the size (for single-part files)
--        start_loc = find_text_in_pylist(Py_input_list, "size=", &cur_char, &list_index);
--        if(start_loc) {
--            // Move over a bit
--            part_size = extract_int_from_pylist(Py_input_list, &list_index, &start_loc, &cur_char, 0);
--        }
--
--        // Find name
--        start_loc = find_text_in_pylist(Py_input_list, "name=", &cur_char, &list_index);
--        if(start_loc) {
--            extract_filename_from_pylist(Py_input_list, &list_index, &start_loc, &cur_char, filename_out);
--        } else {
--            // Don't go on without a name
--            return 0;
--        }
--
--        // Is there a multi-part indicator?
--        start_loc = find_text_in_pylist(Py_input_list, "=ypart", &cur_char, &list_index);
--        if(start_loc) {
--            // Reset size, so we for sure don't use the previously found "size=" value
--            part_size = 0;
--
--            // Find part-begin
--            start_loc = find_text_in_pylist(Py_input_list, "begin=", &cur_char, &list_index);
--            if(start_loc) {
--                // Get begin
--                part_begin = extract_int_from_pylist(Py_input_list, &list_index, &start_loc, &cur_char, 0);
--
--                // Find part-end
--                start_loc = find_text_in_pylist(Py_input_list, "end=", &cur_char, &list_index);
--                if(start_loc) {
--                    // Move over a bit
--                    part_size = extract_int_from_pylist(Py_input_list, &list_index, &start_loc, &cur_char, 0) - part_begin + 1;
--                }
--            }
--
--            // We want to make sure it's a valid value
--            if(part_size <= 0  || part_size > num_bytes_reserved) {
--                // Set safe value
--                part_size = (int)(num_bytes_reserved*0.75);
--            }
--
--            // Skip over everything untill end of line, where the content starts
--            for( ; *cur_char != LF && *cur_char != CR && *cur_char != ZERO; cur_char++);
--        }
--
--        // How many bytes can be checked safely?
--        safe_nr_bytes = part_size ? part_size - 50 : 0;
--
--        /*
--            During the loop we need to take care of special cases.
--            The escape "=" and whatever it escapes might be on the
--            next Python-list-item. Also the sequence "\n.." should
--            onlyconvert one dot, but this sequence might also be
--            split across list items.
--        */
--        while(1) {
--            // Get current char and increment pointer
--            cur_char++;
--
--            // End of the line of list-item
--            if(*cur_char == ZERO) {
--                // Are we outside the list?
--                list_index++;
--                if(list_index == num_lines) {
--                    break;
--                }
--
--                // Get reference to the new line
--                cur_char = PyString_AsString(PyList_GetItem(Py_input_list, list_index));
--            }
--
--            // Special charaters
--            if(escape_char) {
--                *output_buffer++ = (*cur_char - 106);
--                escape_char = 0;
--                double_point_escape = 0;
--            } else if(*cur_char == ESC) {
--                // strncmp is expensive, only perform near the end
--                if(decoded_bytes > safe_nr_bytes) {
--                    /*
--                        Looking for the end, format:
--                        =yend size=384000 part=41 pcrc32=084e170f
--                        If a = is followed by an end-of-line, it's very
--                        likely that the yend part is on the next line
--                        and thus we would miss it
--                    */
--                    if(*(cur_char+1) == ZERO && list_index+1 < num_lines) {
--                        // Quick and dirty check if it's in next line
--                        crc_holder = PyString_AsString(PyList_GetItem(Py_input_list, list_index+1));
--                        // If that's not the case, we don't want to mess with the regular flow!!
--                        if(!strncmp(crc_holder, "yend", 4)) {
--                            cur_char = crc_holder;
--                        }
--                    }
--
--                    // Find it!
--                    if (!strncmp(cur_char, "=y", 2) || !strncmp(cur_char, "yend", 4)) {
--#if CRC_CHECK
--                        // Find CRC
--                        start_loc = find_text_in_pylist(Py_input_list, "crc32=", &cur_char, &list_index);
--
--                        // Process CRC
--                        if(start_loc) {
--                            *crc_yenc = extract_int_from_pylist(Py_input_list, &list_index, &start_loc, &cur_char, 1);
--
--                            // Change format to CRC-style (don't ask me why..)
--                            *crc_yenc = -1*(*crc_yenc)-1;
--
--                            // Check if CRC is correct
--                            if(crc->crc == *crc_yenc) {
--                                *crc_correct = 1;
--                            }
--                        }
--#else
--                        // Do a simple check based on size, faster than CRC
--                        if(part_size != decoded_bytes) {
--                            *crc_correct = 0;
--                        } else {
--                            *crc_correct = 1;
--                        }
--#endif
--                        break;
--                    }
--                }
--
--                // Becaus the escape might be at the end of the chunk
--                // we need to do it in the next loop
--                escape_char = 1;
--                continue;
--            } else if(*cur_char == CR) {
--                continue;
--            } else if(*cur_char == LF) {
--                double_point_escape = 1;
--                continue;
--
--            /*
--                "The NNTP-protocol requires to double a dot
--                in the first colum when a line is sent"
--
--                For some magical reason clang gets 2x slower
--                overall when using the second approach.
--                It does make things 15% faster for gcc and msvc
--                So we take this convoluted approach to be safe.
--            */
--#ifdef __clang__
--            } else if(double_point_escape == 2 && *cur_char == DOT) {
--                //
--                // We found "\n.."! Ignore that second dot.
--                double_point_escape = 0;
--                continue;
--            } else if(*cur_char == DOT) {
--                // Special case for "\n.." that can be split between list items
--                if(double_point_escape == 1) {
--                    double_point_escape = 2;
--                }
--#else
--            } else if(*cur_char == DOT) {
--                // "The NNTP-protocol requires to double a dot in the first colum when a line is sent"
--                // We found "\n.."! Ignore that second dot.
--                if(double_point_escape == 2) {
--                    double_point_escape = 0;
--                    continue;
--                }
--                // Special case for "\n.." that can be split between list items
--                if(double_point_escape == 1) {
--                    double_point_escape = 2;
--                }
--#endif
--                // We do include this dot
--                *output_buffer++ = (*cur_char - 42);
--            } else {
--                *output_buffer++ = (*cur_char - 42);
--                // Reset exception
--                double_point_escape = 0;
--            }
--
--            // Increase byte counter for saftey check
--            decoded_bytes++;
--
--#if CRC_CHECK
--            // Check CRC value
--            crc_update(crc, *(output_buffer-1));
--#endif
--
--            // Saftey check
--            if(decoded_bytes == num_bytes_reserved) {
--                break;
--            }
--        }
--    }
--    return decoded_bytes;
--}
--
--
--/*
--    We need a special function to find the keywords
--    because they can be split over multiple chunks.
--*/
--static char * find_text_in_pylist(PyObject *Py_input_list, char *search_term, char **cur_char, int *cur_index) {
--    // String holders
--    char *next_string = NULL;
--    char *start_loc = NULL;
--    char *search_placeholder;
--    // Size holders
--    size_t cur_len;
--    int start_index;
--    int init_index = *cur_index;
--    Py_ssize_t max_extra_lines = PyList_Size(Py_input_list) - 1;
--
--    // First we try to do a fast location
--    start_loc = strstr(*cur_char, search_term);
--
--    // We didn't find it..
--    if(!start_loc) {
--        // We do maximum of 3 times extra lines, otherwise to slow
--        max_extra_lines = (*cur_index+3 >= max_extra_lines) ?  max_extra_lines : *cur_index+3;
--
--        // Start by adding the current string to the placeholder
--        cur_len = strlen(*cur_char)+1;
--        search_placeholder = (char *) calloc(cur_len, sizeof(char *));
--        strcpy(search_placeholder, *cur_char);
--
--        // Add the next item and try again
--        while(!start_loc && *cur_index < max_extra_lines) {
--            // Need to get the next one
--            *cur_index = *cur_index+1;
--            next_string = PyString_AsString(PyList_GetItem(Py_input_list, *cur_index));
--
--            // Reserve the next bit
--            cur_len = cur_len + strlen(next_string);
--            search_placeholder = (char *) realloc(search_placeholder, cur_len);
--            strcat(search_placeholder, next_string);
--
--            // Try to find it again
--            start_loc = strstr(search_placeholder, search_term);
--        }
--
--        /*
--            Problem: If we return start_loc now, we will have a memory leak
--            because search_placeholder is never free'd. So we need to get
--            the correct location in the current string from the list.
--        */
--        if(start_loc) {
--            // How much in the new string are we?
--            start_index = (int)(start_loc - search_placeholder) - (int)(strlen(search_placeholder) - strlen(next_string));
--            // Just make sure it's valid
--            if(start_index < 0 || start_index > (int)strlen(next_string)) {
--                start_loc = NULL;
--            }
--            // Point to the location in the item from the list
--            start_loc = next_string + start_index;
--        } else {
--            // Decrease the index to where we begun
--            *cur_index = init_index;
--        }
--
--        // Cleanup
--        free(search_placeholder);
--    }
--
--    // Did we find it now?
--    if(start_loc) {
--        start_loc += strlen(search_term);
--        *cur_char = start_loc;
--    }
--
--    // Found it directly
--    return start_loc;
--}
--
--
--/*
--    Integer values like "begin=1234" or "pcrc=ABCDE" can also
--    be split over multiple lines. And thus we need to really
--    check that we did not reach the end of a line every time.
--*/
--int extract_int_from_pylist(PyObject *Py_input_list, int *cur_index, char **start_loc, char **cur_char, int crc) {
--    char *enc_loc;
--    char *item_holder;
--    char *combi_holder;
--    int part_value = 0;
--    Py_ssize_t max_lines = PyList_Size(Py_input_list);
--
--    // Crc calculation?
--    if(crc) {
--        part_value = strtoul(*start_loc, &enc_loc, 16);
--    } else {
--        part_value = strtol(*start_loc, &enc_loc, 0);
--    }
--
--    // Did we reach the end of a line?
--    if(*enc_loc == ZERO) {
--        // Do we even have another item?
--        if(*cur_index+1 >= max_lines) return part_value;
--
--        // We need to fix things by combining the 2 lines
--        combi_holder = (char *) calloc(strlen(*start_loc)+1, sizeof(char *));
--        strcpy(combi_holder, *start_loc);
--        *cur_index = *cur_index+1;
--        item_holder = PyString_AsString(PyList_GetItem(Py_input_list, *cur_index));
--        combi_holder = (char *) realloc(combi_holder, strlen(*start_loc)+strlen(item_holder)+1);
--        strcat(combi_holder, item_holder);
--
--        // Now we do it again
--        if(crc) {
--            part_value = strtoul(combi_holder, &enc_loc, 16);
--        } else {
--            part_value = strtol(combi_holder, &enc_loc, 0);
--        }
--
--        // Free the space
--        free(combi_holder);
--        // Set the current position
--        *cur_char = item_holder;
--    } else {
--        // Move pointer
--        *cur_char = enc_loc;
--    }
--
--    return part_value;
--}
--
--
--/*
--    Filename can also be split over multiple lines
--    and thus needs saftey checks!
--*/
--int extract_filename_from_pylist(PyObject *Py_input_list, int *cur_index, char **start_loc, char **cur_char, char **filename_ptr) {
--    // Temporary holders
--    char *end_loc;
--    Py_ssize_t max_lines = PyList_Size(Py_input_list);
--
--    // Start at current setting
--    end_loc = *start_loc;
--    while(1) {
--        // Did we reach end of the line but not newline?
--        if(*(end_loc+1) == CR || *(end_loc+1) == LF || *(end_loc+1) == ZERO) {
--            // Did we allocate yet?
--            if(!*filename_ptr) {
--                // Reserve space (plus current char and terminator)
--                *filename_ptr = (char *)calloc(end_loc - *start_loc + 2, sizeof(char));
--                // Allocation check
--                if(!filename_ptr) return 0;
--                // Copy the text, including the current char
--                strncpy(*filename_ptr, *start_loc, end_loc - *start_loc + 1);
--                // Add termininator
--                (*filename_ptr)[strlen(*filename_ptr)] = ZERO;
--                // Was this the end?
--                if(*(end_loc+1) == CR || *(end_loc+1) == LF) {
--                    // Move the pointer and return
--                    *cur_char = end_loc+1;
--                    return 1;
--                } else {
--                    // Do we even have another item?
--                    if(*cur_index+1 >= max_lines) return 0;
--                    // Need to get the next one
--                    *cur_index = *cur_index+1;
--                    *start_loc = end_loc = PyString_AsString(PyList_GetItem(Py_input_list, *cur_index));
--                }
--            } else {
--                // Expand the result to hold this new bit (plus current char and terminator)
--                *filename_ptr = (char *)realloc(*filename_ptr, strlen(*filename_ptr) + end_loc - *start_loc + 2);
--                // Allocation check
--                if(!filename_ptr) return 0;
--                // Copy result at the end
--                strncat(*filename_ptr, *start_loc, end_loc - *start_loc + 1);
--                // Add termininator
--                (*filename_ptr)[strlen(*filename_ptr)] = ZERO;
--                // Move the pointer and return
--                *cur_char = end_loc+1;
--                return 1;
--            }
--        } else {
--            // Move 1 char forward, not if we just fetched new chunk
--            end_loc++;
--        }
--    }
--}
--
--
--PyObject* decode_usenet_chunks(PyObject* self, PyObject* args, PyObject* kwds) {
--    // The input/output PyObjects
--    PyObject *Py_input_list;
--    PyObject *Py_output_buffer;
--    PyObject *Py_output_filename;
--    PyObject *retval = NULL;
--
--    // CRC
--    Crc32 crc;
--    uInt crc_yenc = 0;
--    Bool crc_correct = 0;
--    uInt crc_value = 0xffffffffll;
--
--    // Buffers
--    char *output_buffer = NULL;
--    char *filename_out = NULL;
--    uInt output_len = 0;
--    int num_bytes_reserved;
-     int lp_max;
-     int lp;
--
--    // Parse input
--    if (!PyArg_ParseTuple(args, "Oi:decode_usenet_chunks", &Py_input_list, &num_bytes_reserved)) {
--        return NULL;
--    }
--
--    // Verify it's a list
--    if(!PyList_Check(Py_input_list)) {
--        PyErr_SetString(PyExc_TypeError, "Expected list");
--        return NULL;
-     }
- 
-     // If we did not get a size, we need to calculate it (slower, but safer)
-     if(num_bytes_reserved <= 0) {
-         lp_max = (int)PyList_Size(Py_input_list);
-         for(lp = 0; lp < lp_max; lp++) {
-             num_bytes_reserved += (int)PyString_Size(PyList_GetItem(Py_input_list, lp));
-         }
--    }
--
--    // Reserve the output buffer, 10% more just to be safe
--    num_bytes_reserved = (int)(num_bytes_reserved*1.10);
--    output_buffer = (char *)malloc(num_bytes_reserved);
--    if(!output_buffer) {
--        retval = PyErr_NoMemory();
--        return NULL;
--    }
--
--    // Byeeeeeeee GIL!
--    Py_BEGIN_ALLOW_THREADS;
--
--    // Initial CRC
--    crc_init(&crc, crc_value);
--
--    // Calculate
--    output_len = decode_buffer_usenet(Py_input_list, output_buffer, num_bytes_reserved, &filename_out, &crc, &crc_yenc, &crc_correct);
--
--    // Aaah there you are again GIL..
--    Py_END_ALLOW_THREADS;
--
--    // Catch if there's nothing
--    if(!output_len || !filename_out) {
--        PyErr_SetString(PyExc_ValueError, "Could not get filename");
--        // Saftey free's
--        if(output_buffer) free(output_buffer);
--        if(filename_out) free(filename_out);
--        return NULL;
--    }
--
--    // Prepare output
--    Py_output_buffer = PyString_FromStringAndSize((char *)output_buffer, output_len);
--
--    // Use special Python function to go from Latin-1 to Unicode
--    Py_output_filename = PyUnicode_DecodeLatin1((char *)filename_out, strlen((char *)filename_out), NULL);
--
--    // Build output
--    retval = Py_BuildValue("(S,S,L,L,O)", Py_output_buffer, Py_output_filename, (long long)crc.crc, (long long)crc_yenc, crc_correct ? Py_True: Py_False);
--
--    // Make sure we free all the buffers!
--    Py_XDECREF(Py_output_buffer);
--    Py_XDECREF(Py_output_filename);
--    free(output_buffer);
--    free(filename_out);
--    return retval;
--}
--
--
--void initsabyenc(void) {
--    // Add module
--    PyObject *module;
--    module = Py_InitModule3("sabyenc", funcs, "Raw yenc operations");
--
--    // Add version
--    PyModule_AddStringConstant(module, "__version__", SABYENC_VERSION);
--}
--
++ /*=============================================================================
++ *
++ * Copyright (C) 2003, 2011 Alessandro Duca <alessandro.duca at gmail.com>
++ * Modified in 2016 by Safihre <safihre at sabnzbd.org> for use within SABnzbd
++ *
++ * This library is free software; you can redistribute it and/or
++ * modify it under the terms of the GNU Lesser General Public
++ * License as published by the Free Software Foundation; either
++ * version 2.1 of the License, or (at your option) any later version.
++ *
++ * This library is distributed in the hope that it will be useful,
++ * but WITHOUT ANY WARRANTY; without even the implied warranty of
++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
++ * Lesser General Public License for more details.
++ *
++ * You should have received a copy of the GNU Lesser General Public
++ * License along with this library; if not, write to the Free Software
++ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
++ *=============================================================================
++ */
++
++#include "sabyenc.h"
++
++/* Typedefs */
++typedef struct {   /* Running CRC state used by crc_init() / crc_update() */
++    uInt crc;      /* current CRC value: seeded by crc_init(), rewritten on every crc_update() */
++    uLong bytes;   /* number of crc_update() calls since crc_init() zeroed it */
++} Crc32;
++
++/* Declarations */
++static uInt crc_tab[256] = {
++    0x00000000, 0x77073096, 0xee0e612c, 0x990951ba, 0x076dc419, 0x706af48f,
++    0xe963a535, 0x9e6495a3, 0x0edb8832, 0x79dcb8a4, 0xe0d5e91e, 0x97d2d988,
++    0x09b64c2b, 0x7eb17cbd, 0xe7b82d07, 0x90bf1d91, 0x1db71064, 0x6ab020f2,
++    0xf3b97148, 0x84be41de, 0x1adad47d, 0x6ddde4eb, 0xf4d4b551, 0x83d385c7,
++    0x136c9856, 0x646ba8c0, 0xfd62f97a, 0x8a65c9ec, 0x14015c4f, 0x63066cd9,
++    0xfa0f3d63, 0x8d080df5, 0x3b6e20c8, 0x4c69105e, 0xd56041e4, 0xa2677172,
++    0x3c03e4d1, 0x4b04d447, 0xd20d85fd, 0xa50ab56b, 0x35b5a8fa, 0x42b2986c,
++    0xdbbbc9d6, 0xacbcf940, 0x32d86ce3, 0x45df5c75, 0xdcd60dcf, 0xabd13d59,
++    0x26d930ac, 0x51de003a, 0xc8d75180, 0xbfd06116, 0x21b4f4b5, 0x56b3c423,
++    0xcfba9599, 0xb8bda50f, 0x2802b89e, 0x5f058808, 0xc60cd9b2, 0xb10be924,
++    0x2f6f7c87, 0x58684c11, 0xc1611dab, 0xb6662d3d, 0x76dc4190, 0x01db7106,
++    0x98d220bc, 0xefd5102a, 0x71b18589, 0x06b6b51f, 0x9fbfe4a5, 0xe8b8d433,
++    0x7807c9a2, 0x0f00f934, 0x9609a88e, 0xe10e9818, 0x7f6a0dbb, 0x086d3d2d,
++    0x91646c97, 0xe6635c01, 0x6b6b51f4, 0x1c6c6162, 0x856530d8, 0xf262004e,
++    0x6c0695ed, 0x1b01a57b, 0x8208f4c1, 0xf50fc457, 0x65b0d9c6, 0x12b7e950,
++    0x8bbeb8ea, 0xfcb9887c, 0x62dd1ddf, 0x15da2d49, 0x8cd37cf3, 0xfbd44c65,
++    0x4db26158, 0x3ab551ce, 0xa3bc0074, 0xd4bb30e2, 0x4adfa541, 0x3dd895d7,
++    0xa4d1c46d, 0xd3d6f4fb, 0x4369e96a, 0x346ed9fc, 0xad678846, 0xda60b8d0,
++    0x44042d73, 0x33031de5, 0xaa0a4c5f, 0xdd0d7cc9, 0x5005713c, 0x270241aa,
++    0xbe0b1010, 0xc90c2086, 0x5768b525, 0x206f85b3, 0xb966d409, 0xce61e49f,
++    0x5edef90e, 0x29d9c998, 0xb0d09822, 0xc7d7a8b4, 0x59b33d17, 0x2eb40d81,
++    0xb7bd5c3b, 0xc0ba6cad, 0xedb88320, 0x9abfb3b6, 0x03b6e20c, 0x74b1d29a,
++    0xead54739, 0x9dd277af, 0x04db2615, 0x73dc1683, 0xe3630b12, 0x94643b84,
++    0x0d6d6a3e, 0x7a6a5aa8, 0xe40ecf0b, 0x9309ff9d, 0x0a00ae27, 0x7d079eb1,
++    0xf00f9344, 0x8708a3d2, 0x1e01f268, 0x6906c2fe, 0xf762575d, 0x806567cb,
++    0x196c3671, 0x6e6b06e7, 0xfed41b76, 0x89d32be0, 0x10da7a5a, 0x67dd4acc,
++    0xf9b9df6f, 0x8ebeeff9, 0x17b7be43, 0x60b08ed5, 0xd6d6a3e8, 0xa1d1937e,
++    0x38d8c2c4, 0x4fdff252, 0xd1bb67f1, 0xa6bc5767, 0x3fb506dd, 0x48b2364b,
++    0xd80d2bda, 0xaf0a1b4c, 0x36034af6, 0x41047a60, 0xdf60efc3, 0xa867df55,
++    0x316e8eef, 0x4669be79, 0xcb61b38c, 0xbc66831a, 0x256fd2a0, 0x5268e236,
++    0xcc0c7795, 0xbb0b4703, 0x220216b9, 0x5505262f, 0xc5ba3bbe, 0xb2bd0b28,
++    0x2bb45a92, 0x5cb36a04, 0xc2d7ffa7, 0xb5d0cf31, 0x2cd99e8b, 0x5bdeae1d,
++    0x9b64c2b0, 0xec63f226, 0x756aa39c, 0x026d930a, 0x9c0906a9, 0xeb0e363f,
++    0x72076785, 0x05005713, 0x95bf4a82, 0xe2b87a14, 0x7bb12bae, 0x0cb61b38,
++    0x92d28e9b, 0xe5d5be0d, 0x7cdcefb7, 0x0bdbdf21, 0x86d3d2d4, 0xf1d4e242,
++    0x68ddb3f8, 0x1fda836e, 0x81be16cd, 0xf6b9265b, 0x6fb077e1, 0x18b74777,
++    0x88085ae6, 0xff0f6a70, 0x66063bca, 0x11010b5c, 0x8f659eff, 0xf862ae69,
++    0x616bffd3, 0x166ccf45, 0xa00ae278, 0xd70dd2ee, 0x4e048354, 0x3903b3c2,
++    0xa7672661, 0xd06016f7, 0x4969474d, 0x3e6e77db, 0xaed16a4a, 0xd9d65adc,
++    0x40df0b66, 0x37d83bf0, 0xa9bcae53, 0xdebb9ec5, 0x47b2cf7f, 0x30b5ffe9,
++    0xbdbdf21c, 0xcabac28a, 0x53b39330, 0x24b4a3a6, 0xbad03605, 0xcdd70693,
++    0x54de5729, 0x23d967bf, 0xb3667a2e, 0xc4614ab8, 0x5d681b02, 0x2a6f2b94,
++    0xb40bbe37, 0xc30c8ea1, 0x5a05df1b, 0x2d02ef8d
++};
++
++/* Function declarations */
++static void crc_init(Crc32 *, uInt);
++static void crc_update(Crc32 *, uInt);
++void initsabyenc(void);
++static int decode_buffer_usenet(PyObject *, char *, int, char **, Crc32 *, uInt *,  Bool *);
++static char * find_text_in_pylist(PyObject *, char *, char **, int *);
++int extract_filename_from_pylist(PyObject *, int *, char **, char **, char **);
++int extract_int_from_pylist(PyObject *, int *, char **, char **, int);
++
++/* Python API requirements */
++static char decode_usenet_chunks_doc[] = "decode_usenet_chunks(list_of_chunks, nr_bytes)";
++
++static PyMethodDef funcs[] = {   /* Method table: one exported function followed by the terminating sentinel */
++        {"decode_usenet_chunks", (PyCFunction) decode_usenet_chunks, METH_KEYWORDS | METH_VARARGS, decode_usenet_chunks_doc},   /* accepts positional and keyword arguments */
++        {NULL, NULL, 0, NULL}   /* sentinel entry marking the end of the table */
++};
++
++/* Function definitions */
++static void crc_init(Crc32 *crc, uInt value) {   /* Reset *crc: start the running CRC at `value` and clear the byte counter */
++    crc->crc = value;    /* caller-supplied starting CRC */
++    crc->bytes = 0UL;    /* nothing has been fed through crc_update() yet */
++}
++
++static void crc_update(Crc32 *crc, uInt c) {   /* Fold one input value `c` into the running CRC held in *crc */
++    crc->crc = crc_tab[(crc->crc^c)&0xff]^((crc->crc>>8)&0xffffff);   /* table entry selected by the low 8 bits of (crc ^ c), XORed with the old CRC shifted right 8 and masked to 24 bits */
++    crc->bytes++;   /* count one more processed value */
++}
++
++static int decode_buffer_usenet(PyObject *Py_input_list, char *output_buffer, int num_bytes_reserved,
++                                char **filename_out,  Crc32 *crc, uInt *crc_yenc, Bool *crc_correct) {
++    // For the list
++    Py_ssize_t num_lines;
++    int list_index = 0;
++
++    // Search variables
++    char *cur_char; // Pointer to search result
++    char *start_loc; // Pointer to current char
++    char *crc_holder = NULL;
++
++    // Other vars
++    char byte;
++    int part_begin = 0;
++    int part_size = 0;
++    int decoded_bytes = 0;
++    int safe_nr_bytes = 0;
++    Bool escape_char = 0;
++    int double_point_escape = 0;
++
++    /*
++     ANALYZE HEADER
++     Always in the same format, e.g.:
++
++     =ybegin part=41 line=128 size=49152000 name=90E2Sdvsmds0801dvsmds90E.part06.rar
++     =ypart begin=15360001 end=15744000
++
++     But we only care about the filename and the size
++     For single-part yEnc we need to get the size from the first line; for
++     multi-part we need to compute end-begin+1 from the second line
++    */
++
++    // Get number of lines
++    num_lines = PyList_Size(Py_input_list);
++
++    // Get first chunk
++    cur_char = PyString_AsString(PyList_GetItem(Py_input_list, 0));
++
++    // Start of header (which doesn't have to be part of first chunk)
++    start_loc = find_text_in_pylist(Py_input_list, "=ybegin", &cur_char, &list_index);
++
++    if(start_loc) {
++        // First we find the size (for single-part files)
++        start_loc = find_text_in_pylist(Py_input_list, "size=", &cur_char, &list_index);
++        if(start_loc) {
++            // Move over a bit
++            part_size = extract_int_from_pylist(Py_input_list, &list_index, &start_loc, &cur_char, 0);
++        }
++
++        // Find name
++        start_loc = find_text_in_pylist(Py_input_list, "name=", &cur_char, &list_index);
++        if(start_loc) {
++            extract_filename_from_pylist(Py_input_list, &list_index, &start_loc, &cur_char, filename_out);
++        } else {
++            // Don't go on without a name
++            return 0;
++        }
++
++        // Is there a multi-part indicator?
++        start_loc = find_text_in_pylist(Py_input_list, "=ypart", &cur_char, &list_index);
++        if(start_loc) {
++            // Reset size, so we for sure don't use the previously found "size=" value
++            part_size = 0;
++
++            // Find part-begin
++            start_loc = find_text_in_pylist(Py_input_list, "begin=", &cur_char, &list_index);
++            if(start_loc) {
++                // Get begin
++                part_begin = extract_int_from_pylist(Py_input_list, &list_index, &start_loc, &cur_char, 0);
++
++                // Find part-end
++                start_loc = find_text_in_pylist(Py_input_list, "end=", &cur_char, &list_index);
++                if(start_loc) {
++                    // Move over a bit
++                    part_size = extract_int_from_pylist(Py_input_list, &list_index, &start_loc, &cur_char, 0) - part_begin + 1;
++                }
++            }
++
++            // We want to make sure it's a valid value
++            if(part_size <= 0  || part_size > num_bytes_reserved) {
++                // Set safe value
++                part_size = (int)(num_bytes_reserved*0.75);
++            }
++
++            // Skip over everything until the end of the line, where the content starts
++            for( ; *cur_char != LF && *cur_char != CR && *cur_char != ZERO; cur_char++);
++        }
++
++        // How many bytes can be checked safely?
++        safe_nr_bytes = part_size ? part_size - 50 : 0;
++
++        /*
++            During the loop we need to take care of special cases.
++            The escape "=" and whatever it escapes might be on the
++            next Python-list-item. Also the sequence "\n.." should
++            only convert one dot, but this sequence might also be
++            split across list items.
++        */
++        while(1) {
++            // Get current char and increment pointer
++            cur_char++;
++
++            // End of the line of list-item
++            if(*cur_char == ZERO) {
++                // Are we outside the list?
++                list_index++;
++                if(list_index == num_lines) {
++                    break;
++                }
++
++                // Get reference to the new line
++                cur_char = PyString_AsString(PyList_GetItem(Py_input_list, list_index));
++            }
++
++            // Special characters
++            if(escape_char) {
++                *output_buffer++ = (*cur_char - 106);
++                escape_char = 0;
++                double_point_escape = 0;
++            } else if(*cur_char == ESC) {
++                // strncmp is expensive, only perform near the end
++                if(decoded_bytes > safe_nr_bytes) {
++                    /*
++                        Looking for the end, format:
++                        =yend size=384000 part=41 pcrc32=084e170f
++                        If a = is followed by an end-of-line, it's very
++                        likely that the yend part is on the next line
++                        and thus we would miss it
++                    */
... 496 lines suppressed ...

-- 
Alioth's /usr/local/bin/git-commit-notice on /srv/git.debian.org/git/python-modules/packages/python-sabyenc.git



More information about the Python-modules-commits mailing list