[med-svn] [Git][med-team/cyvcf2][upstream] New upstream version 0.30.28
Andreas Tille (@tille)
gitlab at salsa.debian.org
Wed Feb 7 10:40:44 GMT 2024
Andreas Tille pushed to branch upstream at Debian Med / cyvcf2
Commits:
7c97cba8 by Andreas Tille at 2024-02-07T09:56:39+01:00
New upstream version 0.30.28
- - - - -
24 changed files:
- .github/workflows/build.yml
- .github/workflows/wheels.yml
- .gitignore
- CHANGES.md
- MANIFEST.in
- README.md
- + ci/Dockerfile.alpine.test
- ci/Dockerfile.test → ci/Dockerfile.slim.test
- ci/linux-deps
- − ci/osx-arm64-deps
- ci/osx-deps
- cyvcf2/__init__.py
- cyvcf2/cyvcf2.pxd
- cyvcf2/cyvcf2.pyx
- cyvcf2/helpers.c
- + cyvcf2/tests/multi-contig.bcf
- + cyvcf2/tests/multi-contig.bcf.csi
- + cyvcf2/tests/multi-contig.vcf.gz
- + cyvcf2/tests/multi-contig.vcf.gz.csi
- + cyvcf2/tests/multi-contig.vcf.gz.tbi
- cyvcf2/tests/test_reader.py
- pyproject.toml
- requirements.txt
- setup.py
Changes:
=====================================
.github/workflows/build.yml
=====================================
@@ -3,14 +3,25 @@ name: Build
on: [push, pull_request]
jobs:
- docker-build-and-test:
- name: Docker Build and Test on ${{ matrix.platform }}
- runs-on: ubuntu-latest
+ docker-build:
+ name: Docker Run Test on ${{ matrix.platform }}-${{ matrix.python_tag_type }}
+ runs-on: ubuntu-22.04
strategy:
matrix:
platform:
- linux/amd64
- linux/arm64
+ python_tag_type:
+ - slim
+ - alpine
+ exclude:
+ # amd64 with glibc have full direct test
+ - platform: linux/amd64
+ python_tag_type: slim
+
+ # test alpine only on amd64
+ - platform: linux/arm64
+ python_tag_type: alpine
steps:
- uses: actions/checkout at v4
@@ -20,51 +31,184 @@ jobs:
uses: docker/setup-qemu-action at v3
- name: Set up Docker Buildx
uses: docker/setup-buildx-action at v3
- - name: Docker Build and Push
+
+ - name: Docker Build
uses: docker/build-push-action at v5
with:
- context: .
- file: ./ci/Dockerfile.test
+ context: .
+ file: ./ci/Dockerfile.${{ matrix.python_tag_type }}.test
platforms: ${{ matrix.platform }}
- tags: cyvcf2:test
+ tags: cyvcf2:${{ matrix.python_tag_type }}-test
push: false
load: true
- build-args: |
- PYTHON_VERSION=slim
+ build-args: |
+ PYTHON_VERSION=${{ matrix.python_tag_type }}
- name: Docker Run Tests
run: |
- docker run --rm --platform ${{ matrix.platform }} cyvcf2:test pytest --cov cyvcf2 --cov-report term-missing
+ docker run --rm --platform ${{ matrix.platform }} cyvcf2:${{ matrix.python_tag_type }}-test pytest --cov cyvcf2 --cov-report term-missing
build:
- name: Run tests on Python ${{ matrix.python-version }}
- runs-on: ubuntu-20.04
+ name: Run tests on Python ${{ matrix.python-version }} ${{ matrix.os }}
+ runs-on: ${{ matrix.os }}
+ strategy:
+ matrix:
+ os: [ubuntu-22.04, macos-12]
+ python-version:
+ ["pypy3.10", "3.7", "3.8", "3.9", "3.10", "3.11", "3.12"]
+ exclude:
+ # Run only the latest versions on macOS and windows
+ - os: macos-12
+ python-version: "pypy3.10"
+ - os: macos-12
+ python-version: "3.7"
+ - os: macos-12
+ python-version: "3.8"
+ - os: macos-12
+ python-version: "3.9"
+ - os: macos-12
+ python-version: "3.10"
+ - os: macos-12
+ python-version: "3.11"
+
+ steps:
+ - uses: actions/checkout at v4
+ with:
+ submodules: recursive
+ - name: Set up Python ${{ matrix.python-version }}
+ uses: actions/setup-python at v5
+ with:
+ python-version: ${{ matrix.python-version }}
+
+ - name: Set macOS env
+ if: runner.os == 'macOS'
+ run: |
+ # building options
+ echo "MACOSX_DEPLOYMENT_TARGET=10.9" >> "$GITHUB_ENV"
+ echo "ARCHFLAGS=-arch x86_64" >> "$GITHUB_ENV"
+
+ - name: Install Linux build prerequisites
+ if: runner.os == 'Linux'
+ run: |
+ sudo apt-get update
+ sudo apt-get install -y --no-install-recommends libcurl4-openssl-dev zlib1g-dev libssl-dev liblzma-dev \
+ libbz2-dev libdeflate-dev
+
+ - name: Install macOS build prerequisites
+ if: runner.os == 'macOS'
+ run: |
+ brew install automake libdeflate
+
+ - name: Install
+ run: |
+ pip install -r requirements.txt
+ pip install pytest pytest-cov
+ CYVCF2_HTSLIB_CONFIGURE_OPTIONS="--enable-libcurl --enable-s3 --enable-lzma --enable-bz2 --with-libdeflate" \
+ CYTHONIZE=1 python setup.py build_ext -i
+
+ - name: Test
+ run: |
+ pytest --cov cyvcf2 --cov-report term-missing
+
+ windows_build:
+ name: Run tests on Python windows-2022 MSYS2 UCRT64
+ runs-on: windows-2022
+ defaults:
+ run:
+ shell: msys2 {0}
+
+ steps:
+ - uses: actions/checkout at v4
+ with:
+ submodules: recursive
+
+ - name: "Setup MSYS2"
+ uses: msys2/setup-msys2 at v2
+ with:
+ msystem: UCRT64
+ path-type: inherit
+ install: >-
+ mingw-w64-ucrt-x86_64-gcc
+ mingw-w64-ucrt-x86_64-make
+ mingw-w64-ucrt-x86_64-libdeflate
+ mingw-w64-ucrt-x86_64-xz
+ mingw-w64-ucrt-x86_64-curl
+ mingw-w64-ucrt-x86_64-zlib
+ mingw-w64-ucrt-x86_64-bzip2
+ mingw-w64-ucrt-x86_64-tools-git
+ mingw-w64-ucrt-x86_64-python-pkgconfig
+ mingw-w64-ucrt-x86_64-pkg-config
+ mingw-w64-ucrt-x86_64-ninja
+ mingw-w64-ucrt-x86_64-python
+ mingw-w64-ucrt-x86_64-python-pip
+ make
+ automake
+ autoconf
+ git
+
+ - name: Install Windows build prerequisites
+ run: |
+ cd htslib
+ autoreconf -i
+ ./configure --enable-libcurl --enable-s3 --enable-lzma --enable-bz2 --with-libdeflate
+ make
+ make install
+
+ - name: Install
+ run: |
+ pip install -r requirements.txt
+ pip install pytest pytest-cov
+ CYTHONIZE=1 python setup.py build_ext -i
+
+ - name: Test
+ run: |
+ pytest --cov cyvcf2 --cov-report term-missing
+
+ sdist:
+ runs-on: ubuntu-22.04
strategy:
matrix:
- python-version: ["3.7", "3.8", "3.9", "3.10", "3.11", "3.12"]
+ python-version: ["3.12"]
steps:
- - uses: actions/checkout at v3
- with:
- submodules: true
- - name: Set up Python ${{ matrix.python-version }}
- uses: actions/setup-python at v4
- with:
- python-version: ${{ matrix.python-version }}
- - name: Install
- run: |
- sudo apt-get update
- sudo apt-get install libcurl4-openssl-dev
- pip install -r requirements.txt
- pip install pytest pytest-cov
- git submodule update --init --recursive
- cd htslib
- autoheader && autoconf && autoreconf --install
- ./configure --enable-s3 --disable-lzma --disable-bz2
- make
- cd ..
- CYTHONIZE=1 python setup.py build_ext -i
- - name: Test
- run: |
- pytest --cov cyvcf2 --cov-report term-missing
+ - uses: actions/checkout at v4
+ with:
+ submodules: recursive
+ - name: Set up Python ${{ matrix.python-version }}
+ uses: actions/setup-python at v5
+ with:
+ python-version: ${{ matrix.python-version }}
+
+ - name: Install sdist prerequisites
+ run: |
+ pip install -r requirements.txt
+
+ - name: Create source distribution
+ run: CYTHONIZE=1 python setup.py sdist
+
+ - name: Install Linux build prerequisites
+ if: runner.os == 'Linux'
+ run: |
+ sudo apt-get update
+ sudo apt-get install -y --no-install-recommends libcurl4-openssl-dev zlib1g-dev libssl-dev liblzma-dev \
+ libbz2-dev libdeflate-dev
+ - name: Build (via sdist tarball)
+ run: pip install --verbose --no-deps --no-binary='cyvcf2' cyvcf2-*.tar.gz
+ working-directory: dist
+
+ - name: Install test prerequisites
+ run: |
+ pip install pytest pytest-cov
+
+ - name: Test
+ run: |
+ pytest --import-mode importlib --cov cyvcf2 --cov-report term-missing
+
+ - name: Upload sdist tarball
+ if: runner.os == 'Linux'
+ uses: actions/upload-artifact at v4
+ with:
+ name: sdist
+ path: dist/cyvcf2-*.tar.gz
+ retention-days: 7
=====================================
.github/workflows/wheels.yml
=====================================
@@ -5,138 +5,141 @@ on:
branches:
- main
tags:
- - 'v*.*.*'
+ - "v*.*.*"
workflow_dispatch:
inputs:
debug_enabled:
- description: 'Run the build with tmate debugging enabled (https://github.com/marketplace/actions/debugging-with-tmate)'
+ description: "Run the build with tmate debugging enabled (https://github.com/marketplace/actions/debugging-with-tmate)"
required: false
default: false
schedule:
# run weekly on a Monday
- - cron: '0 0 * * 1'
+ - cron: "0 0 * * 1"
jobs:
build_wheels:
- name: Build wheels on ${{ matrix.os }}
- runs-on: ${{ matrix.os }}
+ name: Build wheels for ${{ matrix.python-version }}-${{ matrix.buildplat[1] }}
+ runs-on: ${{ matrix.buildplat[0] }}
strategy:
matrix:
- os: [ubuntu-20.04, macos-latest]
+ buildplat:
+ - [ubuntu-22.04, manylinux_x86_64]
+ - [ubuntu-22.04, musllinux_x86_64]
+ - [ubuntu-22.04, manylinux_aarch64]
+ - [ubuntu-22.04, musllinux_aarch64]
+ - [macos-12, macosx_x86_64]
+ - [macos-12, macosx_arm64]
+ python-version: [pp310, cp37, cp38, cp39, cp310, cp311, cp312]
+ exclude:
+ # pp310, cp37, cp38 on musllinux is not support
+ # cp39, cp310 on musllinux_aarch64, wheel building may hangup, ignore it
+ - buildplat: [ubuntu-22.04, musllinux_x86_64]
+ python-version: cp37
+ - buildplat: [ubuntu-22.04, musllinux_x86_64]
+ python-version: cp38
+ - buildplat: [ubuntu-22.04, musllinux_x86_64]
+ python-version: pp310
+ - buildplat: [ubuntu-22.04, musllinux_aarch64]
+ python-version: cp37
+ - buildplat: [ubuntu-22.04, musllinux_aarch64]
+ python-version: cp38
+ - buildplat: [ubuntu-22.04, musllinux_aarch64]
+ python-version: cp39
+ - buildplat: [ubuntu-22.04, musllinux_aarch64]
+ python-version: cp310
+ - buildplat: [ubuntu-22.04, musllinux_aarch64]
+ python-version: pp310
+ # cp37, pp310 on macos arm64 is not supported
+ - buildplat: [macos-12, macosx_arm64]
+ python-version: cp37
+ - buildplat: [macos-12, macosx_arm64]
+ python-version: pp310
steps:
- - uses: actions/checkout at v3
- with:
- submodules: true
- - uses: actions/setup-python at v4
- name: Install Python
- with:
- python-version: "3.12"
-
- - name: Install cibuildwheel
- run: |
- python -m pip install -U cibuildwheel
-
- - name: Build wheels for Linux
- if: matrix.os == 'ubuntu-20.04'
- run: |
- python -m cibuildwheel --output-dir wheelhouse
- env:
- CIBW_SKIP: "pp* *i686* *musllinux*"
- CIBW_MANYLINUX_X86_64_IMAGE: manylinux2014
- CIBW_BEFORE_BUILD_LINUX: "{project}/ci/linux-deps"
- CIBW_TEST_COMMAND: "{project}/ci/test"
- CIBW_ENVIRONMENT: "CYTHONIZE=1 LIBDEFLATE=1 LDFLAGS='-L/usr/lib64/openssl11' CPPFLAGS='-I/usr/include/openssl11' C_INCLUDE_PATH='/root/include' LIBRARY_PATH='/root/lib'"
- CIBW_REPAIR_WHEEL_COMMAND_LINUX: LD_LIBRARY_PATH='/root/lib' auditwheel repair -w {dest_dir} {wheel}
-
- - name: Build wheels for Mac OS x86
- if: matrix.os == 'macos-latest'
- run: |
- python -m cibuildwheel --output-dir wheelhouse
- env:
- CIBW_SKIP: "pp* *i686*"
- CIBW_ARCHS_MACOS: "x86_64"
- CIBW_MANYLINUX_X86_64_IMAGE: manylinux2014
- CIBW_BEFORE_BUILD_MACOS: "{project}/ci/osx-deps"
- CIBW_TEST_COMMAND: "{project}/ci/test"
- CIBW_ENVIRONMENT: "CYTHONIZE=1 LIBDEFLATE=1 C_INCLUDE_PATH='/usr/local/include' LIBRARY_PATH='/usr/local/lib'"
- # https://cibuildwheel.readthedocs.io/en/stable/faq/#macos-passing-dyld_library_path-to-delocate
- CIBW_REPAIR_WHEEL_COMMAND_MACOS: >
- DYLD_LIBRARY_PATH=/usr/local/lib delocate-listdeps {wheel} &&
- DYLD_LIBRARY_PATH=/usr/local/lib delocate-wheel --require-archs {delocate_archs} -w {dest_dir} {wheel}
- LDFLAGS: "-L/usr/local/opt/openssl at 1.1/lib"
- CPPFLAGS: "-I/usr/local/opt/openssl at 1.1/include"
- PKG_CONFIG_PATH: "/usr/local/opt/openssl at 1.1/lib/pkgconfig"
-
- - name: Build wheels for Mac OS arm64
- # don't build with libdeflate, see https://github.com/brentp/cyvcf2/issues/252
- if: matrix.os == 'macos-latest'
- run: |
- python -m cibuildwheel --output-dir wheelhouse
- env:
- CIBW_SKIP: "pp* *i686*"
- CIBW_ARCHS_MACOS: "arm64"
- CIBW_MANYLINUX_X86_64_IMAGE: manylinux2014
- CIBW_BEFORE_BUILD_MACOS: "{project}/ci/osx-arm64-deps"
- CIBW_TEST_COMMAND: "{project}/ci/test"
- CIBW_TEST_SKIP: "*-macosx_arm64"
- CIBW_ENVIRONMENT: "CYTHONIZE=1 C_INCLUDE_PATH='/usr/local/include' LIBRARY_PATH='/usr/local/lib'"
- # https://cibuildwheel.readthedocs.io/en/stable/faq/#macos-passing-dyld_library_path-to-delocate
- CIBW_REPAIR_WHEEL_COMMAND_MACOS: >
- DYLD_LIBRARY_PATH=/usr/local/lib delocate-listdeps {wheel} &&
- DYLD_LIBRARY_PATH=/usr/local/lib delocate-wheel --require-archs {delocate_archs} -w {dest_dir} {wheel}
- LDFLAGS: "-L/usr/local/opt/openssl at 1.1/lib"
- CPPFLAGS: "-I/usr/local/opt/openssl at 1.1/include"
- PKG_CONFIG_PATH: "/usr/local/opt/openssl at 1.1/lib/pkgconfig"
-
- # Enable tmate debugging of manually-triggered workflows if the input option was provided
- - name: Setup tmate session
- if: ${{ always() && github.event_name == 'workflow_dispatch' && github.event.inputs.debug_enabled == 'true' }}
- uses: mxschmitt/action-tmate at v3
-
- - uses: actions/upload-artifact at v2
- with:
- path: ./wheelhouse/*.whl
+ - uses: actions/checkout at v4
+ with:
+ submodules: recursive
+
+ - name: Set up QEMU
+ if: runner.os == 'Linux'
+ uses: docker/setup-qemu-action at v3
+
+ - name: Build wheels
+ uses: pypa/cibuildwheel at v2.16.4
+ with:
+ package-dir: .
+ output-dir: wheelhouse
+ config-file: "{package}/pyproject.toml"
+ env:
+ # select
+ CIBW_BUILD: ${{ matrix.python-version }}-${{ matrix.buildplat[1] }}
+
+ # linux
+ CIBW_MANYLINUX_X86_64_IMAGE: manylinux2014
+ # manylinux2014 can't build on aarch64
+ CIBW_MANYLINUX_AARCH64_IMAGE: manylinux_2_28
+ CIBW_MUSLLINUX_X86_64_IMAGE: musllinux_1_2
+ CIBW_MUSLLINUX_AARCH64_IMAGE: musllinux_1_2
+ CIBW_ARCHS_LINUX: auto64 aarch64
+ CIBW_BEFORE_BUILD_LINUX: "{project}/ci/linux-deps"
+ CIBW_REPAIR_WHEEL_COMMAND_LINUX: 'LD_LIBRARY_PATH="$LD_LIBRARY_PATH:/usr/local/lib64" && auditwheel repair -w {dest_dir} {wheel}'
+
+ # macos
+ CIBW_ARCHS_MACOS: auto64 arm64
+ CIBW_BEFORE_BUILD_MACOS: "{project}/ci/osx-deps"
+
+ # build
+ CIBW_ENVIRONMENT: >-
+ CYVCF2_HTSLIB_CONFIGURE_OPTIONS="--enable-libcurl --enable-s3 --enable-lzma --enable-bz2 --with-libdeflate"
+ CYTHONIZE=1
+ CIBW_TEST_COMMAND: "{project}/ci/test"
+ # macOS build arm64 on x86_64 with cross-compiler, not support test
+ CIBW_TEST_SKIP: "*-macosx_arm64"
+
+ # Enable tmate debugging of manually-triggered workflows if the input option was provided
+ - name: Setup tmate session
+ if: ${{ always() && github.event_name == 'workflow_dispatch' && github.event.inputs.debug_enabled == 'true' }}
+ uses: mxschmitt/action-tmate at v3
+
+ - uses: actions/upload-artifact at v4
+ with:
+ name: artifact-${{ matrix.python-version }}-${{ matrix.buildplat[1] }}
+ path: ./wheelhouse/*.whl
build_sdist:
name: Build source distribution
- runs-on: ubuntu-latest
+ runs-on: ubuntu-22.04
steps:
- - uses: actions/checkout at v2
-
- - uses: actions/setup-python at v4
+ - uses: actions/checkout at v4
+ with:
+ submodules: recursive
+ - uses: actions/setup-python at v5
name: Install Python
with:
python-version: "3.12"
- name: Install dependencies
run: |
- sudo apt-get update
- sudo apt-get install libcurl4-openssl-dev libbz2-dev liblzma-dev libssl-dev
- git submodule update --init --recursive
- cd htslib
- autoheader && autoconf && autoreconf --install
- ./configure --enable-libcurl --enable-s3 --enable-lzma --enable-bz2
- make
- cd ..
pip install -r requirements.txt
- name: Build sdist
run: CYTHONIZE=1 python setup.py sdist
- - uses: actions/upload-artifact at v2
+ - uses: actions/upload-artifact at v4
with:
+ name: artifact-sdist
path: dist/*.tar.gz
upload_pypi:
needs: [build_wheels, build_sdist]
- runs-on: ubuntu-latest
+ runs-on: ubuntu-22.04
# upload to PyPI on every tag starting with 'v'
if: github.event_name == 'push' && startsWith(github.event.ref, 'refs/tags/v')
steps:
- - uses: actions/download-artifact at v2
+ - uses: actions/download-artifact at v4
with:
- name: artifact
+ pattern: artifact-*
+ merge-multiple: true
path: dist
- uses: pypa/gh-action-pypi-publish at release/v1
=====================================
.gitignore
=====================================
@@ -19,3 +19,4 @@ _templates
setup-requires/*
.cache/v/cache/lastfailed
.idea
+**/__pycache__
=====================================
CHANGES.md
=====================================
@@ -1,3 +1,8 @@
+# v0.30.27
+
++ support num_records using index stats (#295 from @jeromekelleher)
++ don't remove htslib/config.status (#296)
+
# v0.30.25
+ bump to get new release for CI/wheel fixes. thanks to @graphenn (#286) and @oyvinev (#297)
=====================================
MANIFEST.in
=====================================
@@ -1,12 +1,18 @@
-include cyvcf2/tests/*
include LICENSE
+include *.md
include cyvcf2/*.pyx
include cyvcf2/*.pxd
-include cyvcf2/*.c
-include cyvcf2/*.h
-include *.md
-include htslib/*.c
-include htslib/*.h
-include htslib/htslib/*.h
-include htslib/cram/*.c
-include htslib/cram/*.h
+include cyvcf2/*.[ch]
+
+# exclude tests from pypi because no data file
+prune cyvcf2/tests
+
+# htslib
+include htslib/LICENSE htslib/README
+recursive-include htslib *.[ch]
+exclude htslib/*config*.h
+
+include htslib/configure.ac htslib/m4/*.m4 htslib/*.in
+include htslib/configure htslib/version.sh
+include htslib/Makefile htslib/*.mk
+exclude htslib/config.mk htslib/htscodecs.mk
=====================================
README.md
=====================================
@@ -14,7 +14,7 @@ If you use cyvcf2, please cite the [paper](https://academic.oup.com/bioinformati
Fast python **(2 and 3)** parsing of VCF and BCF including region-queries.
-[![Build Status](https://github.com/brentp/cyvcf2/workflows/Build/badge.svg)](https://github.com/brentp/cyvcf2/actions?query=workflow%3ABuild)
+[![Build](https://github.com/brentp/cyvcf2/actions/workflows/build.yml/badge.svg)](https://github.com/brentp/cyvcf2/actions/workflows/build.yml)
cyvcf2 is a cython wrapper around [htslib](https://github.com/samtools/htslib) built for fast parsing of [Variant Call Format](https://en.m.wikipedia.org/wiki/Variant_Call_Format) (VCF) files.
@@ -70,24 +70,35 @@ for v in vcf('11:435345-556565'):
Installation
============
-## pip (assuming you have htslib < 1.10 installed)
+## pip with bundled htslib
```
pip install cyvcf2
```
+## pip with system htslib
+
+Assuming you have already built and installed htslib version 1.12 or higher.
+```
+CYVCF2_HTSLIB_MODE=EXTERNAL pip install --no-binary cyvcf2 cyvcf2
+```
+
+## windows (experimental, only test on MSYS2)
+
+Assuming you have already built and installed htslib.
+```
+SETUPTOOLS_USE_DISTUTILS=stdlib pip install cyvcf2
+```
+
## github (building htslib and cyvcf2 from source)
```
git clone --recursive https://github.com/brentp/cyvcf2
-cd cyvcf2/htslib
-autoheader
-autoconf
-./configure --enable-libcurl
-make
-
-cd ..
pip install -r requirements.txt
-CYTHONIZE=1 pip install -e .
+# sometimes it can be required to remove old files:
+# python setup.py clean_ext
+CYVCF2_HTSLIB_MODE=BUILTIN CYTHONIZE=1 python setup.py install
+# or to use a system htslib.so
+CYVCF2_HTSLIB_MODE=EXTERNAL python setup.py install
```
On **OSX**, using brew, you may have to set the following as indicated by the brew install:
=====================================
ci/Dockerfile.alpine.test
=====================================
@@ -0,0 +1,15 @@
+ARG PYTHON_VERSION=alpine
+
+FROM python:${PYTHON_VERSION}
+
+WORKDIR /workspace
+
+RUN apk add --no-cache build-base autoconf automake git xz-dev curl-dev libdeflate-dev bzip2-dev
+
+COPY . .
+
+RUN pip install -r requirements.txt && pip install pytest pytest-cov
+
+# build cyvcf2
+RUN CYVCF2_HTSLIB_CONFIGURE_OPTIONS="--enable-libcurl --enable-s3 --enable-lzma --enable-bz2 --with-libdeflate" \
+ CYTHONIZE=1 python setup.py build_ext -i
=====================================
ci/Dockerfile.test → ci/Dockerfile.slim.test
=====================================
@@ -4,17 +4,14 @@ FROM python:${PYTHON_VERSION}
WORKDIR /workspace
-RUN apt-get update && apt-get install --no-install-recommends -y autoconf automake gcc \
- libcurl4-openssl-dev make git libc6-dev zlib1g-dev libssl-dev liblzma-dev libbz2-dev && \
+RUN apt-get update && apt-get install --no-install-recommends -y autoconf automake gcc libcurl4-openssl-dev \
+ make git libc6-dev zlib1g-dev libssl-dev liblzma-dev libbz2-dev libdeflate-dev && \
rm -rf /var/lib/apt/lists/*
COPY . .
-# build htslib
-RUN cd htslib && autoheader && autoconf && autoreconf --install && \
- ./configure --enable-s3 --disable-lzma --disable-bz2 && make
-
RUN pip install -r requirements.txt && pip install pytest pytest-cov
# build cyvcf2
-RUN CYTHONIZE=1 python setup.py build_ext -i
+RUN CYVCF2_HTSLIB_CONFIGURE_OPTIONS="--enable-libcurl --enable-s3 --enable-lzma --enable-bz2 --with-libdeflate" \
+ CYTHONIZE=1 python setup.py build_ext -i
=====================================
ci/linux-deps
=====================================
@@ -1,44 +1,43 @@
#!/bin/bash
-set -e
-
-yum install -y openssl11-devel
-yum install -y libffi libffi-devel zlib-devel
-yum install -y bzip2-devel bzip2-libs xz-devel xz-libs
-
-git submodule init
-git submodule update
-git submodule update --init --recursive
-
-curl -L -O https://www.libssh2.org/download/libssh2-1.9.0.tar.gz
-tar xzf libssh2-1.9.0.tar.gz
-cd libssh2-1.9.0
-./configure --prefix=/root
-make
-make install
-cd ..
-rm -rf libssh2-1.9.0
-
-curl -L -O https://curl.se/download/curl-7.73.0.tar.gz
-tar xzf curl-7.73.0.tar.gz
-cd curl-7.73.0
-./configure --with-libssh2 --prefix=/root
-make
-make install
-cd ..
-rm -rf curl-7.73.0
-
-curl -L -o libdeflate-v1.8.tar.gz https://github.com/ebiggers/libdeflate/archive/refs/tags/v1.8.tar.gz
-tar xzf libdeflate-v1.8.tar.gz
-cd libdeflate-1.8
-make
-make install PREFIX=/root
-cd ..
-
-cd htslib
-# configure fails with autoconf 2.71 (in /usr/local/bin), so use 2.69 (in /usr/bin)
-/usr/bin/autoconf -V
-/usr/bin/autoheader
-/usr/bin/autoconf
-./configure --enable-libcurl --enable-s3 --enable-lzma --enable-bz2
-make
+# Configure the libraries needed to build wheel packages on linux.
+# This script is designed to be used by cibuildwheel as CIBW_BEFORE_ALL_LINUX
+
+set -euo pipefail
+
+# dir="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
+
+source /etc/os-release
+
+echo "manylinux image woking on $ID"
+
+# Install cyvcf2 development files.
+case "$ID" in
+almalinux)
+ dnf install -y bzip2-devel xz-devel libcurl-devel openssl-devel openblas-devel epel-release
+
+ # packages at epel
+ dnf install -y libdeflate-devel
+ ;;
+
+alpine)
+ apk add --no-cache xz-dev curl-dev libdeflate-dev
+ ;;
+
+centos)
+ yum install -y bzip2-devel xz-devel libcurl-devel openssl-devel
+
+ LIBDEFLATE_VERSION=1.19
+ curl -L -o libdeflate-v"$LIBDEFLATE_VERSION".tar.gz https://github.com/ebiggers/libdeflate/archive/refs/tags/v"$LIBDEFLATE_VERSION".tar.gz
+ tar xzf libdeflate-v"$LIBDEFLATE_VERSION".tar.gz
+ cd libdeflate-"$LIBDEFLATE_VERSION"
+ cmake -B build && cmake --build build
+ cd ./build/ && make install
+ cd ../..
+ ;;
+
+*)
+ echo "$0: unexpected Linux distribution: '$ID'" >&2
+ exit 1
+ ;;
+esac
=====================================
ci/osx-arm64-deps deleted
=====================================
@@ -1,19 +0,0 @@
-#!/bin/bash
-
-set -e
-
-git submodule init
-git submodule update
-git submodule update --init --recursive
-
-# configure fails with autoconf 2.71, so downgrade
-# see https://github.com/asdf-vm/asdf-erlang/issues/195
-brew install autoconf at 2.69 && \
-brew link --overwrite autoconf at 2.69 && \
-autoconf -V
-
-cd htslib
-autoheader
-autoconf
-./configure --enable-libcurl --enable-s3 --enable-lzma --enable-bz2 --without-libdeflate
-make
=====================================
ci/osx-deps
=====================================
@@ -1,26 +1,26 @@
#!/bin/bash
-set -e
+set -euo pipefail
-git submodule init
-git submodule update
-git submodule update --init --recursive
+export DYLD_LIBRARY_PATH=/usr/local/lib
+# same with python
+export MACOSX_DEPLOYMENT_TARGET=10.9
-# configure fails with autoconf 2.71, so downgrade
-# see https://github.com/asdf-vm/asdf-erlang/issues/195
-brew install autoconf at 2.69 && \
-brew link --overwrite autoconf at 2.69 && \
-autoconf -V
+brew install automake
+brew unlink xz
-curl -L -o libdeflate-v1.8.tar.gz https://github.com/ebiggers/libdeflate/archive/refs/tags/v1.8.tar.gz
-tar xzf libdeflate-v1.8.tar.gz
-cd libdeflate-1.8
-make
-make install
-cd ..
+# build liblzma and libdelfate for muti arch
-cd htslib
-autoheader
-autoconf
-./configure --enable-libcurl --enable-s3 --enable-lzma --enable-bz2
-make
+XZ_VERSION=5.4.5
+curl -L -o xz-$XZ_VERSION.tar.gz "https://github.com/tukaani-project/xz/releases/download/v$XZ_VERSION/xz-$XZ_VERSION.tar.gz"
+tar -xf xz-$XZ_VERSION.tar.gz
+cd xz-$XZ_VERSION
+cmake -B build && cmake --build build
+cd ./build && make install
+
+LIBDEFLATE_VERSION=1.19
+curl -L -o libdeflate-v"$LIBDEFLATE_VERSION".tar.gz https://github.com/ebiggers/libdeflate/archive/refs/tags/v"$LIBDEFLATE_VERSION".tar.gz
+tar xzf libdeflate-v"$LIBDEFLATE_VERSION".tar.gz
+cd libdeflate-"$LIBDEFLATE_VERSION"
+cmake -B build && cmake --build build
+cd ./build && make install
=====================================
cyvcf2/__init__.py
=====================================
@@ -2,4 +2,4 @@ from .cyvcf2 import (VCF, Variant, Writer, r_ as r_unphased, par_relatedness,
par_het)
Reader = VCFReader = VCF
-__version__ = "0.30.25"
+__version__ = "0.30.28"
=====================================
cyvcf2/cyvcf2.pxd
=====================================
@@ -1,8 +1,11 @@
-from libc.stdint cimport int64_t, int32_t, uint32_t, int8_t, int16_t, uint8_t
+from libc.stdint cimport int64_t, uint64_t, int32_t, uint32_t, int8_t, int16_t, uint8_t
import numpy as np
cimport numpy as np
np.import_array()
+cdef extern from "string.h":
+ void* memcpy(void* dest, const void* src, size_t n)
+
cdef extern from "relatedness.h":
int related(int *gt_types, double *asum, int32_t *N, int32_t *ibs0,
int32_t *ibs2, int32_t n_samples)
@@ -67,15 +70,23 @@ cdef extern from "htslib/hts.h":
hts_idx_t *bcf_index_load(char *fn)
hts_idx_t *hts_idx_load2(const char *fn, const char *fnidx);
+ int hts_idx_nseq(const hts_idx_t *idx);
+ int hts_idx_get_stat(const hts_idx_t* idx, int tid, uint64_t* mapped,
+ uint64_t* unmapped);
#int hts_itr_next(BGZF *fp, hts_itr_t *iter, void *r, void *data);
void hts_itr_destroy(hts_itr_t *iter);
void hts_idx_destroy(hts_idx_t *idx);
cdef extern from "htslib/tbx.h":
+ ctypedef struct tbx_conf_t:
+ pass
+ # Expose details of tbx_t so that we can access the idx field
ctypedef struct tbx_t:
- pass
+ tbx_conf_t conf
+ hts_idx_t *idx
+ void *dict
tbx_t *tbx_index_load(const char *fn);
tbx_t *tbx_index_load2(const char *fn, const char *fnidx);
=====================================
cyvcf2/cyvcf2.pyx
=====================================
@@ -124,6 +124,24 @@ def r_(int32_t[::view.contiguous] a_gts, int32_t[::view.contiguous] b_gts, float
return r_unphased(&a_gts[0], &b_gts[0], f, n_samples)
+cdef char* pystring_to_cstring(str py_string):
+ # Convert Python string to byte string using UTF-8 encoding
+ cdef bytes byte_string = py_string.encode('utf-8') # Convert Python string to bytes
+ # Convert Python bytes to a C-compatible pointer
+ cdef const char* byte_string_ptr = byte_string
+
+ # Allocate memory for C string with size equal to byte string length plus null terminator
+ cdef size_t length = len(byte_string) + 1 # Plus 1 for the null terminator
+ cdef char* c_string = <char*>stdlib.malloc(length)
+ # return NULL if memory allocation fails
+ if c_string == NULL:
+ return c_string
+ # Copy byte string to C string using memcpy and add null terminator
+ memcpy(c_string, byte_string_ptr, length - 1) # Use memcpy to copy bytes to C string
+ c_string[length - 1] = b'\0' # Add null terminator to the end of the C string
+ return c_string
+
+
cdef set_constants(VCF v):
v.HOM_REF = 0
v.HET = 1
@@ -199,12 +217,14 @@ cdef class HTSFile:
"%s is not valid text_format or binary_format (format: %s mode: %s)" % (fname, self.hts.format.format, mode)
)
- def close(self):
+ cdef _c_close(self):
if self.hts != NULL:
if self.from_path:
hts_close(self.hts)
self.hts = NULL
+ def close(self):
+ self._c_close()
cdef class VCF(HTSFile):
"""
@@ -385,6 +405,14 @@ cdef class VCF(HTSFile):
raise Exception("unable to update to header")
def set_index(self, index_path=""):
+ # Clear any existing indexes
+ if self.idx != NULL:
+ tbx_destroy(self.idx)
+ self.idx = NULL
+ if self.hidx != NULL:
+ hts_idx_destroy(self.hidx)
+ self.hidx = NULL
+
if index_path.endswith(".tbi"):
self.idx = tbx_index_load2(to_bytes(self.fname), to_bytes(index_path))
if self.idx != NULL:
@@ -567,7 +595,9 @@ cdef class VCF(HTSFile):
if self.hdr != NULL:
bcf_hdr_destroy(self.hdr)
self.hdr = NULL
- self.close()
+
+ # Shouldn't call Python-space functions here
+ self._c_close()
if self.idx != NULL:
tbx_destroy(self.idx)
if self.hidx != NULL:
@@ -626,28 +656,73 @@ cdef class VCF(HTSFile):
stdlib.free(sls)
return self._seqlens
+ cdef _open_index(self):
+ """
+ Try to open an index, if not open already.
+ """
+ if self.hidx == NULL and self.idx == NULL:
+ if self.fname.decode(ENC).endswith(('.bcf', '.bcf.gz')):
+ self.hidx = bcf_index_load(self.fname)
+ else:
+ self.idx = tbx_index_load(to_bytes(self.fname))
+
property seqnames:
"list of chromosomes in the VCF"
def __get__(self):
if len(self._seqnames) > 0: return self._seqnames
- cdef char **cnames
+ cdef const char **cnames
cdef int i, n = 0
cnames = bcf_hdr_seqnames(self.hdr, &n)
- if n == 0 and self.fname.decode(ENC).endswith(('.bcf', '.bcf.gz')):
- if self.hidx == NULL:
- self.hidx = bcf_index_load(self.fname)
+ if n == 0:
+ self._open_index()
if self.hidx != NULL:
cnames = bcf_index_seqnames(self.hidx, self.hdr, &n)
- elif n == 0:
- if self.idx == NULL:
- self.idx = tbx_index_load(to_bytes(self.fname))
if self.idx !=NULL:
cnames = tbx_seqnames(self.idx, &n)
-
self._seqnames = [cnames[i].decode() for i in range(n)]
stdlib.free(cnames)
return self._seqnames
+ cdef _num_records(self):
+ cdef uint64_t total, records, v;
+ cdef int ret, tid, nseq;
+ cdef hts_idx_t *idx = NULL;
+
+ self._open_index()
+ if self.hidx != NULL:
+ idx = self.hidx
+ assert self.idx == NULL
+ if self.idx != NULL:
+ idx = self.idx.idx
+ assert self.hidx == NULL
+
+ if idx == NULL:
+ raise ValueError(
+ "File must be indexed to compute num_records (tip: use bcftools index)")
+
+ nseq = hts_idx_nseq(idx)
+ total = 0;
+ for tid in range(nseq):
+ # NOTE: the return value here doesn't seem to indicate an error
+ # condition, and correct values are computed when it returns < 0.
+ # bcftools index -n doesn't strictly check the output.
+ hts_idx_get_stat(idx, tid, &records, &v);
+ total += records
+ return total
+
+ property num_records:
+ """
+ The number of VCF records in the file, computed from the index.
+ If the file is not indexed (or an index has not been set using
+ ``set_index``) a ValueError is raised.
+
+ Note that incorrect values may be returned if a mismatched
+ index file (i.e., the index for a different VCF file) is used.
+ This is not detected as an error condition.
+ """
+ def __get__(self):
+ return self._num_records()
+
def plot_relatedness(self, riter):
import pandas as pd
from matplotlib import pyplot as plt
@@ -2379,19 +2454,29 @@ cdef class Writer(VCF):
def variant_from_string(self, variant_string):
cdef bcf1_t *b = bcf_init()
cdef kstring_t s
- tmp = to_bytes(variant_string)
- s.s = tmp
- s.l = len(variant_string)
- s.m = len(variant_string)
+
+ # vcf_parse may realloc s.s, so the memory must be created by malloc
+ s.s = pystring_to_cstring(variant_string)
+ if s.s == NULL:
+ bcf_destroy(b)
+ raise MemoryError("Failed to allocate memory")
+
+ # plus 1 for '\0' of cstring
+ s.l = len(variant_string) + 1
+ s.m = len(variant_string) + 1
+
ret = vcf_parse(&s, self.hdr, b)
if ret > 0:
bcf_destroy(b)
+ ks_free(&s)
raise Exception("error parsing:" + variant_string + " return value:" + ret)
var = newVariant(b, self)
if var.b.errcode == BCF_ERR_CTG_UNDEF:
self.add_to_header("##contig=<ID=%s>" % var.CHROM)
var.b.errcode = 0
+
+ ks_free(&s)
return var
def write_header(Writer self):
=====================================
cyvcf2/helpers.c
=====================================
@@ -4,10 +4,9 @@
int as_gts(int32_t *gts, int num_samples, int ploidy, int strict_gt, int HOM_ALT, int UNKNOWN) {
int j = 0, i, k;
- int missing= 0, found=0;
+ int missing= 0;
for (i = 0; i < ploidy * num_samples; i += ploidy){
missing = 0;
- found = 0;
for (k = 0; k < ploidy; k++) {
if bcf_gt_is_missing(gts[i+k]) {
missing += 1;
=====================================
cyvcf2/tests/multi-contig.bcf
=====================================
Binary files /dev/null and b/cyvcf2/tests/multi-contig.bcf differ
=====================================
cyvcf2/tests/multi-contig.bcf.csi
=====================================
Binary files /dev/null and b/cyvcf2/tests/multi-contig.bcf.csi differ
=====================================
cyvcf2/tests/multi-contig.vcf.gz
=====================================
Binary files /dev/null and b/cyvcf2/tests/multi-contig.vcf.gz differ
=====================================
cyvcf2/tests/multi-contig.vcf.gz.csi
=====================================
Binary files /dev/null and b/cyvcf2/tests/multi-contig.vcf.gz.csi differ
=====================================
cyvcf2/tests/multi-contig.vcf.gz.tbi
=====================================
Binary files /dev/null and b/cyvcf2/tests/multi-contig.vcf.gz.tbi differ
=====================================
cyvcf2/tests/test_reader.py
=====================================
@@ -1,5 +1,6 @@
from __future__ import print_function
import os.path
+import platform
import tempfile
import sys
import os
@@ -965,13 +966,20 @@ def test_alt_homozygous_gt():
assert v.gt_bases[0] == '<*:DEL>/<*:DEL>'
def test_write_missing_contig():
- input_vcf = VCF('{}/seg.vcf.gz'.format(HERE))
- output_vcf = Writer('/dev/null', input_vcf)
+ input_vcf = VCF("{}/seg.vcf.gz".format(HERE))
+ if platform.system() == "Windows":
+ output_vcf = "__o.vcf"
+ else:
+ output_vcf = "/dev/null"
+ output_vcf = Writer(output_vcf, input_vcf)
for v in input_vcf:
- v.genotypes = [[1,1,False]]
+ v.genotypes = [[1, 1, False]]
output_vcf.write_record(v)
output_vcf.close()
+ if platform.system() == "Windows":
+ os.unlink("__o.vcf")
+
def test_set_samples():
vcf = VCF(VCF_PATH)
assert len(vcf.samples) == 189, len(vcf.samples)
@@ -1000,9 +1008,14 @@ def test_issue44():
# "./." "." ".|." "0|0"
expected = [[-1, -1, False], [-1, False], [-1, -1, True], [0, 0, True]]
#print("", file=sys.stderr)
- for i, v in enumerate(VCF('__o.vcf')):
+
+ t = VCF('__o.vcf')
+ for i, v in enumerate(t):
#print(v.genotypes, file=sys.stderr)
assert v.genotypes == [expected[i]], (i, v.genotypes, expected[i])
+
+ # file should be closed before delete
+ t.close()
os.unlink("__o.vcf")
def test_id_field_updates():
@@ -1283,7 +1296,7 @@ def test_genotypes():
[0, 0, 1, 1],
[1, 1, 0, 0],
[1, 1, 0, 0],
- ]
+ ]
strict_exp_num = [x[:] for x in non_strict_exp_num]
strict_exp_num[1] = [0, 0, 2, 0] # both unknown
@@ -1323,3 +1336,77 @@ def test_issue17_no_gt():
with pytest.raises(Exception):
for v in vcf:
v.num_called # Used to give segmentation fault
+
+
+ at pytest.mark.parametrize("path", [
+ "test.vcf.gz",
+ "test-multiallelic-homozygous-alt.vcf.gz",
+ "test-strict-gt-option-flag.vcf.gz",
+ "test-strict-gt-option-flag.vcf.gz",
+ "multi-contig.vcf.gz",
+ "multi-contig.bcf",
+ "test.snpeff.bcf",
+ ])
+def test_num_records_indexed(path):
+ vcf = VCF(os.path.join(HERE, path))
+ n = len(list(vcf))
+ assert n == vcf.num_records
+ vcf = VCF(os.path.join(HERE, path))
+ assert n == vcf.num_records
+
+ at pytest.mark.parametrize("suffix", ["csi", "tbi"])
+def test_num_records_indexed_csi_tabix(suffix):
+ path = "multi-contig.vcf.gz"
+ index_file = os.path.join(HERE, "multi-contig.vcf.gz.{}".format(suffix))
+ vcf = VCF(os.path.join(HERE, path))
+ n = len(list(vcf))
+ # Explicitly set the index
+ vcf.set_index(index_file)
+ assert n == vcf.num_records
+ vcf = VCF(os.path.join(HERE, path))
+ vcf.set_index(index_file)
+ assert n == vcf.num_records
+
+def test_num_records_set_index_multiple_times():
+ path = os.path.join(HERE, "multi-contig.vcf.gz")
+ csi_index = path + ".csi"
+ tbi_index = path + ".tbi"
+ vcf = VCF(path)
+ n = len(list(vcf))
+ assert n == vcf.num_records
+ vcf.set_index(csi_index)
+ assert n == vcf.num_records
+
+ vcf = VCF(path)
+ assert n == vcf.num_records
+ vcf.set_index(tbi_index)
+ assert n == vcf.num_records
+
+ vcf = VCF(path)
+ vcf.set_index(csi_index)
+ assert n == vcf.num_records
+
+ vcf = VCF(path)
+ for _ in range(10):
+ vcf.set_index(csi_index)
+ assert n == vcf.num_records
+ vcf.set_index(tbi_index)
+ assert n == vcf.num_records
+
+def test_num_records_set_wrong_index():
+ path = os.path.join(HERE, "multi-contig.vcf.gz")
+ index = os.path.join(HERE, "test.vcf.gz.tbi")
+ vcf = VCF(path)
+ vcf.set_index(index)
+ # We compute the number of records from the index, and don't report an
+ # error
+ assert vcf.num_records == 115
+ assert vcf.num_records != len(list(vcf))
+
+ at pytest.mark.parametrize("path", [
+ "test-genotypes.vcf",
+ ])
+def test_num_records_no_index(path):
+ vcf = VCF(os.path.join(HERE, path))
+ with pytest.raises(ValueError, match="must be indexed"):
+ vcf.num_records
=====================================
pyproject.toml
=====================================
@@ -1,2 +1,8 @@
[build-system]
-requires = ["setuptools", "wheel", "cython>=0.23.3", "oldest-supported-numpy"]
+requires = [
+ "setuptools",
+ "wheel",
+ "cython>=0.23.3",
+ 'oldest-supported-numpy; os_name != "nt"',
+ 'numpy; os_name == "nt"'
+]
=====================================
requirements.txt
=====================================
@@ -1,5 +1,6 @@
cython>=0.23.3
-numpy
coloredlogs
click
setuptools
+numpy; os_name == 'nt'
+oldest-supported-numpy; os_name != 'nt'
=====================================
setup.py
=====================================
@@ -1,13 +1,20 @@
-import os
+import ctypes
import glob
+import os
+import platform
+import shutil
import sys
import subprocess
-import platform
-from setuptools import setup, Extension
+from setuptools import setup, Extension, Command
+from setuptools.command.build_ext import build_ext
+from setuptools.command.sdist import sdist
if sys.version_info.major == 2 and sys.version_info.minor != 7:
- sys.stderr.write("ERROR: cyvcf2 is only for python 2.7 or greater you are running %d.%d\n", (sys.version_info.major, sys.version_info.minor))
+ sys.stderr.write(
+ "ERROR: cyvcf2 is only for python 2.7 or greater you are running %d.%d\n",
+ (sys.version_info.major, sys.version_info.minor),
+ )
sys.exit(1)
import numpy as np
@@ -18,15 +25,17 @@ def get_version():
import ast
with open(os.path.join("cyvcf2", "__init__.py"), "r") as init_file:
- module = ast.parse(init_file.read())
+ module = ast.parse(init_file.read())
- version = (ast.literal_eval(node.value) for node in ast.walk(module)
- if isinstance(node, ast.Assign)
- and node.targets[0].id == "__version__")
+ version = (
+ ast.literal_eval(node.value)
+ for node in ast.walk(module)
+ if isinstance(node, ast.Assign) and node.targets[0].id == "__version__"
+ )
try:
- return next(version)
+ return next(version)
except StopIteration:
- raise ValueError("version could not be located")
+ raise ValueError("version could not be located")
def no_cythonize(extensions, **_ignore):
@@ -41,30 +50,210 @@ def no_cythonize(extensions, **_ignore):
return extensions
+def check_libhts():
+ os_type = platform.system()
+ if os_type == "Linux":
+ lib_name = "libhts.so"
+ elif os_type == "Darwin": # macOS
+ lib_name = "libhts.dylib"
+ elif os_type == "Windows":
+ lib_name = "hts-3.dll"
+ else:
+ return False # Unsupported OS
+
+ try:
+ ctypes.CDLL(lib_name)
+ return True
+ except Exception:
+ return False
+
+
+def build_htslib(htslib_configure_options, static_mode):
+ current_directory = os.getcwd()
+ os.chdir(os.path.join(current_directory, "htslib"))
+
+ if os.path.exists("config.status"):
+ print("# cyvcf2: config.status exists, skip configure htslib")
+ else:
+ subprocess.run(["autoreconf", "-i"], check=True)
+
+ configure_args = ["./configure"]
+ if static_mode:
+ configure_args.append("CFLAGS=-fPIC")
+ if htslib_configure_options:
+ configure_args.extend(htslib_configure_options.split())
+
+ subprocess.run(configure_args, check=True)
+ subprocess.run(["make"], check=True)
+
+ os.chdir(current_directory)
+
+
+def pre_sdist():
+ current_directory = os.getcwd()
+ os.chdir(os.path.join(current_directory, "htslib"))
+
+ # generate version.h
+ subprocess.run(["make", "htscodecs/htscodecs/version.h"], check=True)
+
+ # remove redundant file
+ redudant_files = ["htscodecs.mk"]
+ for redudant_file in redudant_files:
+ if os.path.exists(redudant_file):
+ os.remove(redudant_file)
+
+ os.chdir(current_directory)
+
+
+class cyvcf2_build_ext(build_ext):
+ def run(self):
+ print("# cyvcf2: htslib mode is {}".format(CYVCF2_HTSLIB_MODE))
+ if CYVCF2_HTSLIB_MODE == "BUILTIN" or not check_libhts():
+ if platform.system() == "Windows":
+ # Windows htslib can't be built internall
+ raise RuntimeError(
+ "Required library 'hts-3.dll' not found. Please install htslib first."
+ )
+
+ print(
+ "# cyvcf2: htslib configure options is {}".format(
+ CYVCF2_HTSLIB_CONFIGURE_OPTIONS
+ )
+ )
+ build_htslib(
+ CYVCF2_HTSLIB_CONFIGURE_OPTIONS, CYVCF2_HTSLIB_MODE == "BUILTIN"
+ )
+
+ if CYVCF2_HTSLIB_MODE == "BUILTIN":
+ # add htslib linked libraries
+ # libcrypto is bundled with libssl, capabale to replace libssl
+ all_dynamic_libs = {
+ "z",
+ "bz2",
+ "lzma",
+ "curl",
+ "deflate",
+ "crypto",
+ }
+
+ extra_libs = []
+ # read the htslib config.status file to get the linked libraries
+ with open(os.path.join("htslib", "config.status"), "r") as f:
+ for line in f:
+ if 'S["static_LIBS"]' in line:
+ linked_libs_str = line.split("=")[1].strip()[1:-1]
+ print("# cyvcf2: htslib librarys is {}".format(linked_libs_str))
+ linked_libs = linked_libs_str.split()
+ for lib in linked_libs:
+ if lib[2:] in all_dynamic_libs: # remove -l prefix
+ extra_libs.append(lib[2:])
+
+ self.extensions[0].libraries = self.extensions[0].libraries + extra_libs
+
+ super().run()
+
+
+class cyvcf2_sdist(sdist):
+ def run(self):
+ if platform.system() == "Windows":
+ raise RuntimeError("cyvcf2 Can't build sdist on Windows")
+
+ pre_sdist()
+
+ super().run()
+
+
+class clean_ext(Command):
+ description = "clean up Cython temporary files and htslib build files"
+ user_options = []
+
+ def initialize_options(self):
+ pass
+
+ def finalize_options(self):
+ pass
+
+ def run(self):
+ print("cleaning build files")
+ if os.path.exists("build"):
+ shutil.rmtree("build")
+
+ if os.path.exists("cyvcf2.egg-info"):
+ shutil.rmtree("cyvcf2.egg-info")
+
+ print("cleaning Cython temporary files")
+ cyvcf2_c_path = os.path.join("cyvcf2", "cyvcf2.c")
+ if os.path.exists(cyvcf2_c_path):
+ os.remove(cyvcf2_c_path)
+
+ lib_files = glob.glob("cyvcf2/cyvcf2.cpython-*")
+ for file in lib_files:
+ os.remove(file)
+
+ if platform.system() != "Windows":
+ print("cleaning htslib build files")
+ current_directory = os.getcwd()
+ os.chdir(os.path.join(current_directory, "htslib"))
+ subprocess.run(["make", "distclean"], check=True)
+ os.chdir(current_directory)
+
+
+# How to link against HTSLIB
+# BUILTIN: build and static link against htslib from
+# builtin htslib code (default)
+# EXTERNAL: use shared libhts.so compiled outside of
+# cyvcf2
+if platform.system() == "Windows":
+ # can't static link to htslib on Windows
+ htslib_mode_default = "EXTERNAL"
+else:
+ htslib_mode_default = "BUILTIN"
+
+CYVCF2_HTSLIB_MODE = os.environ.get("CYVCF2_HTSLIB_MODE", htslib_mode_default)
+
+if platform.system() == "Windows" and CYVCF2_HTSLIB_MODE == "BUILTIN":
+ print(
+ "# cyvcf2 WARNING: The use of cyvcf2 on Windows is experimental. It will not work when statically linked to htslib. Fallback to htslib EXTERNAL mode"
+ )
+ CYVCF2_HTSLIB_MODE = "EXTERNAL"
+
+CYVCF2_HTSLIB_CONFIGURE_OPTIONS = os.environ.get(
+ "CYVCF2_HTSLIB_CONFIGURE_OPTIONS", None
+)
+
+htslib_objects = []
+htslib_librarys = []
+htslib_library_dirs = []
+
+if CYVCF2_HTSLIB_MODE == "BUILTIN":
+ htslib_objects = ["htslib/libhts.a"]
+else:
+ htslib_librarys = ["hts"]
+ if not check_libhts():
+ htslib_library_dirs = ["htslib"]
+
+htslib_include_dirs = ["htslib", "htslib/htslib"]
+
# Build the Cython extension by statically linking to the bundled htslib
-sources = [
- x for x in glob.glob('htslib/*.c')
- if not any(e in x for e in ['irods', 'plugin'])
+sources = ["cyvcf2/cyvcf2.pyx", "cyvcf2/helpers.c"]
+
+extensions = [
+ Extension(
+ "cyvcf2.cyvcf2",
+ sources,
+ extra_objects=htslib_objects,
+ libraries=htslib_librarys,
+ extra_compile_args=[
+ "-Wno-sign-compare",
+ "-Wno-unused-function",
+ "-Wno-strict-prototypes",
+ "-Wno-unused-result",
+ "-Wno-discarded-qualifiers",
+ ],
+ include_dirs=["cyvcf2", np.get_include()] + htslib_include_dirs,
+ library_dirs=htslib_library_dirs,
+ )
]
-sources += glob.glob('htslib/cram/*.c')
-sources += glob.glob('htslib/htscodecs/htscodecs/*.c')
-# Exclude the htslib sources containing main()'s
-sources = [x for x in sources if not x.endswith(('htsfile.c', 'tabix.c', 'bgzip.c'))]
-sources.append('cyvcf2/helpers.c')
-
-extra_libs = []
-if platform.system() != 'Darwin':
- extra_libs.append('crypt')
-if bool(int(os.getenv("LIBDEFLATE", 0))):
- extra_libs.append('deflate')
-
-extensions = [Extension("cyvcf2.cyvcf2",
- ["cyvcf2/cyvcf2.pyx"] + sources,
- libraries=['z', 'bz2', 'lzma', 'curl', 'ssl'] + extra_libs,
- extra_compile_args=["-Wno-sign-compare", "-Wno-unused-function",
- "-Wno-strict-prototypes",
- "-Wno-unused-result", "-Wno-discarded-qualifiers"],
- include_dirs=['htslib', 'cyvcf2', np.get_include()])]
CYTHONIZE = bool(int(os.getenv("CYTHONIZE", 0)))
@@ -94,14 +283,19 @@ setup(
author_email="bpederse at gmail.com",
version=get_version(),
ext_modules=extensions,
- packages=['cyvcf2', 'cyvcf2.tests'],
+ packages=["cyvcf2"],
entry_points=dict(
console_scripts=[
- 'cyvcf2 = cyvcf2.__main__:cli',
+ "cyvcf2 = cyvcf2.__main__:cli",
],
),
python_requires=">=3.7",
- install_requires=['numpy', 'coloredlogs', 'click'],
+ install_requires=["numpy", "coloredlogs", "click"],
include_package_data=True,
zip_safe=False,
+ cmdclass={
+ "clean_ext": clean_ext,
+ "build_ext": cyvcf2_build_ext,
+ "sdist": cyvcf2_sdist,
+ },
)
View it on GitLab: https://salsa.debian.org/med-team/cyvcf2/-/commit/7c97cba877aefc2a8b60f5420cc24718b54eca8e
--
View it on GitLab: https://salsa.debian.org/med-team/cyvcf2/-/commit/7c97cba877aefc2a8b60f5420cc24718b54eca8e
You're receiving this email because of your account on salsa.debian.org.
-------------- next part --------------
An HTML attachment was scrubbed...
URL: <http://alioth-lists.debian.net/pipermail/debian-med-commit/attachments/20240207/e4d79151/attachment-0001.htm>
More information about the debian-med-commit
mailing list