[med-svn] [Git][med-team/bcalm][master] Add some missing sources for tests

Shayan Doust gitlab at salsa.debian.org
Mon Sep 23 23:04:14 BST 2019



Shayan Doust pushed to branch master at Debian Med / bcalm


Commits:
f299ab0a by Shayan Doust at 2019-09-23T07:14:15Z
Add some missing sources for tests

- - - - -


4 changed files:

- + debian/missing-sources/compare_fasta.py
- + debian/missing-sources/reference.fasta
- + debian/missing-sources/simple_test.sh
- + debian/source/include-binaries


Changes:

=====================================
debian/missing-sources/compare_fasta.py
=====================================
@@ -0,0 +1,36 @@
+#very basic, one seq per line only, no pysam for max portability
+#doesn't care if sequences are in revcomp or forward order
+import sys
+
+fasta1 = sys.argv[1]
+fasta2 = sys.argv[2]
+
+revcomp = lambda x: ''.join([{'A':'T','C':'G','G':'C','T':'A'}[B] for B in x][::-1])
+def normalize(seq):
+    rev = revcomp(seq)
+    return min(rev,seq)
+
+def read_seqs(fasta):
+    seqs = set()
+    for  line in open(fasta):
+        if line[0] == '>': continue
+        seqs.add(normalize(line.strip()))
+    return seqs
+
+s1 = read_seqs(fasta1)
+s2 = read_seqs(fasta2)
+
+if s1 == s2:
+    sys.exit(0)
+
+if len(s1) == len(s2) and len(s1) == 1:
+    # special case, e.g. for read50 and genome10k, let's see if one is included in the other
+    seq1= s1.copy().pop()
+    seq2= s2.copy().pop()
+    if seq1 in seq2 or seq2 in seq1:
+        print("one seq is perfectly included in the other")
+    else:
+        print("BAD: one sequence doesn't exactly match the other")
+
+print("NOT EQUAL: %d sequence(s) in %s not in %s" % (len(s1.difference(s2)), fasta1, fasta2))
+sys.exit(1)


=====================================
debian/missing-sources/reference.fasta
=====================================
@@ -0,0 +1,10 @@
+>Seq0
+ACCTATAAGGATCCACGTCTTGATGTGACCGACGATGTTATCTGCCTATAGCGAACATTTCCTGGTAGGAATACTATTATATTACCTAAATTCTCCGGATTTCCGTGTTCTTCGGAAGCTTAGGTCACGCGCGTCATACTACAGTAAGTTACTGAATTTTGGAGTAATGCATATCGACCGAGTCCGGGGAATCGTCCGTATCCCCGCCAGGCGTATCCAATAATTAGGTCGGACCCCTAGCGCGTACGAGTCCTATAGCTGACATGCGAATTGGCCGTGCATCGAGCTCAAATGTCCTAGCTTGAGAGTGCGTATCTCACCGATCCCCTGGCTATGCTCCGCGATTCACTAGTAGTTTCACGCCGACAGAGCGAAACCGTGATAGGTCATCATGCCGGTCTGCAGTCACGTGCCCAGCAGTCTCCAATATAGCCACTTATGTCGGAATGTAATCGGCTCCAAATTACTGTGAACCTGATGATCGACGACGCGCTGGGTGCGGGATAGTGTAACTGTCCCGTATAAGGCTTAAATTGAGTATGCAGGATACACTTTTAGTATGACTCGGAAAATCCCACTACAGTATGAACCGTGACTGTCGTTGGGCGGTGCTTGTTGCTATTAACTGGATGGTAAGTCAATTTTAAGTGGAGCCCCCTGCAAGATGGAAGAGAACTATATGTGGAACCGGATGTCACGTCAAGACCACCGCGCACGCTTAACACAACGCATGGTTCGGCGACTGCTCCGGTTCTGGAATTCCTCTTTTTTATCGAGATTAGCATCTCATTAGCGCGCAGTGTGTCCTAGTGTCCCAGAACGTAAAGACCAGATTTGACATTAGTAAGTTGCATTCGCGGGTCTTTAGAGCTCCTACTAAGCCCATTCAGATTGAAAAAGGCGCGCCTGCGGTTCCATGTCATAGTTTAACTTGGTTGAGACGGCGCACGAAAGCATACTACCACCATCCATGTCAAAACTGGCGACGATCTTGCTGGGT
+>Seq1
+GTTTTATAACAAGTGAAGAAAGAACAGTCATTAGGCCCGAAGGCGTACACGGAATCCGCCTAAACTAATGCTTATGGTCCCTCGTAGGCCCCGACGGCATAGGGTGCCCCGTAATTGCGTAGACAGCGAAAGGAAAGTGTACCGACGACGAGATCAAGTGGCAGTGAACCCCTTGGAAAACTTCATATCGACAGACACTGTCCGAGTGATAAATCTACTATTCGCGGAACGGCTCCATAAACGGTGACTATGACCTCATCAGTTAAATTCATTAACCTATAGATGTTGAGAATCCGCCTAAATTGGAGGACGCCGCGCAAAGCCGGTCAACAGCGTTAGTATGTTGAAAGTTTACTCAGATCGCTTCTGTCGGCCTAAGTTATGAATACAGTCAGGGGTTTTCCTGGATACAGATCTTCGGAAGTCTGCTAGTGCCGGTCACGCCACGTATAAGACTAGAGACCTGACACTCATCTCGGACTGTAATTATTTTCTAAGCTAGCTGTCCTATTGTAAGGTAAGTCGGGGTGCCGGACCTTGGCAGCCGTCCGTACGTACATTAATGCATCAGACCAGTAATCTTGCTCGCTAGAGTCGGATCGGCGAGGTCCTCTCAGCTATGAAAAGTAGAATTCAGTCTTGCCCGGGGTAGGGCTAGAGACAAGGGTTGATATTGTCTGAAATGGCGCTCCCATCCGATAACTAAACTACCGTACGGGTGCACGCGAGTAGCCTTAATCCTGTTGGGAAGGAATTGCAATACTCTCCGAACCAGCTTAGGGCCCCCCGCCGCCGCAATTCGAGCGTTATGCCCGGAGCATTTGCACGATGCCATTAAACTATATCAACTACATATACTAGACTATCATCCTAGGGCGTAGAACTCCCTTTGCGTTACCACTCACAACGCGTGTGTTTCTCGTGCGGTGATCCCGGGAGTATTTTATCGGCGCCCCAACTGCCGGCAACTCGAGTGCACCGGAGCTGAGGAACGCTTCAC
+>Seq2
+TGCTGCCGATCGCTACGACGTCCTACCTTACACACAACGGGCCGCGTTCATACCCACGTATGAAGACATGCGGTTATCCGTTAGTTGGGGCCCGCGATGGCTGTTGTATGTAATGAGTGGAGTAAAAGAACACGGGAGATGTTCAATTAGGCTCAACCATTTGTATTGAAGGGGTCAAAACCCACCTGTGTAAGTAGCATTGAGTGCTGCTCATGGCCGATTCTCTTACTTTATTTAAGCCCATACCACTGATGGAGGAGACTCCAAGGAATAGTCCAACCGTTGTTCCGGGAAAAACGAACTCGGTCCGCTAGCGTGCTTGTCGTCGCAGCGCAGATTCCCTCCTAAGTTATTTTACCGGTTGACTCAGTCGCAGGGGTGCTGAACGCCATGGGGCGGACCGAGCGGAGATCTTTCAGGTGTAATTGGATGATCTTCACCCTAAGGAGGGAGCGGGTTATTGGGCAGGCCCGACCGCCGCTGGAAAGATGCAAGTATGAACAAGGCATGCGTAAGTTATCGTGAAACCATGATGGCCCCTTACTAGACCAAATGTACTGAATGCGTCTTGATTAGACCCCGAAAAGGCATATCACATCAACTTGTCGTGTTAGAGATGTCGCGAGAACCCTCGCCTATTCACGAAGTGCCCATGAGCCTTTGGGCCTGGTTGACAATATGCGCACCCTGTAGCCTACCAACCCTTCATAATCTATCTTCAATTTAGCCTGTCGAGAACGTCCTAACAAGGCTTTTGGCGCTCCAGATGGGACAGTCACTCTCTAGCATCAACCCATAGTTTTTGAGCTACCCGCCCTCGGTGAGAAGGTAGTATACCCAAACGCGTCCTATGCAGTTTTGGGCTTGAGGAACTAAAATCAATTCGTTAAGTCCAGTAGTCCTTATGTGTGGCCGTTCCAAGAATTAATCATATCGCGGAATCACCGGCGATTCATTTTCCGCACCAGAGCTTTCAGGTGCGGCGCGGCCCTAAAAGGTC
+>Seq3
+TATTGCGCCCTTCAAGAAGCTTCTGCTGACCGTAGGCGTCTCGGCGGTTTGTACTTTGAAAAATTAGCTGCACTACATCCGATGGGTATCCCTCCTCAATCTCAGCAGACCCGGAAAGCGATAGAATCAGCCACGCGGTCGTCCGGGCTAGGGGCCCTGCGCAAGGAAGGTTGGACAGGGCTAGACCCGGAAGCATCGGCTTTTCCTAAATGGTGACGGAGTTATATAGGGTAAGCCTGATAGCGCGGTAGGTGTAATGGCCATCCCCTCGCCTAGCGTGCGCGCAGACAAGTCCAGTCCCGGAGGAGGCATAGGCCTCATTATCATTTCCCTAGAATCGCTCTTGACATCTAGGTTGTACTAGGGACCAGGCGCCCAAAGCGGACGGTTCTCCGTGCTTTCGTGCCGTTTCAGCGTAAGATGCTATTTTTTGGGGAAATGGTCGGCGTGTGCGGGGGAGAACCACGGTACCAACTACGATAAGTCCGTCGTGTAACTTACGTGAAGGTGCTGTGAAGCAGGAATCCGTGCCAAAATGTCCGTGCGATATCCAACTTTCATAGTATTACACGAGAGCCTATGATTTGCCCAGGCGCGACCCGTGAATCGAGGTAATCGCCGACCAGATATTGCGAAACACCACATTACATGACTACTGTCCGCTTGAAGAGTTATATACTTGACAGTCCTGGTTGACGGCACAGCATATCTCCAATGTGTGGTTTAAAGTCTCACGTTCTTCATGCGCGCCGGCCCATGGGAACAGGTATCCTTACTTTCGGTACAAATGAGGCTCCAAAATAGCACGCTTGCAGCAGTCAAGTTGAACGCCTTAAAAGGCACCGCCGCTCGTTCATTGGGATTCCTTGAGAATCGTGACTTGTTACACTATAAGATCATGGATTGGACAAAATAGGCCAACTCCCGCACGCTGTGGCTATTCTTAAGTTGCATAGGTGGGAGTAGCCTTATACTCGATTTCTAAAAAGAGTAGGTGAGC
+>Seq4
+TTCCGGCGCCGCACTAATTGAAGTGGTGAGCTGACCAGTCGTTCAGGATCCGAAGGCGGGGATGGCGCTATAGGAGCCGGCAGGTATGCTTTGCCGCAAAATTTCGGGGTGGTGGAACCGTCTTACCGAAAGTTAGCTACAGCCTGGAATGTGAAATTCCATGACCTGCCCGTCCTGTGTCCACAGGGCGACATTTGCCACGTAGGTAGGGCGACCATTAGAATGCTGCATTATCGGGCGATAAAAAGTTTTATACCCAAGAATCCTACAAAGATGAAAATTTCGAAGAGCTGCACGCAGTTGTAAGTTGCTTTTCTGGGGTAATCGAGATTCTCCACCATAACCTGCGCAATGCATCGTGAAGCTTTACCGCGCCCAAGGGGAGCGTCTCAGTGGGGTTGCCTCCAGGGATATATTGAAAGTTGAAGAAGAAGATCACAGGTTAAGCGGTATGTTAAGTTAGAACTCACGGGGAGCCGCCTTGATTTTGTTCGACATGAACCAGAGACCAAGTGTGTTATGTTCTGGAACCTTAATACGTACGTCGCCAGCACCGAGCCGGCACTCCATCTCTTTTGGGTGCGCAACATTGCTATACTTAGGATCCATTGACATCTGTCAGCCGTCTTTCCAGAACGTTATAAGACTCGTGAGGAAATTATACAAATCGTTGCCATCATCCAAAGCAAAGTACTTCCGCTTAGGAGTGCCTTGAAGAACCGATTATCTCTGACAATGTAATGCCACAGCACCCTCGACAAAGTTCTACATTCGTTCCAGGTCATGATACAGCGCGCTAAATTACCGCTACGAGCCATACCCCGAACATTGAGACCTGGCCAGTAGGTAGGTGTCAAATCGATATCCACACCTGTCGAAGCAGCTAGGGACCTAGACGCAACAGTAACCGCCTCGGAGTAAGCCCTGGTAAAGATCGGTTGCGGCGGGAGTCCTCCATTCAGGCCAAACGTGCAGTGCTCGATGTGCTTCCTATCGCTCT


=====================================
debian/missing-sources/simple_test.sh
=====================================
@@ -0,0 +1,19 @@
+#!/bin/bash
+    
+rm -f reference.fasta
+#wget https://raw.githubusercontent.com/GATB/MindTheGap/f5cb0fec816686c7393772787d736565c4f056a4/test/full_test/reference.fasta >& /dev/null
+../build/bcalm -in reference.fasta -abundance-min 1 > /dev/null >& /dev/null
+rm -rf reference.unitigs.fa.glue*
+rm -f compare_fasta.py
+#wget https://raw.githubusercontent.com/GATB/minia/master/test/compare_fasta.py >& /dev/null
+python3 compare_fasta.py reference.fasta reference.unitigs.fa
+res=$?
+rm -f reference.fasta reference.h5 reference.unitigs.fa compare_fasta.py 
+if [ "$res" = "0" ]
+then
+    echo "test OK"
+    exit 0
+else
+    echo "test KO"
+    exit 1
+fi


=====================================
debian/source/include-binaries
=====================================
@@ -0,0 +1,3 @@
+debian/missing-sources/compare_fasta.py
+debian/missing-sources/reference.fasta
+debian/missing-sources/simple_test.sh



View it on GitLab: https://salsa.debian.org/med-team/bcalm/commit/f299ab0a3e8cb8aee0c733992af698ed94abbff1

-- 
View it on GitLab: https://salsa.debian.org/med-team/bcalm/commit/f299ab0a3e8cb8aee0c733992af698ed94abbff1
You're receiving this email because of your account on salsa.debian.org.


-------------- next part --------------
An HTML attachment was scrubbed...
URL: <http://alioth-lists.debian.net/pipermail/debian-med-commit/attachments/20190923/27c093f3/attachment-0001.html>


More information about the debian-med-commit mailing list