$ arrow --numWorkers 32 -r canu_de_novo.fasta -o canu_de_novo_pbalign_arrow.fasta canu_de_novo_pbalign_mapped.bam
'BASECALLERVERSION'
Traceback (most recent call last):
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcommand/cli/core.py", line 137, in _pacbio_main_runner
return_code = exe_main_func(*args, **kwargs)
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/GenomicConsensus/main.py", line 383, in args_runner
return tr.main()
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/GenomicConsensus/main.py", line 297, in main
with AlignmentSet(options.inputFilename) as peekFile:
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/dataset/DataSetIO.py", line 2723, in __init__
super(AlignmentSet, self).__init__(*files, **kwargs)
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/dataset/DataSetIO.py", line 1987, in __init__
super(ReadSet, self).__init__(*files, **kwargs)
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/dataset/DataSetIO.py", line 477, in __init__
self.updateCounts()
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/dataset/DataSetIO.py", line 2541, in updateCounts
self.assertIndexed()
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/dataset/DataSetIO.py", line 2371, in assertIndexed
self._assertIndexed((IndexedBamReader, CmpH5Reader))
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/dataset/DataSetIO.py", line 1944, in _assertIndexed
self._openFiles()
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/dataset/DataSetIO.py", line 2068, in _openFiles
resource = IndexedBamReader(location)
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/align/BamIO.py", line 388, in __init__
super(IndexedBamReader, self).__init__(fname, referenceFastaFname)
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/align/BamIO.py", line 202, in __init__
self._loadReadGroupInfo()
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/align/BamIO.py", line 115, in _loadReadGroupInfo
basecallerVersion = ".".join(ds["BASECALLERVERSION"].split(".")[0:2])
KeyError: 'BASECALLERVERSION'
[ERROR] 'BASECALLERVERSION'
Traceback (most recent call last):
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcommand/cli/core.py", line 137, in _pacbio_main_runner
return_code = exe_main_func(*args, **kwargs)
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/GenomicConsensus/main.py", line 383, in args_runner
return tr.main()
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/GenomicConsensus/main.py", line 297, in main
with AlignmentSet(options.inputFilename) as peekFile:
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/dataset/DataSetIO.py", line 2723, in __init__
super(AlignmentSet, self).__init__(*files, **kwargs)
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/dataset/DataSetIO.py", line 1987, in __init__
super(ReadSet, self).__init__(*files, **kwargs)
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/dataset/DataSetIO.py", line 477, in __init__
self.updateCounts()
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/dataset/DataSetIO.py", line 2541, in updateCounts
self.assertIndexed()
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/dataset/DataSetIO.py", line 2371, in assertIndexed
self._assertIndexed((IndexedBamReader, CmpH5Reader))
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/dataset/DataSetIO.py", line 1944, in _assertIndexed
self._openFiles()
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/dataset/DataSetIO.py", line 2068, in _openFiles
resource = IndexedBamReader(location)
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/align/BamIO.py", line 388, in __init__
super(IndexedBamReader, self).__init__(fname, referenceFastaFname)
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/align/BamIO.py", line 202, in __init__
self._loadReadGroupInfo()
File "/opt/pacbio/smrtlink/install/smrtlink-release_5.1.0.26412/bundles/smrttools/install/smrttools-release_5.1.0.26366/private/thirdparty/
python/python_2.7.9/site-packages/pbcore/io/align/BamIO.py", line 115, in _loadReadGroupInfo
basecallerVersion = ".".join(ds["BASECALLERVERSION"].split(".")[0:2])
KeyError: 'BASECALLERVERSION'
Polished assembly, or at least a user friendly error message explaining what BAM metadata is missing and ideally how to deal with it.
$ samtools view -h m12345_123456_123456.subreads.bam | head -n 100 | grep "^@"
@HD VN:1.5 SO:unknown pb:3.0.5
@RG ID: f5b4ffb6 PL:PACBIO DS:READTYPE=SUBREAD;Ipd:CodecV1=ip;PulseWidth:CodecV1=pw;BINDINGKIT=101-365-900;SEQUENCINGKIT=101-309-500;BASECALLERVERSION=5.0.0;FRAMERATEHZ=80.000000 PU:m12345_123456_123456 PM:SEQUEL
@PG ID:baz2bam PN:baz2bam VN:5.1.0.26367 CL:/opt/pacbio/ppa-5.1.0/bin/baz2bam /data/pa/m12345_123456_123456.baz -o /data/pa/m12345_123456_123456 --metadata /data/pa/.m12345_123456_123456.metadata.xml -j 12 -b 12 --progress --silent --minSubLength 50 --minSnr 3.750000 --adapters /data/pa/m12345_123456_123456.adapters.fasta --controlAdapters /data/pa/m12345_123456_123456.controls.adapters.fasta --controls /data/pa/m54047_180428_220428.controls.fasta
@PG ID:bazFormat PN:bazformat VN:1.3.0
@PG ID:bazwriter PN:bazwriter VN:5.1.0.26367
$ samtools view -h canu_de_novo_pbalign_mapped.bam | head -n 100 | grep "^@"
I might be able to combine the header-less mapped BAM files with header information from the unmapped BAM to restore the metadata...?
Frustratingly blastr v5.3 says it takes FASTA or bax.h5 files, recommends not using FASTA as no quality, yet says bax.h5 support is deprecated.
Do I may need to go back to our sequencing provider to get the bax.h5 files as well as the BAM files?