Skip to content

Commit

Permalink
Update to v0.12.8
Browse files Browse the repository at this point in the history
  • Loading branch information
ctsa committed Dec 13, 2024
1 parent 4a790c6 commit 35a11ab
Show file tree
Hide file tree
Showing 9 changed files with 72 additions and 27 deletions.
8 changes: 8 additions & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
@@ -1,5 +1,13 @@
# Change Log

## v0.12.8 - 2024-12-13

### Fixed

- Increase system open file limit (github #9)
- May simplify joint-call for large pedigrees at high thread counts
- Improve error message when split reads map to an unknown chromosome (github #8)

## v0.12.7 - 2024-10-23

### Fixed
Expand Down
16 changes: 13 additions & 3 deletions Cargo.lock

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

3 changes: 2 additions & 1 deletion Cargo.toml
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
[package]
name = "sawfish"
version = "0.12.7"
version = "0.12.8"
authors = ["Chris Saunders <csaunders@pacificbiosciences.com>"]
description = "Structural variant analysis for mapped PacBio HiFi reads"
edition = "2021"
Expand Down Expand Up @@ -32,6 +32,7 @@ num = "0.4"
num_cpus = "1"
rayon = "1"
regex = "1"
rlimit = "0"
rust-htslib = { version = "0.47", default-features = false }
rust-vc-utils = { path="lib/rust-vc-utils" }
rust-wfa2 = { git = "https://github.com/ctsa/rust-wfa2.git" }
Expand Down
11 changes: 10 additions & 1 deletion LICENSE-THIRDPARTY.json
Original file line number Diff line number Diff line change
Expand Up @@ -1448,6 +1448,15 @@
"license_file": null,
"description": "A regular expression parser."
},
{
"name": "rlimit",
"version": "0.10.2",
"authors": "Nugine <nugine@foxmail.com>",
"repository": "https://github.com/Nugine/rlimit/",
"license": "MIT",
"license_file": null,
"description": "Resource limits"
},
{
"name": "rmp",
"version": "0.8.14",
Expand Down Expand Up @@ -1576,7 +1585,7 @@
},
{
"name": "sawfish",
"version": "0.12.7",
"version": "0.12.8",
"authors": "Chris Saunders <csaunders@pacificbiosciences.com>",
"repository": null,
"license": null,
Expand Down
10 changes: 8 additions & 2 deletions src/bam_sa_parser.rs
Original file line number Diff line number Diff line change
Expand Up @@ -144,7 +144,7 @@ pub fn get_seq_order_read_split_segments(
read_size
};

for sa_segment in sa_segments.iter() {
for (sa_segment_index, sa_segment) in sa_segments.iter().enumerate() {
if !has_aligned_segments(&sa_segment.cigar) {
let qname = std::str::from_utf8(record.qname()).unwrap().to_string();
panic!("Bam record split segment id unaligned in read {qname}");
Expand All @@ -153,7 +153,13 @@ pub fn get_seq_order_read_split_segments(
assert_eq!(primary_read_size, read_size);
let (seq_order_read_start, seq_order_read_end) =
get_seq_order_read_pos(read_start, read_end, read_size, sa_segment.is_fwd_strand);
let chrom_index = *chrom_list.label_to_index.get(&sa_segment.rname).unwrap();
let chrom_index = match chrom_list.label_to_index.get(&sa_segment.rname) {
Some(&x) => x,
None => {
let qname = std::str::from_utf8(record.qname()).unwrap().to_string();
panic!("In read '{qname}', the SA aux tag desribes a split read mapped to {}:{} (in segment {}), which is not found in the input reference fasta", sa_segment.rname, sa_segment.pos, sa_segment_index);
}
};
seq_order_read_split_segments.push({
SeqOrderSplitReadSegment {
seq_order_read_start,
Expand Down
8 changes: 8 additions & 0 deletions src/main.rs
Original file line number Diff line number Diff line change
Expand Up @@ -47,6 +47,12 @@ use crate::globals::{PROGRAM_NAME, PROGRAM_VERSION};
use crate::joint_call::run_joint_call;
use crate::logger::setup_output_dir_and_logger;

/// Run system configuration steps prior to starting any other program logic
///
fn system_configuration_prelude() {
utils::attempt_max_open_file_limit();
}

fn run(settings: &cli::Settings) -> Result<(), Box<dyn error::Error>> {
info!("Starting {PROGRAM_NAME} {PROGRAM_VERSION}");
info!(
Expand Down Expand Up @@ -74,6 +80,8 @@ fn run(settings: &cli::Settings) -> Result<(), Box<dyn error::Error>> {
}

fn main() {
system_configuration_prelude();

let settings = cli::validate_and_fix_settings(cli::parse_settings());

// Setup logger, including creation of the output directory for the log file:
Expand Down
2 changes: 1 addition & 1 deletion src/refine_sv/assemble/banded_pairwise_assembler.rs
Original file line number Diff line number Diff line change
Expand Up @@ -53,7 +53,7 @@ struct BackboneAlignmentInfo {
// Align the next read to the backbone. If the read extends the backbone, then redefine the backbone with this extension.
// Repeat for all reads to form a fully extended backbone.
// Rejection scoring follows the same scheme as for POA, so we might be building multiple backbones.
///
//
// 2.Pairwise POA from each backbone
// For each backbone and its associated read set, pairwise align all reads in the set to the backbone, and take a majority vote on each edit to determine the consensus sequence.

Expand Down
20 changes: 3 additions & 17 deletions src/spoa_utils.rs
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,7 @@ use rust_htslib::bam::record::Cigar;
use spoa::{get_alignment_clip_size, get_alignment_overlap_size, AlignmentEngine, Graph};

use crate::simple_alignment::SimpleAlignment;
use crate::utils;

/// Create a new poa graph with only the given sequence
///
Expand Down Expand Up @@ -80,7 +81,7 @@ pub fn print_msa(alignments: &[CString]) {
assert_eq!(seq.len(), len);
}

let rows = (len + WIDTH - 1) / WIDTH;
let rows = len.div_ceil(WIDTH);

let ruler = {
let mut ruler = String::new();
Expand Down Expand Up @@ -129,23 +130,8 @@ pub fn print_msa(alignments: &[CString]) {
pub fn print_fasta(alignments: &[CString]) {
const WIDTH: usize = 100;

if alignments.is_empty() {
return;
}

let bytes = alignments.iter().map(|x| x.as_bytes()).collect::<Vec<_>>();

for (seq_index, seq) in bytes.iter().enumerate() {
let len = seq.len();
let rows = (len + WIDTH - 1) / WIDTH;

eprintln!("> {}", seq_index);
for row_index in 0..rows {
let start = WIDTH * row_index;
let end = std::cmp::min(start + WIDTH, len);
eprintln!("{}", std::str::from_utf8(&seq[start..end]).unwrap());
}
}
utils::print_fasta(WIDTH, &bytes);
}

/// Use spoa to get a consensus of two reads using the given alignment engine
Expand Down
21 changes: 19 additions & 2 deletions src/utils.rs
Original file line number Diff line number Diff line change
Expand Up @@ -190,7 +190,7 @@ pub fn pairwise_alignment_printer(width: usize, lines: &[&[u8]]) {
ruler
};

let rows = (len + width - 1) / width;
let rows = len.div_ceil(width);
for row_index in 0..rows {
let start = width * row_index;
let end = std::cmp::min(start + width, len);
Expand Down Expand Up @@ -219,7 +219,7 @@ pub fn print_fasta(width: usize, lines: &[&[u8]]) {

for (seq_index, seq) in lines.iter().enumerate() {
let len = seq.len();
let rows = (len + width - 1) / width;
let rows = len.div_ceil(width);

eprintln!("> {}", seq_index);
for row_index in 0..rows {
Expand Down Expand Up @@ -249,6 +249,23 @@ pub fn drop_true<T>(vec: &mut Vec<T>, drop_list: &[bool]) {
vec.retain(|_| !*drop.next().unwrap())
}

/// Attempt to increase open file limit to the system's hard limit on *nix-like systems
///
/// This is an optional increase so continue through all failure cases without error.
///
pub fn attempt_max_open_file_limit() {
use rlimit::Resource;

let (soft, hard) = match Resource::NOFILE.get() {
Ok(x) => x,
Err(_) => return,
};

if soft < hard {
rlimit::setrlimit(Resource::NOFILE, hard, hard).unwrap_or_default();
}
}

#[cfg(test)]
mod tests {
use super::*;
Expand Down

0 comments on commit 35a11ab

Please sign in to comment.