a port for the GenePred format in Rust
docs .
usage .
features .
examples
This library provides a port to read genomic interval data in BED, GTF, and GFF (+ gz/zst/bz2) formats, representing them all as GenePred records.
Add this to your Cargo.toml:
[dependencies]
genepred = "0.0.11"
# Optional features
genepred = { version = "0.0.11", features = ["gzip", "zstd", "bz2", "mmap", "rayon"] }// Enable both "rayon" and "mmap" features in Cargo.toml
use genepred::{Reader, Bed12, Gtf};
use rayon::prelude::*;
fn main() -> Result<(), Box<dyn std::error::Error>> {
// Parallel processing of BED files, includes .gz/.zst/.bz2 files
let bed_reader = Reader::<Bed12>::from_mmap("data/large.bed")?;
if let Ok(records) = bed_reader.par_records() {
let count = records
.filter_map(Result::ok)
.filter(|r| r.strand.map(|s| s.is_plus()).unwrap_or(false))
.count();
println!("Found {} records on plus strand", count);
}
// Parallel processing of GTF files, includes .gz/.zst/.bz2 files
let gtf_reader = Reader::<Gtf>::from_mmap("data/annotations.gtf")?;
if let Ok(records) = gtf_reader.par_records() {
let total_exons: usize = records
.filter_map(Result::ok)
.map(|r| r.exon_count())
.sum();
println!("Total exons: {}", total_exons);
}
Ok(())
}mmap: Enable memory-mapped file support (addsmemmap2dependency)rayon: Enable parallel processing (addsrayondependency)gzip: Enable gzip support (addsflate2dependency)zstd: Enable zstd support (addszstddependency)bz2: Enable bzip2 support (addsbzip2dependency)
