Struct ReadStatData

Source

pub struct ReadStatData {
    pub var_count: i32,
    pub vars: Arc<BTreeMap<i32, ReadStatVarMetadata>>,
    pub(crate) builders: Vec<ColumnBuilder>,
    pub schema: Arc<Schema>,
    pub batch: Option<RecordBatch>,
    pub chunk_rows_to_process: usize,
    pub(crate) chunk_row_start: usize,
    pub(crate) chunk_row_end: usize,
    pub(crate) chunk_rows_processed: usize,
    pub(crate) total_rows_processed: Option<Arc<AtomicUsize>>,
    pub(crate) progress: Option<Arc<dyn ProgressCallback>>,
    pub(crate) abort_error: Option<ReadStatError>,
    pub(crate) column_filter: Option<Arc<BTreeMap<i32, i32>>>,
    pub(crate) total_var_count: i32,
}

Expand description

Holds parsed row data from a .sas7bdat file and converts it to Arrow format.

Each instance processes one streaming chunk of rows. Values are appended directly into typed Arrow `ColumnBuilder`s during the `handle_value` callback, then finished into an Arrow `RecordBatch` via `cols_to_batch`.

Fields§

§var_count: i32

Number of variables (columns) in the dataset.

§vars: Arc<BTreeMap<i32, ReadStatVarMetadata>>

Per-variable metadata, keyed by variable index. Wrapped in Arc so parallel chunks share the same metadata without deep cloning.

§builders: Vec<ColumnBuilder>

Typed Arrow builders — one per variable, pre-sized with capacity hints.

§schema: Arc<Schema>

Arrow schema for the dataset. Wrapped in Arc for cheap sharing across parallel chunks.

§batch: Option<RecordBatch>

The Arrow RecordBatch produced after parsing, if available.

§chunk_rows_to_process: usize

Number of rows to process in this chunk.

§chunk_row_start: usize

Starting row offset for this chunk.

§chunk_row_end: usize

Ending row offset (exclusive) for this chunk.

§chunk_rows_processed: usize

Number of rows actually processed so far in this chunk.

§total_rows_processed: Option<Arc<AtomicUsize>>

Shared atomic counter of total rows processed across all chunks.

§progress: Option<Arc<dyn ProgressCallback>>

Optional progress callback for visual feedback during parsing.

§abort_error: Option<ReadStatError>

A typed error raised by a value callback that aborted parsing.

Set by handle_value (e.g. on date/time overflow or a builder/value type mismatch) and surfaced by the parse routines in preference to the generic USER_ABORT the C library reports for any callback abort.

§column_filter: Option<Arc<BTreeMap<i32, i32>>>

Optional mapping: original var index -> filtered column index. Wrapped in Arc so parallel chunks share the same filter without deep cloning.

§total_var_count: i32

Total variable count in the unfiltered dataset. Used for row-boundary detection in handle_value when filtering is active. Defaults to var_count when no filter is set.

Struct ReadStatData

Fields§

Implementations§

impl ReadStatData

pub fn new() -> Self

pub fn allocate_builders(self) -> Self

pub(crate) fn cols_to_batch(&mut self) -> Result<(), ReadStatError>

pub(crate) fn note_value(&mut self, var_index: i32)

pub fn read_data(&mut self, rsp: &ReadStatPath) -> Result<(), ReadStatError>

§Errors

pub fn read_data_from_bytes( &mut self, bytes: &[u8], ) -> Result<(), ReadStatError>

§Errors

pub fn read_data_from_mmap(&mut self, path: &Path) -> Result<(), ReadStatError>

§Safety

§Errors

pub(crate) fn parse_data( &mut self, rsp: &ReadStatPath, ) -> Result<(), ReadStatError>

fn parse_data_from_bytes(&mut self, bytes: &[u8]) -> Result<(), ReadStatError>

pub fn init(self, md: ReadStatMetadata, row_start: u32, row_end: u32) -> Self

pub fn init_filtered( self, md: ReadStatMetadata, mapping: &BTreeMap<i32, i32>, row_start: u32, row_end: u32, ) -> Self

pub fn init_shared( self, var_count: i32, vars: Arc<BTreeMap<i32, ReadStatVarMetadata>>, schema: Arc<Schema>, row_start: u32, row_end: u32, ) -> Self

fn set_chunk_counts(self, row_start: u32, row_end: u32) -> Self

fn set_metadata(self, md: ReadStatMetadata) -> Self

pub fn set_total_rows_processed( self, total_rows_processed: Arc<AtomicUsize>, ) -> Self

pub fn set_column_filter( self, filter: Option<Arc<BTreeMap<i32, i32>>>, total_var_count: i32, ) -> Self

pub fn set_progress(self, progress: Arc<dyn ProgressCallback>) -> Self

Trait Implementations§

impl Default for ReadStatData

fn default() -> Self

Auto Trait Implementations§

impl Freeze for ReadStatData

impl !RefUnwindSafe for ReadStatData

impl Send for ReadStatData

impl Sync for ReadStatData

impl Unpin for ReadStatData

impl UnsafeUnpin for ReadStatData

impl !UnwindSafe for ReadStatData

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<ST, DT> CastableFrom<ST, Initialized, Initialized> for DT where ST: ?Sized, DT: ?Sized,

impl<ST, DT> CastableFrom<ST, Uninit, Uninit> for DT where ST: ?Sized, DT: ?Sized,

impl<T> Read<Exclusive, BecauseExclusive> for T where T: ?Sized,

Struct ReadStatData

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<ST, DT> CastableFrom<ST, Initialized, Initialized> for DT
where ST: ?Sized, DT: ?Sized,

impl<ST, DT> CastableFrom<ST, Uninit, Uninit> for DT
where ST: ?Sized, DT: ?Sized,

impl<T> Read<Exclusive, BecauseExclusive> for T
where T: ?Sized,