pub struct LazyCsvReader { /* private fields */ }
Available on crate features `lazy` and `csv` only.
Implementations§
Source§impl LazyCsvReader
impl LazyCsvReader
pub fn new_paths(paths: Arc<[PathBuf]>) -> LazyCsvReader
pub fn new_with_sources(sources: ScanSources) -> LazyCsvReader
pub fn new(path: impl AsRef<Path>) -> LazyCsvReader
Sourcepub fn with_skip_rows_after_header(self, offset: usize) -> LazyCsvReader
pub fn with_skip_rows_after_header(self, offset: usize) -> LazyCsvReader
Skip this number of rows after the header location.
Sourcepub fn with_row_index(self, row_index: Option<RowIndex>) -> LazyCsvReader
pub fn with_row_index(self, row_index: Option<RowIndex>) -> LazyCsvReader
Add a row index column.
Sourcepub fn with_n_rows(self, num_rows: Option<usize>) -> LazyCsvReader
pub fn with_n_rows(self, num_rows: Option<usize>) -> LazyCsvReader
Try to stop parsing when `n` rows are parsed. During multithreaded parsing the upper bound `n` cannot be guaranteed.
Sourcepub fn with_infer_schema_length(self, num_rows: Option<usize>) -> LazyCsvReader
pub fn with_infer_schema_length(self, num_rows: Option<usize>) -> LazyCsvReader
Set the number of rows to use when inferring the CSV schema.
The default is 100 rows.
Setting it to `None` will do a full table scan, which is very slow.
Sourcepub fn with_ignore_errors(self, ignore: bool) -> LazyCsvReader
pub fn with_ignore_errors(self, ignore: bool) -> LazyCsvReader
Continue with next batch when a ParserError is encountered.
Sourcepub fn with_schema(self, schema: Option<Arc<Schema<DataType>>>) -> LazyCsvReader
pub fn with_schema(self, schema: Option<Arc<Schema<DataType>>>) -> LazyCsvReader
Set the CSV file’s schema
Sourcepub fn with_skip_rows(self, skip_rows: usize) -> LazyCsvReader
pub fn with_skip_rows(self, skip_rows: usize) -> LazyCsvReader
Skip the first `n` rows during parsing. The header will be parsed at row `n`.
Note that by "row" we mean a valid CSV row: encoding and comments are respected.
Sourcepub fn with_skip_lines(self, skip_lines: usize) -> LazyCsvReader
pub fn with_skip_lines(self, skip_lines: usize) -> LazyCsvReader
Skip the first `n` lines during parsing. The header will be parsed at line `n`.
We don’t respect CSV escaping when skipping lines.
Sourcepub fn with_dtype_overwrite(
self,
schema: Option<Arc<Schema<DataType>>>,
) -> LazyCsvReader
pub fn with_dtype_overwrite( self, schema: Option<Arc<Schema<DataType>>>, ) -> LazyCsvReader
Overwrite the schema with the dtypes in this given Schema. The given schema may be a subset of the total schema.
Sourcepub fn with_has_header(self, has_header: bool) -> LazyCsvReader
pub fn with_has_header(self, has_header: bool) -> LazyCsvReader
Set whether the CSV file has headers
Sourcepub fn with_chunk_size(self, chunk_size: usize) -> LazyCsvReader
pub fn with_chunk_size(self, chunk_size: usize) -> LazyCsvReader
Sets the chunk size used by the parser. This influences performance. This can be used as a way to reduce memory usage during the parsing at the cost of performance.
Sourcepub fn with_separator(self, separator: u8) -> LazyCsvReader
pub fn with_separator(self, separator: u8) -> LazyCsvReader
Set the CSV file’s column separator as a byte character
Sourcepub fn with_comment_prefix(
self,
comment_prefix: Option<PlSmallStr>,
) -> LazyCsvReader
pub fn with_comment_prefix( self, comment_prefix: Option<PlSmallStr>, ) -> LazyCsvReader
Set the comment prefix for this instance. Lines starting with this prefix will be ignored.
Sourcepub fn with_quote_char(self, quote_char: Option<u8>) -> LazyCsvReader
pub fn with_quote_char(self, quote_char: Option<u8>) -> LazyCsvReader
Set the `char` used as quote char. The default is `b'"'`. If set to `None`, quoting is disabled.
Sourcepub fn with_eol_char(self, eol_char: u8) -> LazyCsvReader
pub fn with_eol_char(self, eol_char: u8) -> LazyCsvReader
Set the `char` used as end of line. The default is `b'\n'`.
Sourcepub fn with_null_values(self, null_values: Option<NullValues>) -> LazyCsvReader
pub fn with_null_values(self, null_values: Option<NullValues>) -> LazyCsvReader
Set values that will be interpreted as missing/null.
Sourcepub fn with_missing_is_null(self, missing_is_null: bool) -> LazyCsvReader
pub fn with_missing_is_null(self, missing_is_null: bool) -> LazyCsvReader
Treat missing fields as null.
Sourcepub fn with_cache(self, cache: bool) -> LazyCsvReader
pub fn with_cache(self, cache: bool) -> LazyCsvReader
Cache the DataFrame after reading.
Sourcepub fn with_low_memory(self, low_memory: bool) -> LazyCsvReader
pub fn with_low_memory(self, low_memory: bool) -> LazyCsvReader
Reduce memory usage at the expense of performance
Sourcepub fn with_encoding(self, encoding: CsvEncoding) -> LazyCsvReader
pub fn with_encoding(self, encoding: CsvEncoding) -> LazyCsvReader
Set CsvEncoding
Sourcepub fn with_try_parse_dates(self, try_parse_dates: bool) -> LazyCsvReader
Available on crate feature `temporal` only.
pub fn with_try_parse_dates(self, try_parse_dates: bool) -> LazyCsvReader
Available on crate feature `temporal` only.
Automatically try to parse dates/datetimes and time.
If parsing fails, columns remain of dtype `DataType::String`.
Sourcepub fn with_raise_if_empty(self, raise_if_empty: bool) -> LazyCsvReader
pub fn with_raise_if_empty(self, raise_if_empty: bool) -> LazyCsvReader
Raise an error if CSV is empty (otherwise return an empty frame)
Sourcepub fn with_truncate_ragged_lines(
self,
truncate_ragged_lines: bool,
) -> LazyCsvReader
pub fn with_truncate_ragged_lines( self, truncate_ragged_lines: bool, ) -> LazyCsvReader
Truncate lines that are longer than the schema.
pub fn with_decimal_comma(self, decimal_comma: bool) -> LazyCsvReader
Sourcepub fn with_glob(self, toggle: bool) -> LazyCsvReader
pub fn with_glob(self, toggle: bool) -> LazyCsvReader
Expand path given via globbing rules.
pub fn with_cloud_options( self, cloud_options: Option<CloudOptions>, ) -> LazyCsvReader
Sourcepub fn with_schema_modify<F>(self, f: F) -> Result<LazyCsvReader, PolarsError>
pub fn with_schema_modify<F>(self, f: F) -> Result<LazyCsvReader, PolarsError>
Modify a schema before we run the lazy scanning.
Important! Run this function last in the builder!
pub fn with_include_file_paths( self, include_file_paths: Option<PlSmallStr>, ) -> LazyCsvReader
Trait Implementations§
Source§impl Clone for LazyCsvReader
impl Clone for LazyCsvReader
Source§fn clone(&self) -> LazyCsvReader
fn clone(&self) -> LazyCsvReader
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from `source`. Read more
Source§impl LazyFileListReader for LazyCsvReader
impl LazyFileListReader for LazyCsvReader
Source§fn with_rechunk(self, rechunk: bool) -> LazyCsvReader
fn with_rechunk(self, rechunk: bool) -> LazyCsvReader
Rechunk the memory to contiguous chunks when parsing is done.
Source§fn n_rows(&self) -> Option<usize>
fn n_rows(&self) -> Option<usize>
Try to stop parsing when `n` rows are parsed. During multithreaded parsing the upper bound `n` cannot be guaranteed.
Source§fn cloud_options(&self) -> Option<&CloudOptions>
fn cloud_options(&self) -> Option<&CloudOptions>
CloudOptions used to list files.
Source§fn finish_no_glob(self) -> Result<LazyFrame, PolarsError>
fn finish_no_glob(self) -> Result<LazyFrame, PolarsError>
fn glob(&self) -> bool
Source§fn with_sources(self, sources: ScanSources) -> LazyCsvReader
fn with_sources(self, sources: ScanSources) -> LazyCsvReader
Source§fn with_n_rows(self, n_rows: impl Into<Option<usize>>) -> LazyCsvReader
fn with_n_rows(self, n_rows: impl Into<Option<usize>>) -> LazyCsvReader
Source§fn with_row_index(self, row_index: impl Into<Option<RowIndex>>) -> LazyCsvReader
fn with_row_index(self, row_index: impl Into<Option<RowIndex>>) -> LazyCsvReader
Source§fn concat_impl(&self, lfs: Vec<LazyFrame>) -> Result<LazyFrame, PolarsError>
fn concat_impl(&self, lfs: Vec<LazyFrame>) -> Result<LazyFrame, PolarsError>
Source§fn with_paths(self, paths: Arc<[PathBuf]>) -> Self
fn with_paths(self, paths: Arc<[PathBuf]>) -> Self
Auto Trait Implementations§
impl Freeze for LazyCsvReader
impl !RefUnwindSafe for LazyCsvReader
impl Send for LazyCsvReader
impl Sync for LazyCsvReader
impl Unpin for LazyCsvReader
impl !UnwindSafe for LazyCsvReader
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T
where
T: ?Sized,
impl<T> BorrowMut<T> for T
where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Source§impl<T> CloneToUninit for T
where
T: Clone,
impl<T> CloneToUninit for T
where
T: Clone,
§impl<T> Instrument for T
impl<T> Instrument for T
§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self> ⓘ
fn into_either(self, into_left: bool) -> Either<Self, Self> ⓘ
Converts `self` into a `Left` variant of `Either<Self, Self>` if `into_left` is `true`.
Converts `self` into a `Right` variant of `Either<Self, Self>` otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> ⓘ
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> ⓘ
Converts `self` into a `Left` variant of `Either<Self, Self>` if `into_left(&self)` returns `true`.
Converts `self` into a `Right` variant of `Either<Self, Self>` otherwise. Read more