Struct polars_lazy::frame::LazyCsvReader
source · pub struct LazyCsvReader { /* private fields */ }
csv
only.Implementations§
source§impl LazyCsvReader
impl LazyCsvReader
pub fn new_paths(paths: Arc<[PathBuf]>) -> Self
pub fn new(path: impl AsRef<Path>) -> Self
sourcepub fn with_skip_rows_after_header(self, offset: usize) -> Self
pub fn with_skip_rows_after_header(self, offset: usize) -> Self
Skip this number of rows after the header location.
sourcepub fn with_row_index(self, row_index: Option<RowIndex>) -> Self
pub fn with_row_index(self, row_index: Option<RowIndex>) -> Self
Add a row index column.
sourcepub fn with_n_rows(self, num_rows: Option<usize>) -> Self
pub fn with_n_rows(self, num_rows: Option<usize>) -> Self
Try to stop parsing when n
rows are parsed. During multithreaded parsing the upper bound n
cannot
be guaranteed.
sourcepub fn with_infer_schema_length(self, num_rows: Option<usize>) -> Self
pub fn with_infer_schema_length(self, num_rows: Option<usize>) -> Self
Set the number of rows to use when inferring the csv schema.
the default is 100 rows.
Setting to None
will do a full table scan, very slow.
sourcepub fn with_ignore_errors(self, ignore: bool) -> Self
pub fn with_ignore_errors(self, ignore: bool) -> Self
Continue with next batch when a ParserError is encountered.
sourcepub fn with_schema(self, schema: Option<SchemaRef>) -> Self
pub fn with_schema(self, schema: Option<SchemaRef>) -> Self
Set the CSV file’s schema
sourcepub fn with_skip_rows(self, skip_rows: usize) -> Self
pub fn with_skip_rows(self, skip_rows: usize) -> Self
Skip the first n
rows during parsing. The header will be parsed at row n
.
sourcepub fn with_dtype_overwrite(self, schema: Option<SchemaRef>) -> Self
pub fn with_dtype_overwrite(self, schema: Option<SchemaRef>) -> Self
Overwrite the schema with the dtypes in this given Schema. The given schema may be a subset of the total schema.
sourcepub fn with_has_header(self, has_header: bool) -> Self
pub fn with_has_header(self, has_header: bool) -> Self
Set whether the CSV file has headers
sourcepub fn with_separator(self, separator: u8) -> Self
pub fn with_separator(self, separator: u8) -> Self
Set the CSV file’s column separator as a byte character
sourcepub fn with_comment_prefix(self, comment_prefix: Option<&str>) -> Self
pub fn with_comment_prefix(self, comment_prefix: Option<&str>) -> Self
Set the comment prefix for this instance. Lines starting with this prefix will be ignored.
sourcepub fn with_quote_char(self, quote_char: Option<u8>) -> Self
pub fn with_quote_char(self, quote_char: Option<u8>) -> Self
Set the char
used as quote char. The default is b'"'
. If set to [None]
quoting is disabled.
sourcepub fn with_eol_char(self, eol_char: u8) -> Self
pub fn with_eol_char(self, eol_char: u8) -> Self
Set the char
used as end of line. The default is b'\n'
.
sourcepub fn with_null_values(self, null_values: Option<NullValues>) -> Self
pub fn with_null_values(self, null_values: Option<NullValues>) -> Self
Set values that will be interpreted as missing/ null.
sourcepub fn with_missing_is_null(self, missing_is_null: bool) -> Self
pub fn with_missing_is_null(self, missing_is_null: bool) -> Self
Treat missing fields as null.
sourcepub fn with_cache(self, cache: bool) -> Self
pub fn with_cache(self, cache: bool) -> Self
Cache the DataFrame after reading.
sourcepub fn with_low_memory(self, low_memory: bool) -> Self
pub fn with_low_memory(self, low_memory: bool) -> Self
Reduce memory usage at the expense of performance
sourcepub fn with_encoding(self, encoding: CsvEncoding) -> Self
pub fn with_encoding(self, encoding: CsvEncoding) -> Self
Set CsvEncoding
sourcepub fn with_try_parse_dates(self, try_parse_dates: bool) -> Self
Available on crate feature temporal
only.
pub fn with_try_parse_dates(self, try_parse_dates: bool) -> Self
temporal
only.Automatically try to parse dates/datetimes and time.
If parsing fails, columns remain of dtype [DataType::String]
.
sourcepub fn with_raise_if_empty(self, raise_if_empty: bool) -> Self
pub fn with_raise_if_empty(self, raise_if_empty: bool) -> Self
Raise an error if CSV is empty (otherwise return an empty frame)
sourcepub fn with_truncate_ragged_lines(self, truncate_ragged_lines: bool) -> Self
pub fn with_truncate_ragged_lines(self, truncate_ragged_lines: bool) -> Self
Truncate lines that are longer than the schema.
pub fn with_decimal_comma(self, decimal_comma: bool) -> Self
pub fn with_cloud_options(self, cloud_options: Option<CloudOptions>) -> Self
sourcepub fn with_schema_modify<F>(self, f: F) -> PolarsResult<Self>
pub fn with_schema_modify<F>(self, f: F) -> PolarsResult<Self>
Modify a schema before we run the lazy scanning.
Important! Run this function latest in the builder!
Trait Implementations§
source§impl Clone for LazyCsvReader
impl Clone for LazyCsvReader
source§fn clone(&self) -> LazyCsvReader
fn clone(&self) -> LazyCsvReader
1.0.0 · source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
source
. Read moresource§impl LazyFileListReader for LazyCsvReader
impl LazyFileListReader for LazyCsvReader
source§fn with_rechunk(self, rechunk: bool) -> Self
fn with_rechunk(self, rechunk: bool) -> Self
Rechunk the memory to contiguous chunks when parsing is done.
source§fn n_rows(&self) -> Option<usize>
fn n_rows(&self) -> Option<usize>
Try to stop parsing when n
rows are parsed. During multithreaded parsing the upper bound n
cannot
be guaranteed.
source§fn finish_no_glob(self) -> PolarsResult<LazyFrame>
fn finish_no_glob(self) -> PolarsResult<LazyFrame>
fn glob(&self) -> bool
fn paths(&self) -> &[PathBuf]
source§fn with_path(self, path: PathBuf) -> Self
fn with_path(self, path: PathBuf) -> Self
source§fn with_paths(self, paths: Arc<[PathBuf]>) -> Self
fn with_paths(self, paths: Arc<[PathBuf]>) -> Self
source§fn with_row_index(self, row_index: impl Into<Option<RowIndex>>) -> Self
fn with_row_index(self, row_index: impl Into<Option<RowIndex>>) -> Self
source§fn cloud_options(&self) -> Option<&CloudOptions>
fn cloud_options(&self) -> Option<&CloudOptions>
source§fn iter_paths(&self) -> PolarsResult<Option<PathIterator>>
fn iter_paths(&self) -> PolarsResult<Option<PathIterator>>
Auto Trait Implementations§
impl Freeze for LazyCsvReader
impl !RefUnwindSafe for LazyCsvReader
impl Send for LazyCsvReader
impl Sync for LazyCsvReader
impl Unpin for LazyCsvReader
impl !UnwindSafe for LazyCsvReader
Blanket Implementations§
source§impl<T> BorrowMut<T> for Twhere
T: ?Sized,
impl<T> BorrowMut<T> for Twhere
T: ?Sized,
source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
source§impl<T> IntoEither for T
impl<T> IntoEither for T
source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
self
into a Left
variant of Either<Self, Self>
if into_left
is true
.
Converts self
into a Right
variant of Either<Self, Self>
otherwise. Read moresource§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
self
into a Left
variant of Either<Self, Self>
if into_left(&self)
returns true
.
Converts self
into a Right
variant of Either<Self, Self>
otherwise. Read more