Repository Analysis

pola-rs/polars

Extremely fast Query Engine for DataFrames, written in Rust

8.2 · Low AI signal · View on GitHub
8.2
Adjusted Score
8.2
Raw Score
100%
Time Factor
2026-05-29
Last Push
38,625
Stars
Rust
Language
773,030
Lines of Code
3126
Files
5472
Pattern Hits
2026-05-31
Scan Date

Score History

Severity Breakdown

CRITICAL 0 · HIGH 212 · MEDIUM 252 · LOW 5008

Pattern Findings

5472 matches across 17 categories. Click a row to expand file-level details.

Hyper-Verbose Identifiers — 3132 hits · 2946 pts
Severity | File | Line | Snippet
LOWpy-polars/tests/benchmark/test_io.py12def test_write_read_scan_large_csv(groupby_data: pl.DataFrame, tmp_path: Path) -> None:
LOWpy-polars/tests/benchmark/test_join_where.py29def test_non_strict_inequalities(east_west: tuple[pl.DataFrame, pl.DataFrame]) -> None:
LOWpy-polars/tests/benchmark/test_join_where.py94def test_join_where_invalid_column() -> None:
LOWpy-polars/tests/benchmark/interop/test_numpy.py44def test_to_numpy_series_zero_copy(floats: pl.Series) -> None:
LOWpy-polars/tests/benchmark/interop/test_numpy.py48def test_to_numpy_series_with_nulls(floats_with_nulls: pl.Series) -> None:
LOWpy-polars/tests/benchmark/interop/test_numpy.py52def test_to_numpy_series_chunked(floats_chunked: pl.Series) -> None:
LOWpy-polars/tests/unit/conftest.py222def memory_usage_without_pyarrow() -> Generator[MemoryUsage, Any, Any]:
LOWpy-polars/tests/unit/test_schema.py6def test_contains_dtype_top_level() -> None:
LOWpy-polars/tests/unit/test_schema.py12def test_contains_dtype_recursive_nested() -> None:
LOWpy-polars/tests/unit/test_schema.py18def test_contains_dtype_recursive_struct() -> None:
LOWpy-polars/tests/unit/series/test_describe.py26def test_series_describe_float() -> None:
LOWpy-polars/tests/unit/series/test_describe.py45def test_series_describe_string() -> None:
LOWpy-polars/tests/unit/series/test_describe.py59def test_series_describe_boolean() -> None:
LOWpy-polars/tests/unit/series/test_describe.py77def test_series_describe_date() -> None:
LOWpy-polars/tests/unit/series/test_describe.py95def test_series_describe_empty() -> None:
LOWpy-polars/tests/unit/series/test_describe.py106def test_series_describe_null() -> None:
LOWpy-polars/tests/unit/series/test_describe.py117def test_series_describe_nested_list() -> None:
LOWpy-polars/tests/unit/series/test_getitem.py45def test_series_getitem_range(rng: range, expected_values: list[int]) -> None:
LOWpy-polars/tests/unit/series/test_getitem.py60def test_series_getitem_boolean_mask(mask: Any) -> None:
LOWpy-polars/tests/unit/series/test_getitem.py73def test_series_getitem_empty_inputs(input: Any) -> None:
LOWpy-polars/tests/unit/series/test_getitem.py81def test_series_getitem_multiple_indices(indices: Any) -> None:
LOWpy-polars/tests/unit/series/test_getitem.py88def test_series_getitem_numpy() -> None:
LOWpy-polars/tests/unit/series/test_getitem.py115def test_series_getitem_col_invalid_inputs(input: Any, match: str) -> None:
LOWpy-polars/tests/unit/series/test_rolling.py29def test_series_rolling_min_by(values: pl.Series, by_col: pl.Series) -> None:
LOWpy-polars/tests/unit/series/test_rolling.py35def test_series_rolling_max_by(values: pl.Series, by_col: pl.Series) -> None:
LOWpy-polars/tests/unit/series/test_rolling.py41def test_series_rolling_sum_by(values: pl.Series, by_col: pl.Series) -> None:
LOWpy-polars/tests/unit/series/test_rolling.py47def test_series_rolling_mean_by(values: pl.Series, by_col: pl.Series) -> None:
LOWpy-polars/tests/unit/series/test_rolling.py82def test_series_rolling_rank_by_with_nulls(
LOWpy-polars/tests/unit/series/test_rolling.py91def test_series_rolling_quantile_by_with_nulls(
LOWpy-polars/tests/unit/series/test_rolling.py100def test_series_rolling_median_by(values: pl.Series, by_col: pl.Series) -> None:
LOWpy-polars/tests/unit/series/test_rolling.py106def test_series_rolling_std_by(values: pl.Series, by_col: pl.Series) -> None:
LOWpy-polars/tests/unit/series/test_rolling.py112def test_series_rolling_var_by(values: pl.Series, by_col: pl.Series) -> None:
LOWpy-polars/tests/unit/series/test_rolling.py118def test_series_rolling_quantile_by(values: pl.Series, by_col: pl.Series) -> None:
LOWpy-polars/tests/unit/series/test_rolling.py124def test_series_rolling_rank_by(values: pl.Series, by_col: pl.Series) -> None:
LOWpy-polars/tests/unit/series/test_rolling.py130def test_series_rolling_min_by_temporal(
LOWpy-polars/tests/unit/series/test_rolling.py138def test_series_rolling_max_by_temporal(
LOWpy-polars/tests/unit/series/test_rolling.py146def test_series_rolling_sum_by_temporal(
LOWpy-polars/tests/unit/series/test_rolling.py154def test_series_rolling_mean_by_temporal(
LOWpy-polars/tests/unit/series/test_rolling.py162def test_series_rolling_median_by_temporal(
LOWpy-polars/tests/unit/series/test_rolling.py170def test_series_rolling_std_by_temporal(
LOWpy-polars/tests/unit/series/test_rolling.py178def test_series_rolling_var_by_temporal(
LOWpy-polars/tests/unit/series/test_rolling.py186def test_series_rolling_quantile_by_temporal(
LOWpy-polars/tests/unit/series/test_rolling.py194def test_series_rolling_rank_by_temporal(
LOWpy-polars/tests/unit/series/test_rolling.py64def test_series_rolling_by_with_nulls(
LOWpy-polars/tests/unit/series/test_equals.py53def test_series_equals_check_names() -> None:
LOWpy-polars/tests/unit/series/test_equals.py124def test_series_equals_strict_deprecated() -> None:
LOWpy-polars/tests/unit/series/test_scatter.py93def test_scatter_logical_all_null() -> None:
LOWpy-polars/tests/unit/series/test_zip_with.py7def test_zip_with_all_true_mask() -> None:
LOWpy-polars/tests/unit/series/test_zip_with.py16def test_zip_with_all_false_mask() -> None:
LOWpy-polars/tests/unit/series/test_zip_with.py35def test_zip_with_series_comparison() -> None:
LOWpy-polars/tests/unit/series/test_zip_with.py44def test_zip_with_null_values() -> None:
LOWpy-polars/tests/unit/series/test_zip_with.py54def test_zip_with_length_mismatch() -> None:
LOWpy-polars/tests/unit/series/test_zip_with.py63def test_zip_with_bad_input_type() -> None:
LOWpy-polars/tests/unit/series/test_item.py22def test_series_item_incorrect_shape() -> None:
LOWpy-polars/tests/unit/series/test_item.py34def test_series_item_with_index(index: int, expected: int, s: pl.Series) -> None:
LOWpy-polars/tests/unit/series/test_item.py39def test_df_item_out_of_bounds(index: int, s: pl.Series) -> None:
LOWpy-polars/tests/unit/series/test_item.py45def test_series_item_out_of_range_date() -> None:
LOWpy-polars/tests/unit/series/test_extend.py46def test_extend_with_null_series() -> None:
LOWpy-polars/tests/unit/series/test_series.py2235def test_series_getitem_out_of_bounds_positive() -> None:
LOWpy-polars/tests/unit/series/test_series.py2243def test_series_getitem_out_of_bounds_negative() -> None:
3072 more matches not shown…
Cross-Language Confusion — 201 hits · 892 pts
Severity | File | Line | Snippet
HIGHpy-polars/tests/unit/series/test_equals.py14 assert s1.equals(s2) is True
HIGHpy-polars/tests/unit/series/test_equals.py15 assert s1.equals(s2, check_dtypes=True) is False
HIGHpy-polars/tests/unit/series/test_equals.py16 assert s1.equals(s2, null_equal=False) is False
HIGHpy-polars/tests/unit/series/test_equals.py28 assert s3.equals(s4) is False
HIGHpy-polars/tests/unit/series/test_equals.py29 assert s3.equals(s4, check_dtypes=True) is False
HIGHpy-polars/tests/unit/series/test_equals.py30 assert s3.equals(s4, null_equal=False) is False
HIGHpy-polars/tests/unit/series/test_equals.py37 s1.equals(pl.DataFrame(s2), check_names=False) # type: ignore[arg-type]
HIGHpy-polars/tests/unit/series/test_equals.py43 s1.equals(pl.DataFrame(s2).lazy(), check_names=False) # type: ignore[arg-type]
HIGHpy-polars/tests/unit/series/test_equals.py50 assert s5.equals(DummySeriesSubclass(s5)) is True
HIGHpy-polars/tests/unit/series/test_equals.py56 assert s1.equals(s2) is True
HIGHpy-polars/tests/unit/series/test_equals.py57 assert s1.equals(s2, check_names=True) is False
HIGHpy-polars/tests/unit/series/test_equals.py128 assert not s1.equals(s2, strict=True) # type: ignore[call-arg]
HIGHpy-polars/tests/unit/series/test_equals.py321 assert s.equals(s)
HIGHpy-polars/tests/unit/series/test_series.py2377 assert calculated.equals(expected)
HIGHpy-polars/tests/unit/dataframe/test_df.py3339 assert df.equals(expected)
HIGHpy-polars/tests/unit/dataframe/test_df.py3346 assert df.equals(expected)
HIGHpy-polars/tests/unit/dataframe/test_equals.py23 assert df1.equals(df1) is True
HIGHpy-polars/tests/unit/dataframe/test_equals.py24 assert df1.equals(df2) is False
HIGHpy-polars/tests/unit/dataframe/test_equals.py34 assert df1.equals(df3) is False
HIGHpy-polars/tests/unit/dataframe/test_equals.py44 assert df.equals(df.with_columns(pl.col("foo").cast(pl.Int8))) is True
HIGHpy-polars/tests/unit/dataframe/test_equals.py45 assert df.equals(df.with_columns(pl.col("ham").cast(pl.Categorical))) is True
HIGHpy-polars/tests/unit/dataframe/test_equals.py48 assert df.equals(df) is True
HIGHpy-polars/tests/unit/dataframe/test_equals.py49 assert df.equals(df, null_equal=False) is False
HIGHpy-polars/tests/unit/dataframe/test_equals.py60 df1.equals(df2.lazy()) # type: ignore[arg-type]
HIGHpy-polars/tests/unit/dataframe/test_equals.py66 df1.equals(pl.Series([1, 2, 3])) # type: ignore[arg-type]
HIGHpy-polars/tests/unit/dataframe/test_equals.py73 assert df1.equals(df2) is True
HIGHpy-polars/tests/unit/dataframe/test_glimpse.py52 $ d <str> null, 'b', 'c'
HIGHpy-polars/tests/unit/dataframe/test_0_width_df.py10 assert df.equals(df)
HIGHpy-polars/tests/unit/dataframe/test_0_width_df.py11 assert not df.equals(pl.DataFrame())
HIGHpy-polars/tests/unit/datatypes/test_list.py868 assert expected.equals(actual)
HIGHpy-polars/tests/unit/datatypes/test_temporal.py381 assert s.equals(tz_s, null_equal=False) is False
HIGHpy-polars/tests/unit/datatypes/test_temporal.py382 assert s.equals(tz_s, null_equal=True) is False
HIGHpy-polars/tests/unit/datatypes/test_datatype_exprs.py84 (pl.List(pl.Null()), "list", "list[null]", None),
HIGHpy-polars/tests/unit/datatypes/test_datatype_exprs.py92 (pl.Array(pl.Null(), 2), "array", "array[null, 2]", 0),
HIGHpy-polars/tests/unit/interop/test_from_pandas.py405 pd_df = pd.DataFrame({"col": ["a", null]})
HIGHpy-polars/tests/unit/interop/test_interop.py374 # Create a pyarrow table with a list[null] column.
HIGHpy-polars/tests/unit/interop/test_interop.py1018 assert df.equals(df_res)
HIGHpy-polars/tests/unit/io/test_ipc.py117 assert pd_df.equals(pd_df_read)
HIGHpy-polars/tests/unit/io/test_lazy_parquet.py1026assert [x.equals(pl.DataFrame({"x": 1})) for x in results] == [
HIGHpy-polars/tests/unit/io/test_lazy_json.py302{"a": {"x": 1}, "b": [1,2,3], "c": {"y": null}, "d": [{"k": "abc"}, {"j": "123"}, {"l": 7, "m": 8}]}
HIGHpy-polars/tests/unit/io/test_lazy_json.py316 "c": '{"y": null}',
HIGHpy-polars/tests/unit/io/test_json.py226 assert out == '{"a":1,"b":"a"}\n{"a":2,"b":"b"}\n{"a":3,"b":null}\n'
HIGHpy-polars/tests/unit/io/test_json.py373 {"id": 1, "zero_column": 0, "empty_array_column": [], "empty_object_column": {}, "null_column": null}
HIGHpy-polars/tests/unit/io/test_json.py374 {"id": 2, "zero_column": 0, "empty_array_column": [], "empty_object_column": {}, "null_column": null}
HIGHpy-polars/tests/unit/io/test_json.py375 {"id": 3, "zero_column": 0, "empty_array_column": [], "empty_object_column": {}, "null_column": null}
HIGHpy-polars/tests/unit/io/test_json.py376 {"id": 4, "zero_column": 0, "empty_array_column": [], "empty_object_column": {}, "null_column": null}
HIGHpy-polars/tests/unit/io/test_json.py594 {"a": null},
HIGHpy-polars/tests/unit/io/test_json.py36 assert out == '[{"a":1,"b":"a"},{"a":2,"b":"b"},{"a":3,"b":null}]'
HIGHpy-polars/tests/unit/io/test_json.py159 assert value == """[{"a":"1.00"},{"a":"2.00"},{"a":null}]"""
HIGHpy-polars/tests/unit/io/test_json.py397 {"map": "a", "start_time": null, "end_time": null}
HIGHpy-polars/tests/unit/io/test_json.py178 {"a": 5, "b": "foo", "c": null},
HIGHpy-polars/tests/unit/io/test_json.py179 {"a": 11.4, "b": null, "c": true, "d": 8},
HIGHpy-polars/tests/unit/io/test_json.py201 {"a": 5, "b": "foo", "c": null},
HIGHpy-polars/tests/unit/io/test_json.py202 {"a": 11.4, "b": null, "c": true, "d": 8},
HIGHpy-polars/tests/unit/io/test_json.py645 io.StringIO("""{"a":null,"b":null,"c":null}"""),
HIGHpy-polars/tests/unit/io/test_csv.py1035 df.write_csv(f, null_value=null)
HIGHpy-polars/tests/unit/io/test_csv.py1037 df_read = pl.read_csv(f, null_values=null)
HIGHpy-polars/tests/unit/io/test_csv.py2410 assert df.equals(pl.read_csv(f, schema={"x": dtype}))
HIGHpy-polars/tests/unit/meta/test_errors.py724 match=r"shift value 'n' is null, which currently returns a column of null values. This will become an error in t
HIGHpy-polars/tests/unit/operations/test_is_sorted.py34 # left all-null, right 0 < null_count < len
141 more matches not shown…
Unused Imports — 1054 hits · 876 pts
Severity | File | Line | Snippet
LOWpy-polars/tests/conftest.py1
LOWpy-polars/tests/benchmark/test_group_by.py10
LOWpy-polars/tests/benchmark/test_filter.py3
LOWpy-polars/tests/benchmark/test_join_where.py3
LOWpy-polars/tests/benchmark/interop/test_numpy.py3
LOWpy-polars/tests/benchmark/data/__init__.py3
LOWpy-polars/tests/benchmark/data/h2oai/__init__.py3
LOWpy-polars/tests/unit/conftest.py1
LOWpy-polars/tests/unit/test_schema.py1
LOWpy-polars/tests/unit/series/test_to_list.py1
LOWpy-polars/tests/unit/series/test_getitem.py1
LOWpy-polars/tests/unit/series/test_item.py1
LOWpy-polars/tests/unit/series/test_contains.py1
LOWpy-polars/tests/unit/series/test_all_any.py1
LOWpy-polars/tests/unit/series/test_series.py1
LOW…-polars/tests/unit/series/buffers/test_from_buffers.py1
LOWpy-polars/tests/unit/series/buffers/test_from_buffer.py1
LOWpy-polars/tests/unit/dataframe/test_from_dict.py1
LOWpy-polars/tests/unit/dataframe/test_df.py1
LOWpy-polars/tests/unit/dataframe/test_upsample.py1
LOWpy-polars/tests/unit/dataframe/test_describe.py1
LOWpy-polars/tests/unit/dataframe/test_null_count.py1
LOWpy-polars/tests/unit/dataframe/test_getitem.py1
LOWpy-polars/tests/unit/dataframe/test_glimpse.py1
LOWpy-polars/tests/unit/dataframe/test_repr.py1
LOWpy-polars/tests/unit/dataframe/test_item.py1
LOWpy-polars/tests/unit/dataframe/test_to_dict.py1
LOWpy-polars/tests/unit/dataframe/test_serde.py1
LOWpy-polars/tests/unit/datatypes/test_duration.py1
LOWpy-polars/tests/unit/datatypes/test_utils.py1
LOWpy-polars/tests/unit/datatypes/test_extension.py1
LOWpy-polars/tests/unit/datatypes/test_list.py1
LOWpy-polars/tests/unit/datatypes/test_datatypes.py1
LOWpy-polars/tests/unit/datatypes/test_parse.py1
LOWpy-polars/tests/unit/datatypes/test_decimal.py1
LOWpy-polars/tests/unit/datatypes/test_temporal.py1
LOWpy-polars/tests/unit/datatypes/test_categorical.py1
LOWpy-polars/tests/unit/datatypes/test_struct.py1
LOWpy-polars/tests/unit/datatypes/test_bool.py1
LOWpy-polars/tests/unit/datatypes/test_null.py1
LOWpy-polars/tests/unit/datatypes/test_categories.py1
LOWpy-polars/tests/unit/datatypes/test_object.py1
LOWpy-polars/tests/unit/datatypes/test_datatype_exprs.py1
LOWpy-polars/tests/unit/datatypes/test_enum.py2
LOWpy-polars/tests/unit/interop/test_arrow_stream_error.py3
LOWpy-polars/tests/unit/interop/test_from_pandas.py1
LOWpy-polars/tests/unit/interop/test_to_init_repr.py1
LOWpy-polars/tests/unit/interop/test_to_init_repr.py3
LOWpy-polars/tests/unit/interop/test_interop.py1
LOWpy-polars/tests/unit/interop/test_to_pandas.py1
LOWpy-polars/tests/unit/interop/numpy/test_to_numpy_df.py1
LOWpy-polars/tests/unit/interop/numpy/test_ufunc_expr.py1
LOW…-polars/tests/unit/interop/numpy/test_from_numpy_df.py1
LOW…olars/tests/unit/interop/numpy/test_to_numpy_series.py1
LOW…ars/tests/unit/interop/numpy/test_from_numpy_series.py1
LOWpy-polars/tests/unit/io/test_ipc.py1
LOWpy-polars/tests/unit/io/test_lazy_ipc.py1
LOWpy-polars/tests/unit/io/test_parquet.py1
LOWpy-polars/tests/unit/io/test_sink.py1
LOWpy-polars/tests/unit/io/test_utils.py1
994 more matches not shown…
Decorative Section Separators — 214 hits · 698 pts
Severity | File | Line | Snippet
MEDIUM…polars-plan/src/plans/optimizer/slice_pushdown_expr.rs310 // ┌──────►==◄─────┐ (current expr)
MEDIUM…polars-plan/src/plans/optimizer/slice_pushdown_expr.rs318 // ┌──────┐ ┌──────┐ │
MEDIUM…polars-plan/src/plans/optimizer/slice_pushdown_expr.rs320 // └──────┘ └──────┘
MEDIUM…lars-plan/src/plans/conversion/type_coercion/binary.rs439 // ┌─────────────────────┬─────────────────────┬──────┐
MEDIUM…lars-plan/src/plans/conversion/type_coercion/binary.rs443 // ╞═════════════════════╪═════════════════════╪══════╡
MEDIUM…lars-plan/src/plans/conversion/type_coercion/binary.rs447 // └─────────────────────┴─────────────────────┴──────┘
MEDIUM…lars-plan/src/plans/conversion/type_coercion/binary.rs461 // ┌─────────────────────────────────┬─────┬───────┐
MEDIUM…lars-plan/src/plans/conversion/type_coercion/binary.rs465 // ╞═════════════════════════════════╪═════╪═══════╡
MEDIUM…lars-plan/src/plans/conversion/type_coercion/binary.rs469 // └─────────────────────────────────┴─────┴───────┘
MEDIUMcrates/polars-plan/src/dsl/mod.rs813 /// ╭────────┬────────╮
MEDIUMcrates/polars-plan/src/dsl/mod.rs817 /// ╞════════╪════════╡
MEDIUMcrates/polars-plan/src/dsl/mod.rs828 /// ╰────────┴────────╯
MEDIUMcrates/polars-row/src/lib.rs144//! ┌──────────┐ ┌─────┐
MEDIUMcrates/polars-row/src/lib.rs145//! │ "Bar" │ ───────────────▶│ 01 │
MEDIUMcrates/polars-row/src/lib.rs146//! └──────────┘ └─────┘
MEDIUMcrates/polars-row/src/lib.rs147//! ┌──────────┐ ┌─────┬─────┐
MEDIUMcrates/polars-row/src/lib.rs148//! │"Fabulous"│ ───────────────▶│ 01 │ 02 │
MEDIUMcrates/polars-row/src/lib.rs149//! └──────────┘ └─────┴─────┘
MEDIUMcrates/polars-row/src/lib.rs150//! ┌──────────┐ ┌─────┐
MEDIUMcrates/polars-row/src/lib.rs151//! │ "Soup" │ ───────────────▶│ 05 │
MEDIUMcrates/polars-row/src/lib.rs152//! └──────────┘ └─────┘
MEDIUMcrates/polars-row/src/lib.rs153//! ┌──────────┐ ┌─────┐
MEDIUMcrates/polars-row/src/lib.rs154//! │ "ZZ" │ ───────────────▶│ 07 │
MEDIUMcrates/polars-row/src/lib.rs155//! └──────────┘ └─────┘
MEDIUMcrates/polars-row/src/lib.rs162//! ┌─────┬─────┬─────┬─────┐
MEDIUMcrates/polars-row/src/lib.rs164//! └─────┴─────┴─────┴─────┘
MEDIUMcrates/polars-row/src/lib.rs166//! ┌─────┬─────┬─────┐
MEDIUMcrates/polars-row/src/lib.rs168//! └─────┴─────┴─────┘
MEDIUMcrates/polars-row/src/lib.rs170//! ┌─────┐
MEDIUMcrates/polars-row/src/lib.rs172//! └─────┘
MEDIUMcrates/polars-row/src/lib.rs188//! ┌───────┬────────────────────────┬───────┐
MEDIUMcrates/polars-row/src/lib.rs190//! └───────┴────────────────────────┴───────┘
MEDIUMcrates/polars-row/src/lib.rs196//! ┌───────┬───────────────┬───────┬─────────┬───────┐
MEDIUMcrates/polars-row/src/lib.rs198//! └───────┴───────────────┴───────┴─────────┴───────┘
MEDIUMcrates/polars-row/src/lib.rs239//! └──── rows ────┘ └───────── row lengths ─────────┘ └─ count ─┘
MEDIUMcrates/polars/src/docs/eager.rs371//! // ╭─────┬─────╮
MEDIUMcrates/polars/src/docs/eager.rs375//! // ╞═════╪═════╡
MEDIUMcrates/polars/src/docs/eager.rs379//! // ╰─────┴─────╯
MEDIUMcrates/polars/src/docs/lazy.rs60//! // ╭─────┬─────╮
MEDIUMcrates/polars/src/docs/lazy.rs64//! // ╞═════╪═════╡
MEDIUMcrates/polars/src/docs/lazy.rs66//! // ╰─────┴─────╯
MEDIUMcrates/polars/src/docs/lazy.rs90//! // ╭─────┬─────╮
MEDIUMcrates/polars/src/docs/lazy.rs94//! // ╞═════╪═════╡
MEDIUMcrates/polars/src/docs/lazy.rs98//! // ╰─────┴─────╯
MEDIUMcrates/polars/src/docs/lazy.rs148//! // ╭─────┬─────┬─────┬──────┬─────────╮
MEDIUMcrates/polars/src/docs/lazy.rs152//! // ╞═════╪═════╪═════╪══════╪═════════╡
MEDIUMcrates/polars/src/docs/lazy.rs159//! // ╰─────┴─────┴─────┴──────┴─────────╯
MEDIUMcrates/polars/src/docs/lazy.rs218//! // ╭───────┬───────┬───────┬────────────╮
MEDIUMcrates/polars/src/docs/lazy.rs222//! // ╞═══════╪═══════╪═══════╪════════════╡
MEDIUMcrates/polars/src/docs/lazy.rs233//! // ╰───────┴───────┴───────┴────────────╯
MEDIUMpy-polars/pyproject.toml217 # ------------------------------------------------------------------
MEDIUMpy-polars/pyproject.toml219 # ------------------------------------------------------------------
MEDIUMpy-polars/pyproject.toml223 # ------------------------------------------------------------------
MEDIUMpy-polars/requirements-dev.txt14# ------------
MEDIUMpy-polars/requirements-dev.txt16# ------------
MEDIUMpy-polars/requirements-ci.txt1# -------------------------------------------------------
MEDIUMpy-polars/requirements-ci.txt4# -------------------------------------------------------
MEDIUMpy-polars/tests/unit/dataframe/test_from_dict.py21 # ┌─────┬─────┐
MEDIUMpy-polars/tests/unit/dataframe/test_from_dict.py25 # ╞═════╪═════╡
MEDIUMpy-polars/tests/unit/dataframe/test_from_dict.py28 # └─────┴─────┘
154 more matches not shown…
Over-Commented Block — 651 hits · 602 pts
Severity | File | Line | Snippet
LOWcrates/polars-buffer/src/buffer.rs1use std::ops::{Deref, Range, RangeBounds};
LOWcrates/polars-buffer/src/buffer.rs21/// ```
LOWcrates/polars-buffer/src/buffer.rs181 // SAFETY: invariant of this struct `offset + length <= data.len()`.
LOWcrates/polars-buffer/src/buffer.rs241 /// the index `mid` itself) and the second will contain all
LOWcrates/polars-expr/src/hash_keys.rs201
LOWcrates/polars-expr/src/expressions/window.rs141 // The example below shows the naive version without group tuple mapping
LOWcrates/polars-expr/src/expressions/window.rs301 match (self.mapping, ac.agg_state()) {
LOWcrates/polars-expr/src/expressions/window.rs361 // this stores all group values on the original df size
LOWcrates/polars-expr/src/expressions/mod.rs141 /// 1. already aggregated as list
LOWcrates/polars-expr/src/expressions/mod.rs521 AggState::LiteralScalar(c) => (c, groups),
LOWcrates/polars-expr/src/expressions/mod.rs541 // [0, 1],
LOWcrates/polars-expr/src/expressions/mod.rs721 /// Think of sort, slice, filter, shift, etc.
LOWcrates/polars-expr/src/expressions/apply.rs481 // multiple inputs to have a compatible data layout as it invokes `flat_naive()`.
LOWcrates/polars-expr/src/expressions/apply.rs501 // - el = elementwise, no need to aggregate() NotAgg
LOWcrates/polars-expr/src/expressions/apply.rs521 // groups_diverge | el+agg | ga
LOWcrates/polars-mem-engine/src/scan_predicate/mod.rs21/// All the expressions and metadata used to filter out rows using predicates.
LOWcrates/polars-plan/src/bin/dsl-schema.rs1//! A tool for working with DSL schema.
LOWcrates/polars-plan/src/plans/options.rs61 /// expression is the output name.
LOWcrates/polars-plan/src/plans/options.rs81 /// the following functions based on the output type and number of elements:
LOW…polars-plan/src/plans/optimizer/slice_pushdown_expr.rs301 // We propagate upwards the position of the last non-elementwise node(s), these represent
LOW…olars-plan/src/plans/optimizer/collapse_and_project.rs1use std::collections::BTreeSet;
LOW…ars-plan/src/plans/optimizer/parquet_metadata_prune.rs1//! Prune `FileScanIR::Parquet::metadata` to projected + predicate columns.
LOW…rs-plan/src/plans/optimizer/predicate_pushdown/join.rs761 let mut project_to_original: Option<Vec<ExprIR>> = None;
LOW…es/polars-plan/src/plans/optimizer/cse/cache_states.rs61 // Only filter and projection nodes are allowed, any other node we stop.
LOW…es/polars-plan/src/plans/optimizer/cse/cache_states.rs81// |--------------------|-------------------|
LOW…es/polars-plan/src/plans/optimizer/cse/cache_states.rs101// |
LOWcrates/polars-plan/src/plans/optimizer/cse/csee.rs261 Entered(usize),
LOWcrates/polars-plan/src/plans/optimizer/cse/csee.rs301 }
LOWcrates/polars-plan/src/plans/optimizer/cse/csee.rs321//
LOWcrates/polars-plan/src/plans/optimizer/cse/csee.rs341// post-visit: col(bar) EEE EEI id: col(bar)
LOWcrates/polars-plan/src/plans/optimizer/cse/csee.rs601// Expression tree with [pre-visit,post-visit] indices
LOWcrates/polars-plan/src/plans/optimizer/cse/csee.rs621// in this tree `col(foo).sum()` should be post-visited/mutated
LOWcrates/polars-plan/src/plans/python/pyarrow.rs141 #[cfg(feature = "dtype-struct")]
LOW…ates/polars-plan/src/plans/conversion/convert_utils.rs1use super::*;
LOW…lars-plan/src/plans/conversion/type_coercion/binary.rs421 if dtype_lhs == lit_rhs.dtype() {
LOW…lars-plan/src/plans/conversion/type_coercion/binary.rs441 // │ --- ┆ --- ┆ --- │
LOWcrates/polars-plan/src/plans/aexpr/minterm_iter.rs1use polars_utils::arena::{Arena, Node};
LOWcrates/polars-plan/src/plans/aexpr/determinism.rs1use polars_utils::idx_vec::UnitVec;
LOWcrates/polars-plan/src/plans/aexpr/determinism.rs41 #[cfg(feature = "dtype-struct")]
LOWcrates/polars-plan/src/plans/aexpr/or_factoring.rs1//! OR factoring: `(A∧X) ∨ (A∧Y) → A ∧ (X∨Y)`
LOWcrates/polars-plan/src/plans/aexpr/predicates/mod.rs41/// is `true` iff a null was dropped; under `nulls_equal=true` the caller must
LOW…polars-plan/src/plans/aexpr/predicates/skip_batches.rs21///
LOW…ates/polars-plan/src/plans/aexpr/properties/general.rs201 /// e.g. non-strict cast
LOWcrates/polars-plan/src/frame/opt_state.rs21 /// Run common-subplan-elimination. This elides duplicate plans and caches their
LOWcrates/polars-plan/src/dsl/list.rs201 }
LOWcrates/polars-plan/src/dsl/arity.rs81
LOWcrates/polars-plan/src/dsl/arity.rs101 // .otherwise( |
LOWcrates/polars-plan/src/dsl/mod.rs381 /// # use polars_core::prelude::*;
LOWcrates/polars-plan/src/dsl/mod.rs781 /// This is similar to a group_by + aggregation + self join.
LOWcrates/polars-plan/src/dsl/mod.rs801 /// sum("values").over([col("groups")]),
LOWcrates/polars-plan/src/dsl/mod.rs1041 /// # Example
LOWcrates/polars-plan/src/dsl/mod.rs1441 self.map_binary(FunctionExpr::Diff(null_behavior), n)
LOWcrates/polars-plan/src/dsl/mod.rs1521 /// If `ignore_nulls` is `False`, [Kleene logic] is used to deal with nulls:
LOWcrates/polars-plan/src/dsl/string.rs201 /// Pad the end of the string until it reaches the given length.
LOWcrates/polars-plan/src/dsl/string.rs461 self.0.map_unary(StringFunction::Titlecase)
LOWcrates/polars-plan/src/dsl/name.rs1#[cfg(feature = "dtype-struct")]
LOWcrates/polars-plan/src/dsl/options/mod.rs281#[derive(Clone, Debug, Eq, PartialEq, Default, Hash)]
LOWcrates/polars-plan/src/dsl/functions/selectors.rs1use super::*;
LOWcrates/polars-plan/src/dsl/functions/temporal.rs21/// at once.
LOWcrates/polars-plan/src/dsl/functions/temporal.rs221 time_zone,
591 more matches not shown…
Deep Nesting — 129 hits · 126 pts
Severity | File | Line | Snippet
LOWpy-polars/tests/conftest.py25
LOWpy-polars/tests/conftest.py110
LOWpy-polars/tests/unit/datatypes/test_float.py149
LOWpy-polars/tests/unit/io/test_delta_deletion_vector.py167
LOWpy-polars/tests/unit/meta/test_config.py604
LOWpy-polars/tests/unit/meta/test_api.py129
LOWpy-polars/tests/unit/operations/test_bitwise.py89
LOW…polars/tests/unit/operations/test_row_encoding_sort.py37
LOWpy-polars/tests/unit/operations/test_slice.py404
LOWpy-polars/tests/unit/operations/test_inequality_join.py312
LOW…-polars/tests/unit/operations/test_group_by_dynamic.py1213
LOW…polars/tests/unit/functions/range/test_linear_space.py31
LOWpy-polars/tests/unit/lazyframe/test_optimizations.py283
LOWpy-polars/src/polars/selectors.py273
LOWpy-polars/src/polars/selectors.py1017
LOWpy-polars/src/polars/selectors.py1207
LOWpy-polars/src/polars/selectors.py358
LOWpy-polars/src/polars/series/series.py9721
LOWpy-polars/src/polars/series/series.py266
LOWpy-polars/src/polars/series/series.py849
LOWpy-polars/src/polars/series/series.py1153
LOWpy-polars/src/polars/series/series.py1620
LOWpy-polars/src/polars/series/series.py4782
LOWpy-polars/src/polars/series/utils.py26
LOWpy-polars/src/polars/_utils/slice.py83
LOWpy-polars/src/polars/_utils/slice.py124
LOWpy-polars/src/polars/_utils/various.py294
LOWpy-polars/src/polars/_utils/various.py311
LOWpy-polars/src/polars/_utils/various.py523
LOWpy-polars/src/polars/_utils/various.py680
LOWpy-polars/src/polars/_utils/deprecation.py334
LOWpy-polars/src/polars/_utils/serde.py34
LOWpy-polars/src/polars/_utils/getitem.py50
LOWpy-polars/src/polars/_utils/getitem.py182
LOWpy-polars/src/polars/_utils/getitem.py291
LOWpy-polars/src/polars/_utils/udfs.py345
LOWpy-polars/src/polars/_utils/udfs.py1186
LOWpy-polars/src/polars/_utils/udfs.py425
LOWpy-polars/src/polars/_utils/udfs.py654
LOWpy-polars/src/polars/_utils/udfs.py677
LOWpy-polars/src/polars/_utils/udfs.py949
LOWpy-polars/src/polars/_utils/udfs.py1050
LOWpy-polars/src/polars/_utils/udfs.py1152
LOWpy-polars/src/polars/_utils/nest_asyncio.py171
LOWpy-polars/src/polars/_utils/nest_asyncio.py242
LOWpy-polars/src/polars/_utils/nest_asyncio.py121
LOWpy-polars/src/polars/_utils/nest_asyncio.py266
LOWpy-polars/src/polars/_utils/nest_asyncio.py321
LOWpy-polars/src/polars/_utils/parse/expr.py22
LOWpy-polars/src/polars/_utils/parse/expr.py162
LOWpy-polars/src/polars/_utils/construction/dataframe.py287
LOWpy-polars/src/polars/_utils/construction/dataframe.py337
LOWpy-polars/src/polars/_utils/construction/dataframe.py476
LOWpy-polars/src/polars/_utils/construction/dataframe.py543
LOWpy-polars/src/polars/_utils/construction/dataframe.py967
LOWpy-polars/src/polars/_utils/construction/dataframe.py1213
LOWpy-polars/src/polars/_utils/construction/series.py76
LOWpy-polars/src/polars/_utils/construction/series.py447
LOWpy-polars/src/polars/_utils/construction/utils.py86
LOWpy-polars/src/polars/dataframe/frame.py378
69 more matches not shown…
AI Slop Vocabulary — 21 hits · 62 pts
Severity | File | Line | Snippet
MEDIUMcrates/polars-expr/src/expressions/structeval.rs300 // elementwise top-level and not fallible. We leverage the reference dispatch for ApplyExpr,
MEDIUM…polars-plan/src/plans/aexpr/predicates/skip_batches.rs553 // Essentially, what this does is
MEDIUMcrates/polars-core/src/series/arithmetic/list.rs271 // * Essentially as if the NULL primitive was added to every primitive in the row of the list column.
MEDIUMcrates/polars-core/src/chunked_array/mod.rs122/// When multiplying two [`ChunkedArray`]s with different chunk sizes they cannot utilize [SIMD](https://en.wikipedia.or
MEDIUMcrates/polars-core/src/chunked_array/logical/time.rs12 // Invalid time values are replaced with `null` during the arrow cast. We utilize the
MEDIUMcrates/polars-core/src/frame/column/mod.rs720 // We utilize the aggregation on Series to see:
MEDIUMcrates/polars-arrow/src/array/mod.rs547 /// This is an API to leverage clone-on-write
MEDIUMcrates/polars-arrow/src/array/utf8/mutable.rs222 /// This is an API to leverage clone-on-write
MEDIUMcrates/polars-arrow/src/array/utf8/mod.rs480 /// This is an API to leverage clone-on-write
MEDIUMcrates/polars-io/src/parquet/read/read_impl.rs496 // faster. Essentially, it sees how many times it needs to switch between
MEDIUMcrates/polars-stream/src/nodes/joins/equi_join.rs1022 // TODO: implement something more re-usable and robust.
MEDIUMcrates/polars/tests/it/io/parquet/read/mod.rs3/// In comparison to Arrow, this in-memory format does not leverage logical types nor SIMD operations,
MEDIUMpy-polars/tests/unit/io/test_spreadsheet.py628 # read multiple sheets in conjunction with 'schema_overrides'
MEDIUMpy-polars/tests/unit/io/test_delta_deletion_vector.py29# explicitly not comprehensive and should be used with care.
MEDIUM…ests/unit/operations/namespaces/temporal/test_round.py123 # Definitely uses slowpath:
MEDIUM…s/unit/operations/namespaces/temporal/test_truncate.py120 # Definitely uses slowpath:
MEDIUM…/tests/unit/testing/parametric/strategies/test_core.py301 # ensure dtype constraint works in conjunction with 'n' cols
MEDIUMpy-polars/tests/unit/constructors/test_constructors.py253 # in conjunction with full 'columns' override (rename/downcast)
MEDIUMpy-polars/src/polars/_utils/construction/series.py358 # # Essentially, when given a [0, u64::MAX] then it would Overflow.
MEDIUMpy-polars/src/polars/io/spreadsheet/_write_utils.py239 """Insert dummy frame columns in order to create empty/named table columns."""
MEDIUMpy-polars/src/polars/functions/col.py120 # note: using `co_qualname` is more robust; can additionally
Cross-File Repetition — 9 hits · 45 pts
Severity | File | Line | Snippet
HIGHpy-polars/tests/unit/io/database/test_read.py0select cast(strftime('%y',"date") as int) as "year", name, value from test_data where value < {n}
HIGHpy-polars/tests/unit/io/database/test_read.py0select cast(strftime('%y',"date") as int) as "year", name, value from test_data where value < {n}
HIGHpy-polars/tests/unit/io/database/test_read.py0select cast(strftime('%y',"date") as int) as "year", name, value from test_data where value < {n}
HIGHpy-polars/tests/unit/io/database/test_read.py0select cast(strftime('%y',"date") as int) as "year", name, value from test_data where value between {param_1} and {param
HIGHpy-polars/tests/unit/io/database/test_read.py0select cast(strftime('%y',"date") as int) as "year", name, value from test_data where value between {param_1} and {param
HIGHpy-polars/tests/unit/io/database/test_read.py0select cast(strftime('%y',"date") as int) as "year", name, value from test_data where value between {param_1} and {param
HIGHpy-polars/src/polars/string_cache.py0does nothing. .. deprecated:: 1.41.0 the string cache was used to maintain the mapping for the categorical dtype, this i
HIGHpy-polars/src/polars/string_cache.py0does nothing. .. deprecated:: 1.41.0 the string cache was used to maintain the mapping for the categorical dtype, this i
HIGHpy-polars/src/polars/string_cache.py0does nothing. .. deprecated:: 1.41.0 the string cache was used to maintain the mapping for the categorical dtype, this i
Self-Referential Comments13 hits · 38 pts
SeverityFileLineSnippet
MEDIUMpy-polars/tests/unit/datatypes/test_list.py117 # Create a left relation where the join column contains a null value.
MEDIUMpy-polars/tests/unit/datatypes/test_list.py123 # Create a right relation where there is a column to count distinct on.
MEDIUMpy-polars/tests/unit/datatypes/test_temporal.py2368 # Create a Series where the null value is backed by a value which would
MEDIUMpy-polars/tests/unit/interop/test_interop.py374 # Create a pyarrow table with a list[null] column.
MEDIUMpy-polars/tests/unit/interop/test_interop.py349 # Create an enum / categorical / dictionary typed pyarrow array
MEDIUMpy-polars/tests/unit/interop/test_interop.py872 # Create a dataset with 3 rows
MEDIUMpy-polars/tests/unit/io/test_parquet.py140 # Create a dataframe with 3 chunks:
MEDIUMpy-polars/tests/unit/io/test_delta_deletion_vector.py27# This file contains temporary homegrown logic with the sole purpose of generating
MEDIUM…s/unit/operations/namespaces/temporal/test_datetime.py615 # Define a DataFrame with columns for datetime, date, and time
MEDIUMpy-polars/tests/unit/sql/test_set_ops.py111 # Create a context and register the tables
MEDIUMpy-polars/src/polars/_plr.py1# This module represents the Rust API functions exposed to Python through PyO3. We do a
MEDIUM…ython/user-guide/expressions/user-defined-functions.py108 # Create a struct that has two columns in it:
MEDIUM.github/workflows/release-python.yml10 # Create the sdist and build the wheels, but do not publish to PyPI / GitHub.
Excessive Try-Catch Wrapping25 hits · 26 pts
SeverityFileLineSnippet
LOWpy-polars/tests/unit/io/test_skip_batch_predicate.py195 except Exception as _:
LOWpy-polars/tests/unit/io/test_skip_batch_predicate.py228 except Exception as _:
LOWpy-polars/tests/unit/io/test_delta_deletion_vector.py216 except Exception:
LOWpy-polars/tests/unit/io/test_multiscan.py226 except Exception as _:
LOWpy-polars/tests/unit/meta/test_api.py139 except Exception:
LOWpy-polars/src/polars/_cpu_check.py66 except Exception:
LOWpy-polars/src/polars/series/utils.py185 except Exception:
LOWpy-polars/src/polars/datatypes/convert.py352 except Exception:
LOWpy-polars/src/polars/catalog/unity/client.py665 except Exception as e:
LOWpy-polars/src/polars/io/plugins.py86 except Exception as e:
LOWpy-polars/src/polars/io/database/_executor.py249 except Exception as err:
LOWpy-polars/src/polars/io/iceberg/_dataset.py172 except Exception as error:
LOWpy-polars/src/polars/io/iceberg/_utils.py395 except Exception as e:
LOW…rs/src/polars/io/cloud/credential_provider/_builder.py220 except Exception as e:
LOW…/src/polars/io/cloud/credential_provider/_providers.py427 except Exception as e:
LOW…/src/polars/io/cloud/credential_provider/_providers.py492 except Exception:
MEDIUM…/src/polars/io/cloud/credential_provider/_providers.py489def _azcli_version(cls) -> str | None:
LOWpy-polars/src/polars/meta/versions.py117 except Exception:
LOWpy-polars/src/polars/convert/general.py1158 except Exception as exc:
LOWpy-polars/src/polars/lazyframe/frame.py832 except Exception:
MEDIUMpy-polars/src/polars/lazyframe/frame.py822def _repr_html_(self) -> str:
LOWdocs/source/_build/scripts/people.py35 except Exception as e:
LOWdocs/source/src/python/user-guide/io/hive.py79except Exception as e:
LOW…urce/src/python/user-guide/expressions/categoricals.py156except Exception as e:
LOWdocs/source/src/python/user-guide/lazy/schema.py19except Exception as e:
Synthetic Comment Markers2 hits · 12 pts
SeverityFileLineSnippet
HIGH…stream/src/nodes/io_sources/ipc/record_batch_decode.rs35 // Rows as requested, relative to the start of the Record Batch.
HIGHdocs/source/development/contributing/index.md307- If your contribution contains code generated by AI you **must**:
Fake / Example Data8 hits · 12 pts
SeverityFileLineSnippet
LOWcrates/polars/tests/it/io/csv.rs418-86.64408227,"Lorem Ipsum is simply dummy text of the printing and typesetting
LOWcrates/polars/tests/it/io/csv.rs419industry. Lorem Ipsum has been the industry's standard dummy text ever since th
LOWcrates/polars/tests/it/io/csv.rs423in the 1960s with the release of Letraset sheets containing Lorem Ipsum passages,
LOWcrates/polars/tests/it/io/csv.rs425versions of Lorem Ipsum.",11
LOWcrates/polars/tests/it/io/csv.rs436 r#"Lorem Ipsum is simply dummy text of the printing and typesetting
LOWcrates/polars/tests/it/io/csv.rs437industry. Lorem Ipsum has been the industry's standard dummy text ever since th
LOWcrates/polars/tests/it/io/csv.rs441in the 1960s with the release of Letraset sheets containing Lorem Ipsum passages,
LOWcrates/polars/tests/it/io/csv.rs443versions of Lorem Ipsum."#,
Redundant / Tautological Comments7 hits · 10 pts
SeverityFileLineSnippet
LOWpy-polars/tests/unit/io/test_delta_deletion_vector.py260 # Set statistics to pre-deletion-vector values
LOWpy-polars/tests/unit/operations/test_is_in.py250 # Check if empty list is converted to pl.String
LOW…rs/tests/unit/operations/arithmetic/test_arithmetic.py211 # Check if fused is turned off for literals see: #9857
LOWpy-polars/tests/unit/lazyframe/test_cse.py899 # Check if output is stable
LOWpy-polars/tests/docs/run_doctest.py116 # Set doctests to fail on warnings
LOWpy-polars/src/polars/_utils/various.py155 # Check if an object is a sequence of `tp`, only sniffing the first element.
LOWdocs/source/_build/scripts/macro.py183 # Check if file exists for the language
Slop Phrases3 hits · 5 pts
SeverityFileLineSnippet
LOW…ts/unit/operations/map/test_inefficient_map_warning.py576 # make sure to keep the `^` and `$`, and the assertion on `len(warnings)`
LOWdocs/source/src/python/polars-cloud/remote-query.py41 # make sure to enter your own workspace name
MEDIUM…le/derive_expression/expression_lib/src/expressions.rs205/// This expression is for demonstration purposes as we have a dedicated
Dead Code1 hit · 2 pts
SeverityFileLineSnippet
MEDIUMpy-polars/tests/unit/interop/test_arrow_stream_error.py22
Verbosity Indicators1 hit · 2 pts
SeverityFileLineSnippet
LOWcrates/polars-io/src/path_utils/mod.rs223 // We need to check if it is a directory for local paths (we can be here due
Overly Generic Function Names1 hit · 1 pts
SeverityFileLineSnippet
LOWpy-polars/src/polars/lazyframe/opt_flags.py290 def helper(f: QueryOptFlags, field_name: str, value: bool) -> QueryOptFlags: # noqa: FBT001