Commit bcb99d5

authored

Zip Strict for pandas/core/computation and pandas/core/groupby #62469 (#62510)

1 parent 0557e16 commit bcb99d5 (Copy full SHA for bcb99d5)

File tree

7 files changed

+25

-21

lines changed

pandas/core
- computation
- groupby

7 files changed

+25

-21

lines changed

`‎pandas/core/computation/align.py‎`

Lines changed: 2 additions & 2 deletions

Original file line number	Diff line number	Diff line change
`@@ -93,7 +93,7 @@ def _align_core(terms):`
`93`	`93`
`94`	`94`	`from pandas import Series`
`95`	`95`
`96`		`- ndims = Series(dict(zip(term_index, term_dims)))`
	`96`	`+ ndims = Series(dict(zip(term_index, term_dims, strict=True)))`
`97`	`97`
`98`	`98`	`# initial axes are the axes of the largest-axis'd term`
`99`	`99`	`biggest = terms[ndims.idxmax()].value`
`@@ -116,7 +116,7 @@ def _align_core(terms):`
`116`	`116`	`axes[ax] = axes[ax].union(itm)`
`117`	`117`
`118`	`118`	`for i, ndim in ndims.items():`
`119`		`- for axis, items in zip(range(ndim), axes):`
	`119`	`+ for axis, items in zip(range(ndim), axes, strict=False):`
`120`	`120`	`ti = terms[i].value`
`121`	`121`
`122`	`122`	`if hasattr(ti, "reindex"):`

`‎pandas/core/computation/expr.py‎`

Lines changed: 3 additions & 3 deletions

Original file line number	Diff line number	Diff line change
`@@ -383,11 +383,11 @@ class BaseExprVisitor(ast.NodeVisitor):`
`383`	`383`	`"FloorDiv",`
`384`	`384`	`"Mod",`
`385`	`385`	`)`
`386`		`- binary_op_nodes_map = dict(zip(binary_ops, binary_op_nodes))`
	`386`	`+ binary_op_nodes_map = dict(zip(binary_ops, binary_op_nodes, strict=True))`
`387`	`387`
`388`	`388`	`unary_ops = UNARY_OPS_SYMS`
`389`	`389`	`unary_op_nodes = "UAdd", "USub", "Invert", "Not"`
`390`		`- unary_op_nodes_map = dict(zip(unary_ops, unary_op_nodes))`
	`390`	`+ unary_op_nodes_map = dict(zip(unary_ops, unary_op_nodes, strict=True))`
`391`	`391`
`392`	`392`	`rewrite_map = {`
`393`	`393`	`ast.Eq: ast.In,`
`@@ -731,7 +731,7 @@ def visit_Compare(self, node, **kwargs):`
`731`	`731`	`# recursive case: we have a chained comparison, a CMP b CMP c, etc.`
`732`	`732`	`left = node.left`
`733`	`733`	`values = []`
`734`		`- for op, comp in zip(ops, comps):`
	`734`	`+ for op, comp in zip(ops, comps, strict=True):`
`735`	`735`	`new_node = self.visit(`
`736`	`736`	`ast.Compare(comparators=[comp], left=left, ops=[self.translate_In(op)])`
`737`	`737`	`)`

`‎pandas/core/computation/ops.py‎`

Lines changed: 4 additions & 4 deletions

Original file line number	Diff line number	Diff line change
`@@ -302,11 +302,11 @@ def _not_in(x, y):`
`302`	`302`	`_in,`
`303`	`303`	`_not_in,`
`304`	`304`	`)`
`305`		`-_cmp_ops_dict = dict(zip(CMP_OPS_SYMS, _cmp_ops_funcs))`
	`305`	`+_cmp_ops_dict = dict(zip(CMP_OPS_SYMS, _cmp_ops_funcs, strict=True))`
`306`	`306`
`307`	`307`	`BOOL_OPS_SYMS = ("&", "|", "and", "or")`
`308`	`308`	`_bool_ops_funcs = (operator.and_, operator.or_, operator.and_, operator.or_)`
`309`		`-_bool_ops_dict = dict(zip(BOOL_OPS_SYMS, _bool_ops_funcs))`
	`309`	`+_bool_ops_dict = dict(zip(BOOL_OPS_SYMS, _bool_ops_funcs, strict=True))`
`310`	`310`
`311`	`311`	`ARITH_OPS_SYMS = ("+", "-", "*", "/", "**", "//", "%")`
`312`	`312`	`_arith_ops_funcs = (`
`@@ -318,7 +318,7 @@ def _not_in(x, y):`
`318`	`318`	`operator.floordiv,`
`319`	`319`	`operator.mod,`
`320`	`320`	`)`
`321`		`-_arith_ops_dict = dict(zip(ARITH_OPS_SYMS, _arith_ops_funcs))`
	`321`	`+_arith_ops_dict = dict(zip(ARITH_OPS_SYMS, _arith_ops_funcs, strict=True))`
`322`	`322`
`323`	`323`	`_binary_ops_dict = {}`
`324`	`324`
`@@ -484,7 +484,7 @@ def _disallow_scalar_only_bool_ops(self) -> None:`
`484`	`484`
`485`	`485`	`UNARY_OPS_SYMS = ("+", "-", "~", "not")`
`486`	`486`	`_unary_ops_funcs = (operator.pos, operator.neg, operator.invert, operator.invert)`
`487`		`-_unary_ops_dict = dict(zip(UNARY_OPS_SYMS, _unary_ops_funcs))`
	`487`	`+_unary_ops_dict = dict(zip(UNARY_OPS_SYMS, _unary_ops_funcs, strict=True))`
`488`	`488`
`489`	`489`
`490`	`490`	`class UnaryOp(Op):`

`‎pandas/core/groupby/generic.py‎`

Lines changed: 1 addition & 1 deletion

Original file line number	Diff line number	Diff line change
`@@ -536,7 +536,7 @@ def _aggregate_multiple_funcs(self, arg, *args, **kwargs) -> DataFrame:`
`536`	`536`	`else:`
`537`	`537`	`# list of functions / function names`
`538`	`538`	`columns = (com.get_callable_name(f) or f for f in arg)`
`539`		`- arg = zip(columns, arg)`
	`539`	`+ arg = zip(columns, arg, strict=True)`
`540`	`540`
`541`	`541`	`results: dict[base.OutputKey, DataFrame | Series] = {}`
`542`	`542`	`with com.temp_setattr(self, "as_index", True):`

`‎pandas/core/groupby/groupby.py‎`

Lines changed: 5 additions & 1 deletion

Original file line number	Diff line number	Diff line change
`@@ -682,7 +682,10 @@ def get_converter(s):`
`682`	`682`	`raise ValueError(msg) from err`
`683`	`683`
`684`	`684`	`converters = (get_converter(s) for s in index_sample)`
`685`		`- names = (tuple(f(n) for f, n in zip(converters, name)) for name in names)`
	`685`	`+ names = (`
	`686`	`+ tuple(f(n) for f, n in zip(converters, name, strict=True))`
	`687`	`+ for name in names`
	`688`	`+ )`
`686`	`689`
`687`	`690`	`else:`
`688`	`691`	`converter = get_converter(index_sample)`
`@@ -1235,6 +1238,7 @@ def _insert_inaxis_grouper(`
`1235`	`1238`	`zip(`
`1236`	`1239`	`reversed(self._grouper.names),`
`1237`	`1240`	`self._grouper.get_group_levels(),`
	`1241`	`+ strict=True,`
`1238`	`1242`	`)`
`1239`	`1243`	`):`
`1240`	`1244`	`if name is None:`

`‎pandas/core/groupby/grouper.py‎`

Lines changed: 3 additions & 3 deletions

Original file line number	Diff line number	Diff line change
`@@ -684,9 +684,9 @@ def groups(self) -> dict[Hashable, Index]:`
`684`	`684`
`685`	`685`	`r, counts = libalgos.groupsort_indexer(ensure_platform_int(codes), len(uniques))`
`686`	`686`	`counts = ensure_int64(counts).cumsum()`
`687`		`- _result = (r[start:end] for start, end in zip(counts, counts[1:]))`
	`687`	`+ _result = (r[start:end] for start, end in zip(counts, counts[1:], strict=False))`
`688`	`688`	`# map to the label`
`689`		`- result = {k: self._index.take(v) for k, v in zip(uniques, _result)}`
	`689`	`+ result = {k: self._index.take(v) for k, v in zip(uniques, _result, strict=True)}`
`690`	`690`
`691`	`691`	`return PrettyDict(result)`
`692`	`692`
`@@ -875,7 +875,7 @@ def is_in_obj(gpr) -> bool:`
`875`	`875`	`return gpr._mgr.references_same_values(obj_gpr_column._mgr, 0)`
`876`	`876`	`return False`
`877`	`877`
`878`		`- for gpr, level in zip(keys, levels):`
	`878`	`+ for gpr, level in zip(keys, levels, strict=True):`
`879`	`879`	`if is_in_obj(gpr): # df.groupby(df['name'])`
`880`	`880`	`in_axis = True`
`881`	`881`	`exclusions.add(gpr.name)`

`‎pandas/core/groupby/ops.py‎`

Lines changed: 7 additions & 7 deletions

Original file line number	Diff line number	Diff line change
`@@ -625,7 +625,7 @@ def get_iterator(self, data: NDFrameT) -> Iterator[tuple[Hashable, NDFrameT]]:`
`625`	`625`	`splitter = self._get_splitter(data)`
`626`	`626`	`# TODO: Would be more efficient to skip unobserved for transforms`
`627`	`627`	`keys = self.result_index`
`628`		`- yield from zip(keys, splitter)`
	`628`	`+ yield from zip(keys, splitter, strict=True)`
`629`	`629`
`630`	`630`	`@final`
`631`	`631`	`def _get_splitter(self, data: NDFrame) -> DataSplitter:`
`@@ -766,7 +766,7 @@ def result_index_and_ids(self) -> tuple[Index, npt.NDArray[np.intp]]:`
`766`	`766`	`]`
`767`	`767`	`sorts = [ping._sort for ping in self.groupings]`
`768`	`768`	`# When passed a categorical grouping, keep all categories`
`769`		`- for k, (ping, level) in enumerate(zip(self.groupings, levels)):`
	`769`	`+ for k, (ping, level) in enumerate(zip(self.groupings, levels, strict=True)):`
`770`	`770`	`if ping._passed_categorical:`
`771`	`771`	`levels[k] = level.set_categories(ping._orig_cats)`
`772`	`772`
`@@ -997,7 +997,7 @@ def apply_groupwise(`
`997`	`997`	`result_values = []`
`998`	`998`
`999`	`999`	`# This calls DataSplitter.__iter__`
`1000`		`- zipped = zip(group_keys, splitter)`
	`1000`	`+ zipped = zip(group_keys, splitter, strict=True)`
`1001`	`1001`
`1002`	`1002`	`for key, group in zipped:`
`1003`	`1003`	`# Pinning name is needed for`
`@@ -1095,7 +1095,7 @@ def groups(self):`
`1095`	`1095`	`# GH 3881`
`1096`	`1096`	`result = {`
`1097`	`1097`	`key: value`
`1098`		`- for key, value in zip(self.binlabels, self.bins)`
	`1098`	`+ for key, value in zip(self.binlabels, self.bins, strict=True)`
`1099`	`1099`	`if key is not NaT`
`1100`	`1100`	`}`
`1101`	`1101`	`return result`
`@@ -1126,7 +1126,7 @@ def get_iterator(self, data: NDFrame):`
`1126`	`1126`	`slicer = lambda start, edge: data.iloc[start:edge]`
`1127`	`1127`
`1128`	`1128`	`start: np.int64 | int = 0`
`1129`		`- for edge, label in zip(self.bins, self.binlabels):`
	`1129`	`+ for edge, label in zip(self.bins, self.binlabels, strict=True):`
`1130`	`1130`	`if label is not NaT:`
`1131`	`1131`	`yield label, slicer(start, edge)`
`1132`	`1132`	`start = edge`
`@@ -1139,7 +1139,7 @@ def indices(self):`
`1139`	`1139`	`indices = collections.defaultdict(list)`
`1140`	`1140`
`1141`	`1141`	`i: np.int64 | int = 0`
`1142`		`- for label, bin in zip(self.binlabels, self.bins):`
	`1142`	`+ for label, bin in zip(self.binlabels, self.bins, strict=True):`
`1143`	`1143`	`if i < bin:`
`1144`	`1144`	`if label is not NaT:`
`1145`	`1145`	`indices[label] = list(range(i, bin))`
`@@ -1229,7 +1229,7 @@ def __iter__(self) -> Iterator:`
`1229`	`1229`
`1230`	`1230`	`starts, ends = lib.generate_slices(self._slabels, self.ngroups)`
`1231`	`1231`	`sdata = self._sorted_data`
`1232`		`- for start, end in zip(starts, ends):`
	`1232`	`+ for start, end in zip(starts, ends, strict=True):`
`1233`	`1233`	`yield self._chop(sdata, slice(start, end))`
`1234`	`1234`
`1235`	`1235`	`@cache_readonly`

0 commit comments

Comments

(0)

Navigation Menu

Search code, repositories, users, issues, pull requests...

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Uh oh!

Commit bcb99d5

File tree

7 files changed

7 files changed

`‎pandas/core/computation/align.py‎`

`‎pandas/core/computation/expr.py‎`

`‎pandas/core/computation/ops.py‎`

`‎pandas/core/groupby/generic.py‎`

`‎pandas/core/groupby/groupby.py‎`

`‎pandas/core/groupby/grouper.py‎`

`‎pandas/core/groupby/ops.py‎`

0 commit comments