You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
The ZipCodes_Stops_PiP_cuSpatial notebook is failing on 24.08 and 24.10, with the most recent nightlies of cuspatial and all its dependencies for those versions.
TypeError Traceback (most recent call last)
File /tmp/tmp.q8TobhA9hO/ZipCodes_Stops_PiP_cuSpatial-test.py:302
299 zipcode_quadtree.set_polygon(d_states, poly_column='geometry')
301 # Join state and zip code boundaries
--> 302 zipcode_by_state = zipcode_quadtree.point_left_join_polygon(["WKT", "ZCTA5CE10"], ["STUSPS"])
...
File copying.pyx:154, in cudf._lib.copying.gather()
File column.pyx:463, in cudf._lib.column.Column.to_pylibcudf()
File column.pyx:493, in cudf._lib.column.Column.to_pylibcudf()
File types.pyx:284, in cudf._lib.types.dtype_to_pylibcudf_type()
TypeError: data type 'geometry' not understood
full stacktrace (click me)
TypeError Traceback (most recent call last)
File /tmp/tmp.xjCxaX16y8/ZipCodes_Stops_PiP_cuSpatial-test.py:302
299 zipcode_quadtree.set_polygon(d_states, poly_column='geometry')
301 # Join state and zip code boundaries
--> 302 zipcode_by_state = zipcode_quadtree.point_left_join_polygon(["WKT", "ZCTA5CE10"], ["STUSPS"])
304 # Get Californian zipcodes
305 CA_zipcode = zipcode_by_state[zipcode_by_state.STUSPS == 'CA']
File /tmp/tmp.xjCxaX16y8/ZipCodes_Stops_PiP_cuSpatial-test.py:281, in QuadTree.point_left_join_polygon(self, point_columns, polygon_columns)
279 points = self.points(point_columns)
280 polygons = self.polygons(polygon_columns)
--> 281 joined = points.merge(polygons, on=["polygon_index", "point_index"], how="left")
282 joined = joined.drop(["polygon_index", "point_index"], axis=1)
283 return cuspatial.GeoDataFrame(joined)
File /opt/conda/envs/test/lib/python3.11/site-packages/cudf/utils/performance_tracking.py:51, in _performance_tracking.<locals>.wrapper(*args, **kwargs)
43 if nvtx.enabled():
44 stack.enter_context(
45 nvtx.annotate(
46 message=func.__qualname__,
(...)
49 )
50 )
---> 51 return func(*args, **kwargs)
File /opt/conda/envs/test/lib/python3.11/site-packages/cudf/core/dataframe.py:4296, in DataFrame.merge(self, right, how, on, left_on, right_on, left_index, right_index, sort, suffixes, indicator, validate)
4281 elif how in {"leftsemi", "leftanti"}:
4282 merge_cls = MergeSemi
4284 return merge_cls(
4285 lhs,
4286 rhs,
4287 on=on,
4288 left_on=left_on,
4289 right_on=right_on,
4290 left_index=left_index,
4291 right_index=right_index,
4292 how=how,
4293 sort=sort,
4294 indicator=indicator,
4295 suffixes=suffixes,
-> 4296 ).perform_merge()
File /opt/conda/envs/test/lib/python3.11/site-packages/cudf/core/join/join.py:285, in Merge.perform_merge(self)
278 left_rows, right_rows = self._gather_maps(
279 left_join_cols, right_join_cols
280 )
281 gather_kwargs = {
282 "keep_index": self._using_left_index or self._using_right_index,
283 }
284 left_result = (
--> 285 self.lhs._gather(
286 GatherMap.from_column_unchecked(
287 left_rows, len(self.lhs), nullify=True
288 ),
289 **gather_kwargs,
290 )
291 if left_rows is not None
292 else cudf.DataFrame._from_data({})
293 )
294 del left_rows
295 right_result = (
296 self.rhs._gather(
297 GatherMap.from_column_unchecked(
(...)
303 else cudf.DataFrame._from_data({})
304 )
File /opt/conda/envs/test/lib/python3.11/site-packages/cuspatial/core/geodataframe.py:220, in GeoDataFrame._gather(self, gather_map, keep_index)
217 geo_gathered = GeoDataFrame(gathered)
219 # combine
--> 220 result = GeoDataFrame(
221 self._recombine_columns(geo_gathered, cudf_gathered)
222 )
223 result.index = geo_gathered.index
224 # return
File /opt/conda/envs/test/lib/python3.11/site-packages/cuspatial/core/geodataframe.py:54, in GeoDataFrame.__init__(self, data)
52 except TypeError:
53 pass
---> 54 super()._init_from_dict_like(
55 data, index=self.index if len(self.index) > 0 else None
56 )
57 elif data is None:
58 pass
File /opt/conda/envs/test/lib/python3.11/site-packages/cudf/utils/performance_tracking.py:51, in _performance_tracking.<locals>.wrapper(*args, **kwargs)
43 if nvtx.enabled():
44 stack.enter_context(
45 nvtx.annotate(
46 message=func.__qualname__,
(...)
49 )
50 )
---> 51 return func(*args, **kwargs)
File /opt/conda/envs/test/lib/python3.11/site-packages/cudf/core/dataframe.py:1068, in DataFrame._init_from_dict_like(self, data, index, columns, nan_as_null)
1058 empty_column = functools.partial(
1059 cudf.core.column.column_empty,
1060 row_count=(0 if index is None else len(index)),
1061 masked=index is not None,
1062 )
1064 data = {
1065 c: data[c] if c in data else empty_column() for c in columns
1066 }
-> 1068 data, index = self._align_input_series_indices(data, index=index)
1070 if index is None:
1071 num_rows = 0
File /opt/conda/envs/test/lib/python3.11/site-packages/cudf/utils/performance_tracking.py:51, in _performance_tracking.<locals>.wrapper(*args, **kwargs)
43 if nvtx.enabled():
44 stack.enter_context(
45 nvtx.annotate(
46 message=func.__qualname__,
(...)
49 )
50 )
---> 51 return func(*args, **kwargs)
File /opt/conda/envs/test/lib/python3.11/site-packages/cudf/core/dataframe.py:1143, in DataFrame._align_input_series_indices(data, index)
1137 aligned_input_series = [
1138 sr._align_to_index(index, how="right", sort=False)
1139 for sr in input_series
1140 ]
1142 else:
-> 1143 aligned_input_series = cudf.core.series._align_indices(
1144 input_series
1145 )
1146 index = aligned_input_series[0].index
1148 data = data.copy()
File /opt/conda/envs/test/lib/python3.11/site-packages/cudf/utils/performance_tracking.py:51, in _performance_tracking.<locals>.wrapper(*args, **kwargs)
43 if nvtx.enabled():
44 stack.enter_context(
45 nvtx.annotate(
46 message=func.__qualname__,
(...)
49 )
50 )
---> 51 return func(*args, **kwargs)
File /opt/conda/envs/test/lib/python3.11/site-packages/cudf/core/series.py:5157, in _align_indices(series_list, how, allow_non_unique)
5154 combined_index.names = new_index_names
5156 # align all Series to the combined index
-> 5157 result = [
5158 sr._align_to_index(
5159 combined_index, how=how, allow_non_unique=allow_non_unique
5160 )
5161 for sr in series_list
5162 ]
5164 return result
File /opt/conda/envs/test/lib/python3.11/site-packages/cudf/core/series.py:5158, in <listcomp>(.0)
5154 combined_index.names = new_index_names
5156 # align all Series to the combined index
5157 result = [
-> 5158 sr._align_to_index(
5159 combined_index, how=how, allow_non_unique=allow_non_unique
5160 )
5161 for sr in series_list
5162 ]
5164 return result
File /opt/conda/envs/test/lib/python3.11/site-packages/cudf/core/indexed_frame.py:3690, in IndexedFrame._align_to_index(self, index, how, sort, allow_non_unique)
3687 elif how == "right":
3688 rhs[sort_col_id] = as_column(range(len(rhs)))
-> 3690 result = lhs.join(rhs, how=how, sort=sort)
3691 if how in ("left", "right"):
3692 result = result.sort_values(sort_col_id)
File /opt/conda/envs/test/lib/python3.11/site-packages/cudf/utils/performance_tracking.py:51, in _performance_tracking.<locals>.wrapper(*args, **kwargs)
43 if nvtx.enabled():
44 stack.enter_context(
45 nvtx.annotate(
46 message=func.__qualname__,
(...)
49 )
50 )
---> 51 return func(*args, **kwargs)
File /opt/conda/envs/test/lib/python3.11/site-packages/cudf/core/dataframe.py:4349, in DataFrame.join(self, other, on, how, lsuffix, rsuffix, sort, validate)
4344 elif validate is not None:
4345 raise NotImplementedError(
4346 "The validate parameter is not yet supported"
4347 )
-> 4349 df = self.merge(
4350 other,
4351 left_index=True,
4352 right_index=True,
4353 how=how,
4354 suffixes=(lsuffix, rsuffix),
4355 sort=sort,
4356 )
4357 df.index.name = (
4358 None if self.index.name != other.index.name else self.index.name
4359 )
4360 return df
File /opt/conda/envs/test/lib/python3.11/site-packages/cudf/utils/performance_tracking.py:51, in _performance_tracking.<locals>.wrapper(*args, **kwargs)
43 if nvtx.enabled():
44 stack.enter_context(
45 nvtx.annotate(
46 message=func.__qualname__,
(...)
49 )
50 )
---> 51 return func(*args, **kwargs)
File /opt/conda/envs/test/lib/python3.11/site-packages/cudf/core/dataframe.py:4296, in DataFrame.merge(self, right, how, on, left_on, right_on, left_index, right_index, sort, suffixes, indicator, validate)
4281 elif how in {"leftsemi", "leftanti"}:
4282 merge_cls = MergeSemi
4284 return merge_cls(
4285 lhs,
4286 rhs,
4287 on=on,
4288 left_on=left_on,
4289 right_on=right_on,
4290 left_index=left_index,
4291 right_index=right_index,
4292 how=how,
4293 sort=sort,
4294 indicator=indicator,
4295 suffixes=suffixes,
-> 4296 ).perform_merge()
File /opt/conda/envs/test/lib/python3.11/site-packages/cudf/core/join/join.py:285, in Merge.perform_merge(self)
278 left_rows, right_rows = self._gather_maps(
279 left_join_cols, right_join_cols
280 )
281 gather_kwargs = {
282 "keep_index": self._using_left_index or self._using_right_index,
283 }
284 left_result = (
--> 285 self.lhs._gather(
286 GatherMap.from_column_unchecked(
287 left_rows, len(self.lhs), nullify=True
288 ),
289 **gather_kwargs,
290 )
291 if left_rows is not None
292 else cudf.DataFrame._from_data({})
293 )
294 del left_rows
295 right_result = (
296 self.rhs._gather(
297 GatherMap.from_column_unchecked(
(...)
303 else cudf.DataFrame._from_data({})
304 )
File /opt/conda/envs/test/lib/python3.11/site-packages/cudf/core/indexed_frame.py:2958, in IndexedFrame._gather(self, gather_map, keep_index)
2955 if not gather_map.nullify and len(self) != gather_map.nrows:
2956 raise IndexError("Gather map is out of bounds")
2957 return self._from_columns_like_self(
-> 2958 libcudf.copying.gather(
2959 list(self.index._columns + self._columns)
2960 if keep_index
2961 else list(self._columns),
2962 gather_map.column,
2963 nullify=gather_map.nullify,
2964 ),
2965 self._column_names,
2966 self.index.names if keep_index else None,
2967 )
File /opt/conda/envs/test/lib/python3.11/contextlib.py:81, in ContextDecorator.__call__.<locals>.inner(*args, **kwds)
78 @wraps(func)
79 def inner(*args, **kwds):
80 with self._recreate_cm():
---> 81 return func(*args, **kwds)
File copying.pyx:154, in cudf._lib.copying.gather()
File column.pyx:463, in cudf._lib.column.Column.to_pylibcudf()
File column.pyx:493, in cudf._lib.column.Column.to_pylibcudf()
File types.pyx:284, in cudf._lib.types.dtype_to_pylibcudf_type()
TypeError: data type 'geometry' not understood
Version
24.08
On which installation method(s) does this occur?
Conda
Describe the issue
The ZipCodes_Stops_PiP_cuSpatial notebook is failing on 24.08 and 24.10, with the most recent nightlies of cuspatial and all its dependencies for those versions.
full stacktrace (click me)
(24.08 build link)
(24.10 build link)
Minimum reproducible example
No response
Relevant log output
No response
Environment details
print_env.sh output (click me)
Other/Misc.
Discovered here: #1422 (review)
The text was updated successfully, but these errors were encountered: