MCPcopy
hub / github.com/dask/dask / FromArray

Class FromArray

dask/dataframe/dask_expr/io/io.py:633–719  ·  view source on GitHub ↗

Source from the content-addressed store, hash-verified

631
632
633class FromArray(PartitionsFiltered, BlockwiseIO):
634 _parameters = [
635 "frame",
636 "chunksize",
637 "original_columns",
638 "meta",
639 "columns",
640 "_partitions",
641 ]
642 _defaults = {
643 "chunksize": 50_000,
644 "original_columns": None,
645 "meta": None,
646 "columns": None,
647 "_partitions": None,
648 }
649 _absorb_projections = True
650
651 @functools.cached_property
652 def _meta(self):
653 meta = _meta_from_array(
654 self.frame, self.operand("original_columns"), self.operand("meta")
655 )
656 if self.operand("columns") is not None:
657 return meta[self.operand("columns")]
658 return meta
659
660 @functools.cached_property
661 def original_columns(self):
662 if self.operand("original_columns") is None:
663 if is_series_like(self._meta):
664 return [0]
665 return list(range(len(self._meta.columns)))
666 return self.operand("original_columns")
667
668 @functools.cached_property
669 def _column_indices(self):
670 if self.operand("columns") is None:
671 return slice(0, len(self.original_columns))
672 return [
673 i
674 for i, col in enumerate(self.original_columns)
675 if col in self.operand("columns")
676 ]
677
678 def _divisions(self):
679 divisions = tuple(range(0, len(self.frame), self.chunksize))
680 divisions = divisions + (len(self.frame) - 1,)
681 return divisions
682
683 @functools.cached_property
684 def unfiltered_divisions(self):
685 return self._divisions()
686
687 def _filtered_task(self, name: Key, index: int) -> Task:
688 data = self.frame[slice(index * self.chunksize, (index + 1) * self.chunksize)]
689 if index == len(self.unfiltered_divisions) - 2:
690 idx = range(

Callers 1

from_arrayFunction · 0.90

Calls

no outgoing calls

Tested by

no test coverage detected

Used in the wild real call sites across dependent graphs

searching dependent graphs…