diff --git a/src/cuda_histogram/axis/__init__.py b/src/cuda_histogram/axis/__init__.py
index 0613cc2..cdb3d2a 100644
--- a/src/cuda_histogram/axis/__init__.py
+++ b/src/cuda_histogram/axis/__init__.py
@@ -1,12 +1,13 @@
 from __future__ import annotations
 
 import functools
-import numbers
 import re
 import warnings
+from typing import Any, Iterable
 
-import awkward
+import boost_histogram.axis as bha
 import cupy
+import hist
 import numpy as np
 
 __all__: list[str] = [
@@ -32,21 +33,11 @@
 )
 
 
-def _overflow_behavior(overflow):
-    if overflow == "none":
-        return slice(1, -2)
-    elif overflow == "under":
-        return slice(None, -2)
-    elif overflow == "over":
+def _overflow_behavior(flow):
+    if not flow:
         return slice(1, -1)
-    elif overflow == "all":
-        return slice(None, -1)
-    elif overflow == "allnan":
-        return slice(None)
-    elif overflow == "justnan":
-        return slice(-1, None)
     else:
-        raise ValueError(f"Unrecognized overflow behavior: {overflow}")
+        return slice(None, None)
 
 
 @functools.total_ordering
@@ -383,27 +374,7 @@ def identifiers(self):
         return [self._bins[k] for k in self._sorted]
 
 
-class DenseAxis(Axis):
-    """
-    DenseAxis: ABC for a fixed-size densely-indexed axis
-
-    Derived should implement:
-        **index(identifier)** - return an index
-
-        **__eq__(axis)** - axis has same definition and binning
-
-        **__getitem__(index)** - return an identifier
-
-        **_ireduce(slice)** - return a slice or list of indices, input slice to be interpred as values
-
-        **reduced(islice)** - return a new axis with binning corresponding to the index slice (from _ireduce)
-
-    TODO: hasoverflow(), not all dense axes might have an overflow concept,
-    currently it is implicitly assumed they do (as the only dense type is a numeric axis)
-    """
-
-
-class Bin(DenseAxis):
+class Regular(hist.axis.Regular, family="cuda_histogram"):
     """A binned axis with name, label, and binning.
 
     Parameters
@@ -425,295 +396,84 @@ class Bin(DenseAxis):
     Bin boundaries are [lo, hi)
     """
 
-    def __init__(self, name, label, n_or_arr, lo=None, hi=None):
-        super().__init__(name, label)
-        self._lazy_intervals = None
-        if isinstance(n_or_arr, (list, np.ndarray, cupy.ndarray)):
-            self._uniform = False
-            self._bins = cupy.array(n_or_arr, dtype="d")
-            if not all(np.sort(self._bins) == self._bins):
-                raise ValueError("Binning not sorted!")
-            self._lo = self._bins[0]
-            self._hi = self._bins[-1]
-            # to make searchsorted differentiate inf from nan
-            self._bins = cupy.append(self._bins, cupy.inf)
-            self._interval_bins = cupy.r_[-cupy.inf, self._bins, cupy.nan]
-            self._bin_names = np.full(self._interval_bins[:-1].size, None)
-        elif isinstance(n_or_arr, numbers.Integral):
-            if lo is None or hi is None:
-                raise TypeError(
-                    "Interpreting n_or_arr as uniform binning, please specify lo and hi values"
-                )
-            self._uniform = True
-            self._lo = lo
-            self._hi = hi
-            self._bins = n_or_arr
-            self._interval_bins = cupy.r_[
-                -cupy.inf,
-                cupy.linspace(self._lo, self._hi, self._bins + 1),
-                cupy.inf,
-                cupy.nan,
-            ]
-            self._bin_names = np.full(self._interval_bins[:-1].size, None)
-        else:
-            raise TypeError(
-                f"Cannot understand n_or_arr (nbins or binning array) type {n_or_arr!r}"
-            )
-
-    @property
-    def _intervals(self):
-        if not hasattr(self, "_lazy_intervals") or self._lazy_intervals is None:
-            self._lazy_intervals = [
-                Interval(low, high, bin)
-                for low, high, bin in zip(
-                    self._interval_bins[:-1], self._interval_bins[1:], self._bin_names
-                )
-            ]
-        return self._lazy_intervals
-
-    def __getstate__(self):
-        if hasattr(self, "_lazy_intervals") and self._lazy_intervals is not None:
-            self._bin_names = np.array(
-                [interval.label for interval in self._lazy_intervals]
-            )
-        self.__dict__.pop("_lazy_intervals", None)
-        return self.__dict__
-
-    def __setstate__(self, d):
-        if "_intervals" in d:  # convert old hists to new serialization format
-            _old_intervals = d.pop("_intervals")
-            interval_bins = [i._lo for i in _old_intervals] + [_old_intervals[-1]._hi]
-            d["_interval_bins"] = cupy.array(interval_bins)
-            d["_bin_names"] = np.array([interval._label for interval in _old_intervals])
-        if "_interval_bins" in d and "_bin_names" not in d:
-            d["_bin_names"] = np.full(d["_interval_bins"][:-1].size, None)
-        self.__dict__ = d
-
-    def index(self, identifier):
-        """Index of a identifier or label
-
-        Parameters
-        ----------
-            identifier : float or Interval or np.ndarray
-                The identifier(s) to lookup.  Supports vectorized
-                calls when a numpy 1D array of numbers is passed.
-
-        Returns an integer corresponding to the index in the axis where the histogram would be filled.
-        The integer range includes flow bins: ``0 = underflow, n+1 = overflow, n+2 = nanflow``
-        """
-        isarray = isinstance(identifier, (awkward.Array, cupy.ndarray, np.ndarray))
-        if isarray or isinstance(identifier, numbers.Number):
-            identifier = awkward.to_cupy(identifier)  # cupy.asarray(identifier)
-            if self._uniform:
-                idx = None
-                if isarray:
-                    idx = cupy.zeros_like(identifier)
-                    _clip_bins(float(self._bins), self._lo, self._hi, identifier, idx)
-                else:
-                    idx = np.clip(
-                        np.floor(
-                            (identifier - self._lo)
-                            * float(self._bins)
-                            / (self._hi - self._lo)
-                        )
-                        + 1,
-                        0,
-                        self._bins + 1,
-                    )
-
-                if isinstance(idx, (cupy.ndarray, np.ndarray)):
-                    _replace_nans(
-                        self.size - 1,
-                        idx if idx.dtype.kind == "f" else idx.astype(cupy.float32),
-                    )
-                    idx = idx.astype(int)
-                elif np.isnan(idx):
-                    idx = self.size - 1
-                else:
-                    idx = int(idx)
-                return idx
-            else:
-                return cupy.searchsorted(self._bins, identifier, side="right")
-        elif isinstance(identifier, Interval):
-            if identifier.nan():
-                return self.size - 1
-            for idx, interval in enumerate(self._intervals):
-                if (
-                    interval._lo <= identifier._lo
-                    or cupy.isclose(interval._lo, identifier._lo)
-                ) and (
-                    interval._hi >= identifier._hi
-                    or cupy.isclose(interval._hi, identifier._hi)
-                ):
-                    return idx
-            raise ValueError(
-                f"Axis {self!r} has no interval that fully contains identifier {identifier!r}"
-            )
-        raise TypeError("Request bin indices with a identifier or 1-D array only")
-
-    def __eq__(self, other):
-        if isinstance(other, DenseAxis):
-            if not super().__eq__(other):
-                return False
-            if self._uniform != other._uniform:
-                return False
-            if self._uniform and self._bins != other._bins:
-                return False
-            if not self._uniform and not all(self._bins == other._bins):  # noqa: SIM103
-                return False
-            return True
-        return super().__eq__(other)
-
-    def __getitem__(self, index):
-        return self._intervals[index]
-
-    def _ireduce(self, the_slice):
-        if isinstance(the_slice, numbers.Number):
-            the_slice = slice(the_slice, the_slice)
-        elif isinstance(the_slice, Interval):
-            if the_slice.nan():
-                return slice(-1, None)
-            lo = the_slice._lo if the_slice._lo > -np.inf else None
-            hi = the_slice._hi if the_slice._hi < np.inf else None
-            the_slice = slice(lo, hi)
-        if isinstance(the_slice, slice):
-            blo, bhi = None, None
-            if the_slice.start is not None:
-                if the_slice.start < self._lo:
-                    raise ValueError(
-                        f"Reducing along axis {self!r}: requested start {the_slice.start!r} exceeds bin boundaries (use open slicing, e.g. x[:stop])"
-                    )
-                if self._uniform:
-                    blo_real = (the_slice.start - self._lo) * self._bins / (
-                        self._hi - self._lo
-                    ) + 1
-                    blo = np.clip(np.round(blo_real).astype(int), 0, self._bins + 1)
-                    if abs(blo - blo_real) > 1.0e-14:
-                        warnings.warn(
-                            f"Reducing along axis {self!r}: requested start {the_slice.start!r} between bin boundaries, no interpolation is performed",
-                            RuntimeWarning,
-                        )
-                else:
-                    if the_slice.start not in self._bins:
-                        warnings.warn(
-                            f"Reducing along axis {self!r}: requested start {the_slice.start!r} between bin boundaries, no interpolation is performed",
-                            RuntimeWarning,
-                        )
-                    blo = self.index(the_slice.start)
-            if the_slice.stop is not None:
-                if the_slice.stop > self._hi:
-                    raise ValueError(
-                        f"Reducing along axis {self!r}: requested stop {the_slice.stop!r} exceeds bin boundaries (use open slicing, e.g. x[start:])"
-                    )
-                if self._uniform:
-                    bhi_real = (the_slice.stop - self._lo) * self._bins / (
-                        self._hi - self._lo
-                    ) + 1
-                    bhi = np.clip(np.round(bhi_real).astype(int), 0, self._bins + 1)
-                    if abs(bhi - bhi_real) > 1.0e-14:
-                        warnings.warn(
-                            f"Reducing along axis {self!r}: requested stop {the_slice.stop!r} between bin boundaries, no interpolation is performed",
-                            RuntimeWarning,
-                        )
-                else:
-                    if the_slice.stop not in self._bins:
-                        warnings.warn(
-                            f"Reducing along axis {self!r}: requested stop {the_slice.stop!r} between bin boundaries, no interpolation is performed",
-                            RuntimeWarning,
-                        )
-                    bhi = self.index(the_slice.stop)
-                # Assume null ranges (start==stop) mean we want the bin containing the value
-                if blo is not None and blo == bhi:
-                    bhi += 1
-            if the_slice.step is not None:
-                raise NotImplementedError(
-                    "Step slicing can be interpreted as a rebin factor"
-                )
-            return slice(blo, bhi, the_slice.step)
-        elif isinstance(the_slice, list) and all(
-            isinstance(v, Interval) for v in the_slice
-        ):
-            raise NotImplementedError("Slice histogram from list of intervals")
-        raise IndexError(f"Cannot understand slice {the_slice!r} on axis {self!r}")
-
-    def reduced(self, islice):
-        """Return a new axis with reduced binning
-
-        The new binning corresponds to the slice made on this axis.
-        Overflow will be taken care of by ``Hist.__getitem__``
-
-        Parameters
-        ----------
-            islice : slice
-                ``islice.start`` and ``islice.stop`` should be None or within ``[1, ax.size() - 1]``
-                This slice is usually as returned from ``Bin._ireduce``
-        """
-        if islice.step is not None:
-            raise NotImplementedError(
-                "Step slicing can be interpreted as a rebin factor"
-            )
-        if islice.start is None and islice.stop is None:
-            return self
-        if self._uniform:
-            lo = self._lo
-            ilo = 0
-            if islice.start is not None:
-                lo += (islice.start - 1) * (self._hi - self._lo) / self._bins
-                ilo = islice.start - 1
-            hi = self._hi
-            ihi = self._bins
-            if islice.stop is not None:
-                hi = self._lo + (islice.stop - 1) * (self._hi - self._lo) / self._bins
-                ihi = islice.stop - 1
-            bins = ihi - ilo
-            # TODO: remove this once satisfied it works
-            rbins = (hi - lo) * self._bins / (self._hi - self._lo)
-            assert abs(bins - rbins) < 1e-14, "%d %f %r" % (bins, rbins, self)
-            return Bin(self._name, self._label, bins, lo, hi)
-        else:
-            lo = None if islice.start is None else islice.start - 1
-            hi = -1 if islice.stop is None else islice.stop
-            bins = self._bins[slice(lo, hi)]
-            return Bin(self._name, self._label, bins)
-
-    @property
-    def size(self):
-        """Number of bins, including overflow (i.e. ``n + 3``)"""
-        if self._uniform:
-            return self._bins + 3
-        # (inf added at constructor)
-        return len(self._bins) + 1
+    def __init__(
+        self,
+        bins: int,
+        start: float,
+        stop: float,
+        *,
+        name: str = "",
+        label: str = "",
+        metadata: Any = None,
+        flow: bool = True,
+        underflow: bool | None = None,
+        overflow: bool | None = None,
+        growth: bool = False,
+        circular: bool = False,
+        # pylint: disable-next=redefined-outer-name
+        transform: bha.transform.AxisTransform | None = None,
+        __dict__: dict[str, Any] | None = None,
+    ) -> None:
+        super().__init__(
+            bins,
+            start,
+            stop,
+            metadata=metadata,
+            underflow=flow if underflow is None else underflow,
+            overflow=flow if overflow is None else overflow,
+            growth=growth,
+            circular=circular,
+            transform=transform,
+            __dict__=__dict__,
+        )
+        self._ax.metadata["name"] = name
+        self.label: str = label
 
-    def edges(self, overflow="none"):
-        """Bin boundaries
 
-        Parameters
-        ----------
-            overflow : str
-                Create overflow and/or underflow bins by adding a bin of same width to each end.
-                See `Hist.sum` description for the allowed values.
-        """
-        if self._uniform:
-            out = cupy.linspace(self._lo, self._hi, self._bins + 1)
-        else:
-            out = self._bins[:-1].copy()
-        out = cupy.r_[
-            2 * out[0] - out[1], out, 2 * out[-1] - out[-2], 3 * out[-1] - 2 * out[-2]
-        ]
-        return out[_overflow_behavior(overflow)]
+class Variable(hist.axis.Variable, family="cuda_histogram"):
+    """A binned axis with name, label, and binning.
 
-    def centers(self, overflow="none"):
-        """Bin centers
+    Parameters
+    ----------
+        name : str
+            is used as a keyword in histogram filling, immutable
+        label : str
+            describes the meaning of the axis, can be changed
+        n_or_arr : int or list or np.ndarray
+            Integer number of bins, if uniform binning. Otherwise, a list or
+            numpy 1D array of bin boundaries.
+        lo : float, optional
+            lower boundary of bin range, if uniform binning
+        hi : float, optional
+            upper boundary of bin range, if uniform binning
 
-        Parameters
-        ----------
-            overflow : str
-                Create overflow and/or underflow bins by adding a bin of same width to each end.
-                See `Hist.sum` description for the allowed values.
-        """
-        edges = self.edges(overflow)
-        return (edges[:-1] + edges[1:]) / 2
+    This axis will generate frequencies for n+3 bins, special bin indices:
+    ``0 = underflow, n+1 = overflow, n+2 = nanflow``
+    Bin boundaries are [lo, hi)
+    """
 
-    def identifiers(self, overflow="none"):
-        """List of `Interval` identifiers"""
-        return self._intervals[_overflow_behavior(overflow)]
+    def __init__(
+        self,
+        edges: Iterable[float],
+        *,
+        name: str = "",
+        label: str = "",
+        metadata: Any = None,
+        flow: bool = True,
+        underflow: bool | None = None,
+        overflow: bool | None = None,
+        growth: bool = False,
+        circular: bool = False,
+        __dict__: dict[str, Any] | None = None,
+    ) -> None:
+        super().__init__(
+            edges,
+            metadata=metadata,
+            underflow=flow if underflow is None else underflow,
+            overflow=flow if overflow is None else overflow,
+            growth=growth,
+            circular=circular,
+            __dict__=__dict__,
+        )
+        self._ax.metadata["name"] = name
+        self.label: str = label
diff --git a/src/cuda_histogram/hist.py b/src/cuda_histogram/hist.py
index 1f28c2e..c7c649e 100644
--- a/src/cuda_histogram/hist.py
+++ b/src/cuda_histogram/hist.py
@@ -1,744 +1,158 @@
 from __future__ import annotations
 
-import copy
 import numbers
-import warnings
-from abc import ABCMeta, abstractmethod
-from collections import namedtuple
-from collections.abc import Sequence
+from typing import Any
 
 import awkward
+import boost_histogram.axis as bha
 import cupy
+import hist
 import numpy as np
 
 from cuda_histogram.axis import (
-    Axis,
-    Bin,
-    Cat,
-    DenseAxis,
-    Interval,
-    SparseAxis,
     _overflow_behavior,
 )
 
 __all__: list[str] = ["Hist"]
 
-_MaybeSumSlice = namedtuple("_MaybeSumSlice", ["start", "stop", "sum"])
 
-
-def _assemble_blocks(array, ndslice, depth=0):
-    """
-    Turns an n-dimensional slice of array (tuple of slices)
-     into a nested list of numpy arrays that can be passed to np.block()
-
-    Under the assumption that index 0 of any dimension is underflow, -2 overflow, -1 nanflow,
-     this function will add the range not in the slice to the appropriate (over/under)flow bins
+class Hist(hist.Hist):
     """
-    if depth == 0:
-        ndslice = [_MaybeSumSlice(s.start, s.stop, False) for s in ndslice]
-    if depth == len(ndslice):
-        slice_op = tuple(slice(s.start, s.stop) for s in ndslice)
-        sum_op = tuple(i for i, s in enumerate(ndslice) if s.sum)
-        return array[slice_op].sum(axis=sum_op, keepdims=True)
-    slist = []
-    newslice = ndslice[:]
-    if ndslice[depth].start is not None:
-        newslice[depth] = _MaybeSumSlice(None, ndslice[depth].start, True)
-        slist.append(_assemble_blocks(array, newslice, depth + 1))
-    newslice[depth] = _MaybeSumSlice(ndslice[depth].start, ndslice[depth].stop, False)
-    slist.append(_assemble_blocks(array, newslice, depth + 1))
-    if ndslice[depth].stop is not None:
-        newslice[depth] = _MaybeSumSlice(ndslice[depth].stop, -1, True)
-        slist.append(_assemble_blocks(array, newslice, depth + 1))
-        newslice[depth] = _MaybeSumSlice(-1, None, False)
-        slist.append(_assemble_blocks(array, newslice, depth + 1))
-    return slist
-
-
-class AccumulatorABC(metaclass=ABCMeta):
-    """Abstract base class for an accumulator
-
-    Accumulators are abstract objects that enable the reduce stage of the typical map-reduce
-    scaleout that we do in Coffea. One concrete example is a histogram. The idea is that an
-    accumulator definition holds enough information to be able to create an empty accumulator
-    (the ``identity()`` method) and add two compatible accumulators together (the ``add()`` method).
-    The former is not strictly necessary, but helps with book-keeping. Here we show an example usage
-    of a few accumulator types. An arbitrary-depth nesting of dictionary accumulators is supported, much
-    like the behavior of directories in ROOT hadd.
-
-    After defining an accumulator::
-
-        from coffea.processor import dict_accumulator, column_accumulator, defaultdict_accumulator
-        from cuda_histogram import Hist, Bin
-        import numpy as np
-
-        adef = dict_accumulator({
-            'cutflow': defaultdict_accumulator(int),
-            'pt': Hist("counts", Bin("pt", "$p_T$", 100, 0, 100)),
-            'final_pt': column_accumulator(np.zeros(shape=(0,))),
-        })
-
-    Notice that this function does not mutate ``adef``::
-
-        def fill(n):
-            ptvals = np.random.exponential(scale=30, size=n)
-            cut = ptvals > 200.
-            acc = adef.identity()
-            acc['cutflow']['pt>200'] += cut.sum()
-            acc['pt'].fill(pt=ptvals)
-            acc['final_pt'] += column_accumulator(ptvals[cut])
-            return acc
-
-    As such, we can execute it several times in parallel and reduce the result::
-
-        import concurrent.futures
-        with concurrent.futures.ThreadPoolExecutor() as executor:
-            outputs = executor.map(fill, [2000, 2000])
-
-        combined = sum(outputs, adef.identity())
-
-
-    Derived classes must implement
-        - ``identity()``: returns a new object of same type as self,
-          such that ``self + self.identity() == self``
-        - ``add(other)``: adds an object of same type as self to self
-
-    Concrete implementations are then provided for ``__add__``, ``__radd__``, and ``__iadd__``.
-    """
-
-    @abstractmethod
-    def identity(self):
-        """Identity of the accumulator
-
-        A value such that any other value added to it will return
-        the other value
-        """
-
-    @abstractmethod
-    def add(self, other):
-        """Add another accumulator to this one in-place"""
-
-    def __add__(self, other):
-        ret = self.identity()
-        ret.add(self)
-        ret.add(other)
-        return ret
+    Construct a new histogram.
 
-    def __radd__(self, other):
-        ret = self.identity()
-        ret.add(other)
-        ret.add(self)
-        return ret
-
-    def __iadd__(self, other):
-        self.add(other)
-        return self
-
-
-class Hist(AccumulatorABC):
-    """
-    Specify a multidimensional histogram.
+    If you pass in a single argument, this will be treated as a
+    histogram and this will convert the histogram to this type of
+    histogram.
 
     Parameters
     ----------
-        label : str
-            A description of the meaning of the sum of weights
-        ``*axes``
-            positional list of `Cat` or `Bin` objects, denoting the axes of the histogram
-        axes : collections.abc.Sequence
-            list of `Cat` or `Bin` objects, denoting the axes of the histogram (overridden by ``*axes``)
-        dtype : str
-            Underlying numpy dtype to use for storing sum of weights
-
-    Examples
-    --------
-
-    Creating a histogram with a sparse axis, and two dense axes::
-
-        import cuda_histogram as chist
-
-        h = chist.Hist("Observed bird count",
-                             chist.Cat("species", "Bird species"),
-                             chist.Bin("x", "x coordinate [m]", 20, -5, 5),
-                             chist.Bin("y", "y coordinate [m]", 20, -5, 5),
-                             )
-
-        # or
-
-        h = chist.Hist(label="Observed bird count",
-                             axes=(chist.Cat("species", "Bird species"),
-                                   chist.Bin("x", "x coordinate [m]", 20, -5, 5),
-                                   chist.Bin("y", "y coordinate [m]", 20, -5, 5),
-                                  )
-                             )
-
-        # or
-
-        h = chist.Hist(axes=[chist.Cat("species", "Bird species"),
-                                   chist.Bin("x", "x coordinate [m]", 20, -5, 5),
-                                   chist.Bin("y", "y coordinate [m]", 20, -5, 5),
-                                  ],
-                             label="Observed bird count",
-                             )
-
-    which produces:
-
-    >>> h
-    <Hist (species,x,y) instance at 0x10d84b550>
-
+    *args : Axis
+        Provide 1 or more axis instances.
+    storage : Storage = bh.storage.Double()  -- not implemented
+        Select a storage to use in the histogram
+    metadata : Any = None
+        Data that is passed along if a new histogram is created
+    data: np.typing.NDArray[Any] = None  -- not implemented
+        Data to be filled in the histogram
+    label: str = None
+        Histogram's label
+    name: str = None
+        Histogram's name
     """
 
-    #: Default numpy dtype to store sum of weights
-    DEFAULT_DTYPE = "d"
-
-    def __init__(self, label, *axes, **kwargs):
-        if not isinstance(label, str):
-            raise TypeError("label must be a string")
-        self._label = label
-        self._dtype = kwargs.get("dtype", Hist.DEFAULT_DTYPE)
-        self._axes = axes
-        if len(axes) == 0 and "axes" in kwargs:
-            if not isinstance(kwargs["axes"], Sequence):
-                raise TypeError("axes must be a sequence type! (tuple, list, etc.)")
-            self._axes = tuple(kwargs["axes"])
-        elif len(axes) != 0 and "axes" in kwargs:
-            warnings.warn(
-                "axes defined by both positional arguments and keyword argument, using positional arguments"
-            )
-
-        if not all(isinstance(ax, Axis) for ax in self._axes):
-            del self._axes
-            raise TypeError("All axes must be derived from Axis class")
-        # if we stably partition axes to sparse, then dense, some things simplify
-        # ..but then the user would then see the order change under them
+    def __init__(
+        self,
+        *axes,
+        storage=None,
+        metadata: Any = None,
+        data: np.typing.NDArray[Any] | None = None,
+        label: str | None = None,
+        name: str | None = None,
+    ) -> None:
+        super().__init__(
+            *axes, storage=storage, metadata=metadata, data=data, label=label, name=name
+        )
         self._dense_shape = tuple(
-            [ax.size for ax in self._axes if isinstance(ax, DenseAxis)]
+            [ax.size for ax in self.axes if isinstance(ax, (bha.Regular, bha.Variable))]
         )
-        if np.prod(self._dense_shape) > 10000000:
-            warnings.warn("Allocating a large (>10M bin) histogram!", RuntimeWarning)
-        self._sumw = {}
+        self._sumw = cupy.zeros(shape=self._dense_shape)
         # Storage of sumw2 starts at first use of weight keyword in fill()
         self._sumw2 = None
-
-    def __repr__(self):
-        return "<{} ({}) instance at 0x{:0x}>".format(
-            self.__class__.__name__,
-            ",".join(d.name for d in self.axes()),
-            id(self),
-        )
-
-    @property
-    def label(self):
-        """A label describing the meaning of the sum of weights"""
-        return self._label
-
-    @label.setter
-    def label(self, label):
-        self._label = label
-
-    def copy(self, content=True):
-        """Create a deep copy
-
-        Parameters
-        ----------
-            content : bool
-                If set false, only the histogram definition is copied, resetting
-                the sum of weights to zero
-        """
-        out = Hist(self._label, *self._axes, dtype=self._dtype)
-        if self._sumw2 is not None:
-            out._sumw2 = {}
-        if content:
-            out._sumw = copy.deepcopy(self._sumw)
-            out._sumw2 = copy.deepcopy(self._sumw2)
-        return out
-
-    def identity(self):
-        """The identity (zero value) of this accumulator"""
-        return self.copy(content=False)
-
-    def clear(self):
-        """Clear all content in this histogram"""
-        self._sumw = {}
-        self._sumw2 = None
-
-    def axis(self, axis_name):
-        """Get an ``Axis`` object"""
-        if axis_name in self._axes:
-            return self._axes[self._axes.index(axis_name)]
-        raise KeyError(f"No axis {axis_name} found in {self!r}")
-
-    def axes(self):
-        """Get all axes in this histogram"""
-        return self._axes
-
-    @property
-    def fields(self):
-        """This is a stub for histbook compatibility"""
-        return [ax.name for ax in self._axes]
-
-    def dim(self):
-        """Dimension of this histogram (number of axes)"""
-        return len(self._axes)
+        self._overflows = cupy.array(0)
+        self._underflows = cupy.array(0)
 
     def dense_dim(self):
         """Dense dimension of this histogram (number of non-sparse axes)"""
         return len(self._dense_shape)
 
-    def sparse_dim(self):
-        """Sparse dimension of this histogram (number of sparse axes)"""
-        return self.dim() - self.dense_dim()
-
-    def dense_axes(self):
-        """All dense axes"""
-        return [ax for ax in self._axes if isinstance(ax, DenseAxis)]
-
-    def sparse_axes(self):
-        """All sparse axes"""
-        return [ax for ax in self._axes if isinstance(ax, SparseAxis)]
-
-    def sparse_nbins(self):
-        """Total number of sparse bins"""
-        return len(self._sumw)
-
-    def _idense(self, axis):
-        return self.dense_axes().index(axis)
-
-    def _isparse(self, axis):
-        return self.sparse_axes().index(axis)
-
     def _init_sumw2(self):
-        self._sumw2 = {}
-        for key in self._sumw:
-            self._sumw2[key] = self._sumw[key].copy()
-
-    def compatible(self, other):
-        """Checks if this histogram is compatible with another, i.e. they have identical binning"""
-        if self.dim() != other.dim():
-            return False
-        if {d.name for d in self.sparse_axes()} != {
-            d.name for d in other.sparse_axes()
-        }:
-            return False
-        if not all(d1 == d2 for d1, d2 in zip(self.dense_axes(), other.dense_axes())):  # noqa: SIM103
-            return False
-        return True
-
-    def add(self, other):
-        """Add another histogram into this one, in-place"""
-        if not self.compatible(other):
-            raise ValueError(
-                f"Cannot add this histogram with histogram {other!r} of dissimilar dimensions"
-            )
-
-        raxes = other.sparse_axes()
-
-        def add_dict(left, right):
-            for rkey in right:
-                lkey = tuple(
-                    self.axis(rax).index(rax[ridx]) for rax, ridx in zip(raxes, rkey)
-                )
-                if lkey in left:
-                    left[lkey] += right[rkey]
-                else:
-                    left[lkey] = copy.deepcopy(right[rkey])
-
-        if self._sumw2 is None and other._sumw2 is None:
-            pass
-        elif self._sumw2 is None:
-            self._init_sumw2()
-            add_dict(self._sumw2, other._sumw2)
-        elif other._sumw2 is None:
-            add_dict(self._sumw2, other._sumw)
-        else:
-            add_dict(self._sumw2, other._sumw2)
-        add_dict(self._sumw, other._sumw)
-        return self
+        self._sumw2 = cupy.zeros(shape=self._dense_shape)
 
     def __getitem__(self, keys):
-        if not isinstance(keys, tuple):
-            keys = (keys,)
-        if len(keys) > self.dim():
-            raise IndexError("Too many indices for this histogram")
-        elif len(keys) < self.dim():
-            if Ellipsis in keys:
-                idx = keys.index(Ellipsis)
-                slices = (slice(None),) * (self.dim() - len(keys) + 1)
-                keys = keys[:idx] + slices + keys[idx + 1 :]
-            else:
-                slices = (slice(None),) * (self.dim() - len(keys))
-                keys += slices
-        sparse_idx = []
-        dense_idx = []
-        new_dims = []
-        for s, ax in zip(keys, self._axes):
-            if isinstance(ax, SparseAxis):
-                sparse_idx.append(ax._ireduce(s))
-                new_dims.append(ax)
-            else:
-                islice = ax._ireduce(s)
-                dense_idx.append(islice)
-                new_dims.append(ax.reduced(islice))
-        dense_idx = tuple(dense_idx)
-
-        def dense_op(array):
-            as_numpy = array.get()
-            blocked = np.block(_assemble_blocks(as_numpy, dense_idx))
-            return cupy.asarray(blocked)
-
-        out = Hist(self._label, *new_dims, dtype=self._dtype)
-        if self._sumw2 is not None:
-            out._init_sumw2()
-        for sparse_key in self._sumw:
-            if not all(k in idx for k, idx in zip(sparse_key, sparse_idx)):
-                continue
-            if sparse_key in out._sumw:
-                out._sumw[sparse_key] += dense_op(self._sumw[sparse_key])
-                if self._sumw2 is not None:
-                    out._sumw2[sparse_key] += dense_op(self._sumw2[sparse_key])
-            else:
-                out._sumw[sparse_key] = dense_op(self._sumw[sparse_key]).copy()
-                if self._sumw2 is not None:
-                    out._sumw2[sparse_key] = dense_op(self._sumw2[sparse_key]).copy()
-        return out
+        if isinstance(keys, int):
+            return self._sumw[keys]
+        else:
+            raise ValueError("Convert the histogram to CPU to access full UHI")
 
-    def fill(self, **values):
-        """Fill sum of weights from columns
+    def fill(self, *args, weight=None):
+        """
+        Insert data into the histogram.
 
         Parameters
         ----------
-            ``**values``
-                Keyword arguments, one for each axis name, of either flat numpy arrays
-                (for dense dimensions) or literals (for sparse dimensions) which will
-                be used to fill bins at the corresponding indices.
-
-        Note
-        ----
-            The reserved keyword ``weight``, if specified, will increment sum of weights
-            by the given column values, which must be broadcastable to the same dimension as all other
-            columns.  Upon first use, this will trigger the storage of the sum of squared weights.
-
-
-        Examples
-        --------
-
-        Filling the histogram from the `Hist` example:
-
-        >>> h.fill(species='ducks', x=np.random.normal(size=10), y=np.random.normal(size=10), weight=np.ones(size=10) * 3)
-
+        *args : Union[Array[float], Array[int], Array[str], float, int, str]  -- only arrays of numbers supported
+            Provide one value or array per dimension
+        weight : List[Union[Array[float], Array[int], float, int, str]]]  -- not supported
+            Provide weights (only if the histogram storage supports it)
         """
-        weight = values.pop("weight", None)
         if isinstance(weight, (awkward.Array, cupy.ndarray, np.ndarray)):
             weight = cupy.array(weight)
         if isinstance(weight, numbers.Number):
             weight = cupy.atleast_1d(weight)
-        if not all(d.name in values for d in self._axes):
-            missing = ", ".join(d.name for d in self._axes if d.name not in values)
-            raise ValueError(
-                f"Not all axes specified for {self!r}.  Missing: {missing}"
-            )
-        if not all(name in self._axes for name in values):
-            extra = ", ".join(name for name in values if name not in self._axes)
-            raise ValueError(
-                f"Unrecognized axes specified for {self!r}.  Extraneous: {extra}"
+        if not isinstance(args, str) and len(args) != len(self.axes):
+            raise TypeError(
+                f"Cannot fill {len(self.axis)} axes with {len(args)} arrays."
             )
 
         if weight is not None and self._sumw2 is None:
             self._init_sumw2()
 
-        sparse_key = tuple(d.index(values[d.name]) for d in self.sparse_axes())
-        if sparse_key not in self._sumw:
-            self._sumw[sparse_key] = cupy.zeros(
-                shape=self._dense_shape, dtype=self._dtype
-            )
-            if self._sumw2 is not None:
-                self._sumw2[sparse_key] = cupy.zeros(
-                    shape=self._dense_shape, dtype=self._dtype
-                )
-
         if self.dense_dim() > 0:
+            self._overflows = tuple(
+                sum(value > d.edges[-1])
+                for d, value in zip(self.axes, args)
+                if isinstance(d, (bha.Regular, bha.Variable))
+            )
+            self._underflows = tuple(
+                sum(value < d.edges[0])
+                for d, value in zip(self.axes, args)
+                if isinstance(d, (bha.Regular, bha.Variable))
+            )
             dense_indices = tuple(
-                cupy.asarray(d.index(values[d.name]))
-                for d in self._axes
-                if isinstance(d, DenseAxis)
+                cupy.asarray(d.index(value))[
+                    (value > d.edges[0]) & (value < d.edges[-1])
+                ]
+                for d, value in zip(self.axes, args)
+                if isinstance(d, (bha.Regular, bha.Variable))
             )
             xy = cupy.atleast_1d(
                 cupy.ravel_multi_index(dense_indices, self._dense_shape)
             )
             if weight is not None:
-                self._sumw[sparse_key][:] += cupy.bincount(
+                self._sumw[:] += cupy.bincount(
                     xy, weights=weight, minlength=np.array(self._dense_shape).prod()
                 ).reshape(self._dense_shape)
-                self._sumw2[sparse_key][:] += cupy.bincount(
+                self._sumw2[:] += cupy.bincount(
                     xy,
                     weights=weight**2,
                     minlength=np.array(self._dense_shape).prod(),
                 ).reshape(self._dense_shape)
             else:
-                self._sumw[sparse_key][:] += cupy.bincount(
+                self._sumw[:] += cupy.bincount(
                     xy, weights=None, minlength=np.array(self._dense_shape).prod()
                 ).reshape(self._dense_shape)
                 if self._sumw2 is not None:
-                    self._sumw2[sparse_key][:] += cupy.bincount(
+                    self._sumw2[:] += cupy.bincount(
                         xy,
                         weights=None,
                         minlength=np.array(self._dense_shape).prod(),
                     ).reshape(self._dense_shape)
         elif weight is not None:
-            self._sumw[sparse_key] += cupy.sum(weight)
-            self._sumw2[sparse_key] += cupy.sum(weight**2)
+            self._sumw += cupy.sum(weight)
+            self._sumw2 += cupy.sum(weight**2)
         else:
-            self._sumw[sparse_key] += 1.0
+            self._sumw += 1.0
             if self._sumw2 is not None:
-                self._sumw2[sparse_key] += 1.0
-
-    def sum(self, *axes, **kwargs):
-        """Integrates out a set of axes, producing a new histogram
-
-        Parameters
-        ----------
-            ``*axes``
-                Positional list of axes to integrate out (either a string or an Axis object)
-
-            overflow : {'none', 'under', 'over', 'all', 'allnan'}, optional
-                How to treat the overflow bins in the sum.  Only applies to dense axes.
-                'all' includes both under- and over-flow but not nan-flow bins.
-                Default is 'none'.
-        """
-        overflow = kwargs.pop("overflow", "none")
-        axes = [self.axis(ax) for ax in axes]
-        reduced_dims = [ax for ax in self._axes if ax not in axes]
-        out = Hist(self._label, *reduced_dims, dtype=self._dtype)
-        if self._sumw2 is not None:
-            out._init_sumw2()
-
-        sparse_drop = []
-        dense_slice = [slice(None)] * self.dense_dim()
-        dense_sum_dim = []
-        for axis in axes:
-            if isinstance(axis, DenseAxis):
-                idense = self._idense(axis)
-                dense_sum_dim.append(idense)
-                dense_slice[idense] = _overflow_behavior(overflow)
-            elif isinstance(axis, SparseAxis):
-                isparse = self._isparse(axis)
-                sparse_drop.append(isparse)
-        dense_slice = tuple(dense_slice)
-        dense_sum_dim = tuple(dense_sum_dim)
-
-        def dense_op(array):
-            if len(dense_sum_dim) > 0:
-                return np.sum(array[dense_slice], axis=dense_sum_dim)
-            return array
-
-        for key in self._sumw:
-            new_key = tuple(k for i, k in enumerate(key) if i not in sparse_drop)
-            if new_key in out._sumw:
-                out._sumw[new_key] += dense_op(self._sumw[key])
-                if self._sumw2 is not None:
-                    out._sumw2[new_key] += dense_op(self._sumw2[key])
-            else:
-                out._sumw[new_key] = dense_op(self._sumw[key]).copy()
-                if self._sumw2 is not None:
-                    out._sumw2[new_key] = dense_op(self._sumw2[key]).copy()
-        return out
-
-    def project(self, *axes, **kwargs):
-        """Project histogram onto a subset of its axes
-
-        Parameters
-        ----------
-            ``*axes`` : str or Axis
-                Positional list of axes to project on to
-            overflow : str
-                Controls behavior of integration over remaining axes.
-                See `sum` description for meaning of allowed values
-                Default is to *not include* overflow bins
-        """
-        overflow = kwargs.pop("overflow", "none")
-        axes = [self.axis(ax) for ax in axes]
-        toremove = [ax for ax in self.axes() if ax not in axes]
-        return self.sum(*toremove, overflow=overflow)
-
-    def integrate(self, axis_name, int_range=None, overflow="none"):
-        """Integrates current histogram along one dimension
-
-        Parameters
-        ----------
-            axis_name : str or Axis
-                Which dimension to reduce on
-            int_range : slice
-                Any slice, list, string, or other object that the axis will understand
-                Default is to integrate over the whole range
-            overflow : str
-                See `sum` description for meaning of allowed values
-                Default is to *not include* overflow bins
-
-        """
-        if int_range is None:
-            int_range = slice(None)
-        axis = self.axis(axis_name)
-        full_slice = tuple(
-            slice(None) if ax != axis else int_range for ax in self._axes
-        )
-        if isinstance(int_range, Interval):
-            # Handle overflow intervals nicely
-            if int_range.nan():
-                overflow = "justnan"
-            elif int_range.lo == -np.inf:
-                overflow = "under"
-            elif int_range.hi == np.inf:
-                overflow = "over"
-        return self[full_slice].sum(
-            axis.name, overflow=overflow
-        )  # slice may make new axis, use name
-
-    def remove(self, bins, axis):
-        """Remove bins from a sparse axis
-
-        Parameters
-        ----------
-            bins : iterable
-                A list of bin identifiers to remove
-            axis : str or Axis
-                Axis name or SparseAxis instance
-
-        Returns a *copy* of the histogram with specified bins removed, not an in-place operation
-        """
-        axis = self.axis(axis)
-        if not isinstance(axis, SparseAxis):
-            raise NotImplementedError(
-                "Hist.remove() only supports removing items from a sparse axis."
-            )
-        bins = [axis.index(binid) for binid in bins]
-        keep = [binid.name for binid in self.identifiers(axis) if binid not in bins]
-        full_slice = tuple(slice(None) if ax != axis else keep for ax in self._axes)
-        return self[full_slice]
-
-    def group(self, old_axes, new_axis, mapping, overflow="none"):
-        """Group a set of slices on old axes into a single new axis
-
-        Parameters
-        ----------
-            old_axes
-                Axis or tuple of axes which are being grouped
-            new_axis
-                A new sparse dimension definition, e.g. a `Cat` instance
-            mapping : dict
-                A mapping ``{'new_bin': (slice, ...), ...}`` where each
-                slice is on the axes being re-binned.  In the case of
-                a single axis for ``old_axes``, ``{'new_bin': slice, ...}``
-                is admissible.
-            overflow : str
-                See `sum` description for meaning of allowed values
-                Default is to *not include* overflow bins
-
-        Returns a new histogram object
-        """
-        if not isinstance(new_axis, SparseAxis):
-            raise TypeError(
-                "New axis must be a sparse axis.  Note: Hist.group() signature has changed to group(old_axes, new_axis, ...)!"
-            )
-        if new_axis in self.axes() and self.axis(new_axis) is new_axis:
-            raise RuntimeError(
-                "new_axis is already in the list of axes.  Note: Hist.group() signature has changed to group(old_axes, new_axis, ...)!"
-            )
-        if not isinstance(old_axes, tuple):
-            old_axes = (old_axes,)
-        old_axes = [self.axis(ax) for ax in old_axes]
-        old_indices = [i for i, ax in enumerate(self._axes) if ax in old_axes]
-        new_dims = [new_axis] + [ax for ax in self._axes if ax not in old_axes]
-        out = Hist(self._label, *new_dims, dtype=self._dtype)
-        if self._sumw2 is not None:
-            out._init_sumw2()
-        for new_cat in mapping:
-            the_slice = mapping[new_cat]
-            if not isinstance(the_slice, tuple):
-                the_slice = (the_slice,)
-            if len(the_slice) != len(old_axes):
-                raise Exception("Slicing does not match number of axes being rebinned")
-            full_slice = [slice(None)] * self.dim()
-            for idx, s in zip(old_indices, the_slice):
-                full_slice[idx] = s
-            full_slice = tuple(full_slice)
-            reduced_hist = self[full_slice].sum(
-                *tuple(ax.name for ax in old_axes), overflow=overflow
-            )  # slice may change old axis binning
-            new_idx = new_axis.index(new_cat)
-            for key in reduced_hist._sumw:
-                new_key = (new_idx, *key)
-                out._sumw[new_key] = reduced_hist._sumw[key]
-                if self._sumw2 is not None:
-                    out._sumw2[new_key] = reduced_hist._sumw2[key]
-        return out
-
-    def rebin(self, old_axis, new_axis):
-        """Rebin a dense axis
-
-        This function will construct the mapping from old to new axis, and
-        constructs a new histogram, rebinning the sum of weights along that dimension.
-
-        Note
-        ----
-        No interpolation is performed, so the user must be sure the old
-        and new axes have compatible bin boundaries, e.g. that they evenly
-        divide each other.
+                self._sumw2 += 1.0
 
-        Parameters
-        ----------
-            old_axis : str or Axis
-                Axis to rebin
-            new_axis : str or Axis or int
-                A DenseAxis object defining the new axis (e.g. a `Bin` instance).
-                If a number N is supplied, the old axis edges are downsampled by N,
-                resulting in a histogram with ``old_nbins // N`` bins.
-
-        Returns a new `Hist` object.
+    def values(self, flow: bool = False):
         """
-        old_axis = self.axis(old_axis)
-        if isinstance(new_axis, numbers.Integral):
-            new_axis = Bin(old_axis.name, old_axis.label, old_axis.edges()[::new_axis])
-        new_dims = [ax if ax != old_axis else new_axis for ax in self._axes]
-        out = Hist(self._label, *new_dims, dtype=self._dtype)
-        if self._sumw2 is not None:
-            out._init_sumw2()
-
-        # would have been nice to use ufunc.reduceat, but we should support arbitrary reshuffling
-        idense = self._idense(old_axis)
-
-        def view_ax(idx):
-            fullindex = [slice(None)] * self.dense_dim()
-            fullindex[idense] = idx
-            return tuple(fullindex)
-
-        binmap = [new_axis.index(i) for i in old_axis.identifiers(overflow="allnan")]
-
-        def dense_op(array):
-            anew = np.zeros(out._dense_shape, dtype=out._dtype)
-            for iold, inew in enumerate(binmap):
-                anew[view_ax(inew)] += array[view_ax(iold)]
-            return anew
-
-        for key in self._sumw:
-            out._sumw[key] = dense_op(self._sumw[key])
-            if self._sumw2 is not None:
-                out._sumw2[key] = dense_op(self._sumw2[key])
-        return out
-
-    def values(self, sumw2=False, overflow="none"):
-        """Extract the sum of weights arrays from this histogram
+        Return the values in histogram.
 
         Parameters
         ----------
-            sumw2 : bool
-                If True, frequencies is a tuple of arrays (sum weights, sum squared weights)
-            overflow
-                See `sum` description for meaning of allowed values
-
-        Returns a mapping ``{(sparse identifier, ...): np.array(...), ...}``
-        where each array has dimension `dense_dim` and shape matching
-        the number of bins per axis, plus 0-3 overflow bins depending
-        on the ``overflow`` argument.
+            flow : bool
+                Include flow bins.
         """
 
         def view_dim(arr):
@@ -746,167 +160,12 @@ def view_dim(arr):
                 return arr
             else:
                 return arr[
-                    tuple(_overflow_behavior(overflow) for _ in range(self.dense_dim()))
+                    tuple(_overflow_behavior(flow) for _ in range(self.dense_dim()))
                 ]
 
-        out = {}
-        for sparse_key in self._sumw:
-            id_key = tuple(ax[k] for ax, k in zip(self.sparse_axes(), sparse_key))
-            if sumw2:
-                if self._sumw2 is not None:
-                    w2 = view_dim(self._sumw2[sparse_key])
-                else:
-                    w2 = view_dim(self._sumw[sparse_key])
-                out[id_key] = (view_dim(self._sumw[sparse_key]), w2)
-            else:
-                out[id_key] = view_dim(self._sumw[sparse_key])
-        return out
-
-    def scale(self, factor, axis=None):
-        """Scale histogram in-place by factor
-
-        Parameters
-        ----------
-            factor : float or dict
-                A number or mapping of identifier to number
-            axis : optional
-                Which (sparse) axis the dict applies to, may be a tuples of axes.
-                The dict keys must follow the same structure.
-
-        Examples
-        --------
-        This function is useful to quickly reweight according to some
-        weight mapping along a sparse axis, such as the ``species`` axis
-        in the `Hist` example:
-
-        >>> h.scale({'ducks': 0.3, 'geese': 1.2}, axis='species')
-        >>> h.scale({('ducks',): 0.5}, axis=('species',))
-        >>> h.scale({('geese', 'honk'): 5.0}, axis=('species', 'vocalization'))
-        """
-        if self._sumw2 is None:
-            self._init_sumw2()
-        if isinstance(factor, numbers.Number) and axis is None:
-            for key in self._sumw:
-                self._sumw[key] *= factor
-                self._sumw2[key] *= factor**2
-        elif isinstance(factor, dict):
-            if not isinstance(axis, tuple):
-                axis = (axis,)
-                factor = {(k,): v for k, v in factor.items()}
-            axis = tuple(map(self.axis, axis))
-            isparse = list(map(self._isparse, axis))
-            factor = {
-                tuple(a.index(e) for a, e in zip(axis, k)): v for k, v in factor.items()
-            }
-            for key in self._sumw:
-                factor_key = tuple(key[i] for i in isparse)
-                if factor_key in factor:
-                    self._sumw[key] *= factor[factor_key]
-                    self._sumw2[key] *= factor[factor_key] ** 2
-        elif isinstance(factor, np.ndarray):
-            axis = self.axis(axis)
-            raise NotImplementedError("Scale dense dimension by a factor")
-        else:
-            raise TypeError("Could not interpret scale factor")
-
-    def identifiers(self, axis, overflow="none"):
-        """Return a list of identifiers for an axis
-
-        Parameters
-        ----------
-            axis
-                Axis name or Axis object
-            overflow
-                See `sum` description for meaning of allowed values
-        """
-        axis = self.axis(axis)
-        if isinstance(axis, SparseAxis):  # noqa: RET503
-            out = []
-            isparse = self._isparse(axis)
-            for identifier in axis.identifiers():
-                if any(k[isparse] == axis.index(identifier) for k in self._sumw):
-                    out.append(identifier)
-            if axis.sorting == "integral":
-                hproj = {
-                    key[0]: integral
-                    for key, integral in self.project(axis).values().items()
-                }
-                out.sort(key=lambda k: hproj[k.name])
-            return out
-        elif isinstance(axis, DenseAxis):
-            return axis.identifiers(overflow=overflow)
-
-    def to_boost(self):
-        """Convert this cuda_histogram object to a boost_histogram object"""
-        import boost_histogram
-
-        newaxes = []
-        for axis in self.axes():
-            if isinstance(axis, Bin) and axis._uniform:
-                newaxis = boost_histogram.axis.Regular(
-                    axis._bins,
-                    axis._lo,
-                    axis._hi,
-                    underflow=True,
-                    overflow=True,
-                )
-                newaxis.name = axis.name
-                newaxis.label = axis.label
-                newaxes.append(newaxis)
-            elif isinstance(axis, Bin) and not axis._uniform:
-                newaxis = boost_histogram.axis.Variable(
-                    axis.edges(),
-                    underflow=True,
-                    overflow=True,
-                )
-                newaxis.name = axis.name
-                newaxis.label = axis.label
-                newaxes.append(newaxis)
-            elif isinstance(axis, Cat):
-                identifiers = self.identifiers(axis)
-                newaxis = boost_histogram.axis.StrCategory(
-                    [x.name for x in identifiers],
-                    growth=True,
-                )
-                newaxis.name = axis.name
-                newaxis.label = axis.label
-                newaxis.bin_labels = [x.label for x in identifiers]
-                newaxes.append(newaxis)
-
-        if self._sumw2 is None:
-            storage = boost_histogram.storage.Double()
-        else:
-            storage = boost_histogram.storage.Weight()
-
-        out = boost_histogram.Histogram(*newaxes, storage=storage)
-        out.label = self.label
-
-        def expandkey(key):
-            kiter = iter(key)
-            for ax in newaxes:
-                if isinstance(ax, boost_histogram.axis.StrCategory):
-                    yield ax.index(next(kiter))
-                else:
-                    yield slice(None)
-
-        if self._sumw2 is None:
-            values = self.values(overflow="all")
-            for sparse_key, sumw in values.items():
-                index = tuple(expandkey(sparse_key))
-                view = out.view(flow=True)
-                view[index] = sumw.get()
-        else:
-            values = self.values(sumw2=True, overflow="all")
-            for sparse_key, (sumw, sumw2) in values.items():
-                index = tuple(expandkey(sparse_key))
-                view = out.view(flow=True)
-                view[index].value = sumw.get()
-                view[index].variance = sumw2.get()
-
-        return out
-
-    def to_hist(self):
-        """Convert this cuda_histogram object to a hist object"""
-        import hist
+        return view_dim(
+            cupy.append(cupy.append(self._underflows, self._sumw), self._overflows)
+        )
 
-        return hist.Hist(self.to_boost())
+    def to_cpu(self):
+        return hist.Hist(self, data=self._sumw.get())
diff --git a/tests/test_hist_tools.py b/tests/test_hist_tools.py
index a15da9b..2d9026d 100644
--- a/tests/test_hist_tools.py
+++ b/tests/test_hist_tools.py
@@ -1,6 +1,5 @@
 from __future__ import annotations
 
-import awkward as ak
 import numpy as np
 import pytest
 
@@ -243,135 +242,44 @@ def test_hist():
     assert h_less.sum("vocalization", "height", "mass", "animal").values()[()] == 1004.0
 
 
-def test_hist_serdes():
-    import pickle
-
-    h_regular_bins = cuda_histogram.Hist(
-        "regular joe",
-        cuda_histogram.axis.Bin("x", "x", 20, 0, 200),
-        cuda_histogram.axis.Bin("y", "why", 20, -3, 3),
-    )
-
-    h_regular_bins.fill(
-        x=np.array([1.0, 2.0, 3.0, 4.0, 5.0]), y=np.array([-2.0, 1.0, 0.0, 1.0, 2.0])
-    )
-
-    h_regular_bins.sum("x").identifiers("y")
-
-    spkl = pickle.dumps(h_regular_bins)
-
-    hnew = pickle.loads(spkl)
-
-    hnew.sum("x").identifiers("y")
-
-    assert h_regular_bins._dense_shape == hnew._dense_shape
-    assert h_regular_bins._axes == hnew._axes
-
-
-def test_hist_serdes_labels():
-    import pickle
-
-    ax = cuda_histogram.axis.Bin("asdf", "asdf", 3, 0, 3)
-    ax.identifiers()[0].label = "type 1"
-    h = cuda_histogram.Hist("a", ax)
-    h.identifiers("asdf")
-
-    spkl = pickle.dumps(h)
-
-    hnew = pickle.loads(spkl)
-
-    for old, new in zip(h.identifiers("asdf"), hnew.identifiers("asdf")):
-        assert old.label == new.label
-
-    assert h._dense_shape == hnew._dense_shape
-    assert h._axes == hnew._axes
-
-
-def test_issue_247():
-    import cuda_histogram
-
-    h = cuda_histogram.Hist("stuff", cuda_histogram.axis.Bin("old", "old", 20, -1, 1))
-    h.fill(old=h.axis("old").centers())
-    h2 = h.rebin(h.axis("old"), cuda_histogram.axis.Bin("new", "new", 10, -1, 1))
-    # check first if its even possible to have correct binning
-    assert np.all(h2.axis("new").edges() == h.axis("old").edges()[::2])
-    # make sure the lookup works properly
-    assert np.all(h2.values()[()] == 2.0)
-    h3 = h.rebin(h.axis("old"), 2)
-    assert np.all(h3.values()[()] == 2.0)
-
-    with pytest.raises(ValueError):
-        # invalid division
-        _ = h.rebin(h.axis("old"), cuda_histogram.axis.Bin("new", "new", 8, -1, 1))
-
-    newaxis = cuda_histogram.axis.Bin(
-        "new", "new", h.axis("old").edges()[np.cumsum([0, 2, 3, 5])]
-    )
-    h.rebin("old", newaxis)
-
-
-def test_issue_333():
-    axis = cuda_histogram.axis.Bin("channel", "Channel b1", 50, 0, 2000)
-    temp = np.arange(0, 2000, 40, dtype=np.int16)
-    assert np.all(axis.index(temp).get() == np.arange(50) + 1)
-
-
-def test_issue_394():
-    dummy = cuda_histogram.Hist(
-        "Dummy",
-        cuda_histogram.axis.Cat("sample", "sample"),
-        cuda_histogram.axis.Bin("dummy", "Number of events", 1, 0, 1),
-    )
-    dummy.fill(sample="test", dummy=1, weight=0.5)
-
-
-def test_fill_none():
-    dummy = cuda_histogram.Hist("Dummy", cuda_histogram.axis.Bin("x", "asdf", 1, 0, 1))
-    with pytest.raises(ValueError):
-        # attempt to fill with none
-        dummy.fill(x=ak.Array([0.1, None, 0.3]))
-
-    # allow fill when masked type but no Nones remain
-    dummy.fill(x=ak.Array([0.1, None, 0.3])[[True, False, True]])
-
-
-def test_boost_conversion():
-    import boost_histogram as bh
-
-    dummy = cuda_histogram.Hist(
-        "Dummy",
-        cuda_histogram.axis.Cat("sample", "sample"),
-        cuda_histogram.axis.Bin("dummy", "Number of events", 1, 0, 1),
-    )
-    dummy.fill(sample="test", dummy=1, weight=0.5)
-    dummy.fill(sample="test", dummy=0.1)
-    dummy.fill(sample="test2", dummy=-0.1)
-    dummy.fill(sample="test3", dummy=0.5, weight=0.1)
-    dummy.fill(sample="test3", dummy=0.5, weight=0.9)
-
-    h = dummy.to_boost()
-    assert len(h.axes) == 2
-    assert h[bh.loc("test"), bh.loc(1)].value == 0.5
-    assert h[bh.loc("test"), bh.loc(100)].value == 0.5
-    assert h[bh.loc("test"), bh.loc(1)].variance == 0.25
-    assert h[0, 0].value == 1.0
-    assert h[0, 0].variance == 1.0
-    assert h[1, 0].value == 0.0
-    assert h[bh.loc("test2"), 0].value == 0.0
-    assert h[1, bh.underflow].value == 1.0
-    assert h[bh.loc("test3"), bh.loc(0.5)].value == 1.0
-    assert h[bh.loc("test3"), bh.loc(0.5)].variance == 0.1 * 0.1 + 0.9 * 0.9
-
-    dummy = cuda_histogram.Hist(
-        "Dummy",
-        cuda_histogram.axis.Cat("sample", "sample"),
-        cuda_histogram.axis.Bin("dummy", "Number of events", 1, 0, 1),
-    )
-    dummy.fill(sample="test", dummy=0.1)
-    dummy.fill(sample="test", dummy=0.2)
-    dummy.fill(sample="test2", dummy=0.2)
-    # No sumw2 -> simple bh storage
-    h = dummy.to_boost()
-    assert len(h.axes) == 2
-    assert h[0, 0] == 2.0
-    assert h[1, 0] == 1.0
+# should be a to_cpu test
+# def test_boost_conversion():
+#     import boost_histogram as bh
+
+#     dummy = cuda_histogram.Hist(
+#         "Dummy",
+#         cuda_histogram.Cat("sample", "sample"),
+#         cuda_histogram.Bin("dummy", "Number of events", 1, 0, 1),
+#     )
+#     dummy.fill(sample="test", dummy=1, weight=0.5)
+#     dummy.fill(sample="test", dummy=0.1)
+#     dummy.fill(sample="test2", dummy=-0.1)
+#     dummy.fill(sample="test3", dummy=0.5, weight=0.1)
+#     dummy.fill(sample="test3", dummy=0.5, weight=0.9)
+
+#     h = dummy.to_boost()
+#     assert len(h.axes) == 2
+#     assert h[bh.loc("test"), bh.loc(1)].value == 0.5
+#     assert h[bh.loc("test"), bh.loc(100)].value == 0.5
+#     assert h[bh.loc("test"), bh.loc(1)].variance == 0.25
+#     assert h[0, 0].value == 1.0
+#     assert h[0, 0].variance == 1.0
+#     assert h[1, 0].value == 0.0
+#     assert h[bh.loc("test2"), 0].value == 0.0
+#     assert h[1, bh.underflow].value == 1.0
+#     assert h[bh.loc("test3"), bh.loc(0.5)].value == 1.0
+#     assert h[bh.loc("test3"), bh.loc(0.5)].variance == 0.1 * 0.1 + 0.9 * 0.9
+
+#     dummy = cuda_histogram.Hist(
+#         "Dummy",
+#         cuda_histogram.Cat("sample", "sample"),
+#         cuda_histogram.Bin("dummy", "Number of events", 1, 0, 1),
+#     )
+#     dummy.fill(sample="test", dummy=0.1)
+#     dummy.fill(sample="test", dummy=0.2)
+#     dummy.fill(sample="test2", dummy=0.2)
+#     # No sumw2 -> simple bh storage
+#     h = dummy.to_boost()
+#     assert len(h.axes) == 2
+#     assert h[0, 0] == 2.0
+#     assert h[1, 0] == 1.0