From 64d2804b73c19e7d1b348d8e3dc460c9fe1ee946 Mon Sep 17 00:00:00 2001
From: Wan-Qing Yu <wanqing.yu@alleninstitute.org>
Date: Fri, 9 May 2025 12:56:00 -0700
Subject: [PATCH 1/6] disable post-processing

---
 igneous/tasks/skeleton.py | 25 +++++++++++++------------
 1 file changed, 13 insertions(+), 12 deletions(-)

diff --git a/igneous/tasks/skeleton.py b/igneous/tasks/skeleton.py
index b855921e..f3261076 100644
--- a/igneous/tasks/skeleton.py
+++ b/igneous/tasks/skeleton.py
@@ -612,10 +612,10 @@ def execute(self):
     skeletons = []
     for segid, frags in skels.items():
       skeleton = self.fuse_skeletons(frags)
-      if self.max_cable_length is None or skeleton.cable_length() <= self.max_cable_length:
-        skeleton = kimimaro.postprocess(
-          skeleton, self.dust_threshold, self.tick_threshold
-        )
+      # if self.max_cable_length is None or skeleton.cable_length() <= self.max_cable_length:
+      #   skeleton = kimimaro.postprocess(
+      #     skeleton, self.dust_threshold, self.tick_threshold
+      #   )
       skeleton.id = segid
       skeletons.append(skeleton)
 
@@ -760,14 +760,15 @@ def process_skeletons(self, unfused_skeletons, in_place=False):
         if attr['data_type'] == 'float32' 
       ]
       skel = skel.consolidate()
-      if self.max_cable_length is not None and skel.cable_length() > self.max_cable_length:
-        skeletons[label] = skel.to_precomputed()
-      else:
-        skeletons[label] = kimimaro.postprocess(
-          skel, 
-          dust_threshold=self.dust_threshold, # voxels 
-          tick_threshold=self.tick_threshold, # nm
-        ).to_precomputed()
+      # if self.max_cable_length is not None and skel.cable_length() > self.max_cable_length:
+      #   skeletons[label] = skel.to_precomputed()
+      # else:
+      #   skeletons[label] = kimimaro.postprocess(
+      #     skel, 
+      #     dust_threshold=self.dust_threshold, # voxels 
+      #     tick_threshold=self.tick_threshold, # nm
+      #   ).to_precomputed()
+      skeletons[label] = skel.to_precomputed()
 
     return skeletons
 

From aefdbf173acfaa8a42b65151dc6dac6acb14c4f0 Mon Sep 17 00:00:00 2001
From: Wan-Qing Yu <wanqing.yu@alleninstitute.org>
Date: Fri, 3 Oct 2025 13:35:10 -0700
Subject: [PATCH 2/6] init_working_draft

---
 igneous/task_creation/skeleton.py |   40 +-
 igneous/tasks/skeleton.py         |  276 +++++-
 igneous/tasks/skeleton_mod.py     | 1292 +++++++++++++++++++++++++++++
 igneous/tasks/skeleton_ori.py     |  914 ++++++++++++++++++++
 igneous_cli/cli.py                |    4 +-
 5 files changed, 2522 insertions(+), 4 deletions(-)
 create mode 100644 igneous/tasks/skeleton_mod.py
 create mode 100644 igneous/tasks/skeleton_ori.py

diff --git a/igneous/task_creation/skeleton.py b/igneous/task_creation/skeleton.py
index ab368ff3..4182c78d 100644
--- a/igneous/task_creation/skeleton.py
+++ b/igneous/task_creation/skeleton.py
@@ -93,6 +93,7 @@ def create_skeletonizing_tasks(
   timestamp:Optional[int] = None,
   root_ids_cloudpath:Optional[str] = None,
   cross_sectional_area_repair_sec_per_label:int = 0,
+  split_at_branches=False,
 ):
   """
   Assign tasks with one voxel overlap in a regular grid 
@@ -203,6 +204,11 @@ def create_skeletonizing_tasks(
     1: simple hole filling
     2: also fill borders in 2d on sides of image
     3: also perform a morphological closing using 3x3x3 stencil
+  
+  split_at_branches: (bool) If True, split skeleton fragments at branch points in Stage 1.
+  Surface-touching fragments are kept for merging across chunks (Stage 1 currently pools them under label 1 rather than their original IDs).
+  Interior skeletons get unique IDs and are considered finalized.
+  This helps reduce memory usage during the merge stage for complex branched structures.
   """
   assert 0 <= fill_holes <= 3, "fill_holes must be between 0 to 3 inclusive."
 
@@ -279,6 +285,16 @@ def create_skeletonizing_tasks(
   will_postprocess = bool(np.any(vol.bounds.size3() > shape))
   bounds = vol.bounds.clone()
 
+  # Calculate global chunk information
+  volume_shape = bounds.size3()
+  chunks_per_dim = np.ceil(volume_shape / shape).astype(int)
+  total_chunks = chunks_per_dim[0] * chunks_per_dim[1] * chunks_per_dim[2]
+
+  print(f"Volume shape: {volume_shape}")
+  print(f"Task shape: {shape}")
+  print(f"Chunks per dimension: {chunks_per_dim}")
+  print(f"Total chunks: {total_chunks}")
+
   # this should probably be a cloudvolume feature:
   # estimate the bounding box of an object using whatever
   # is available: meshes, skeletons, spatial index, etc
@@ -294,12 +310,23 @@ def create_skeletonizing_tasks(
       pass
 
   class SkeletonTaskIterator(FinelyDividedTaskIterator):
+    def __init__(self, bounds, shape):
+        super().__init__(bounds, shape)
+        self.chunk_index = 0  # running count of tasks emitted so far; NOTE(review): assumes every task is generated once, in order, starting at 0 — confirm for sliced or re-iterated iterators
+        self.chunks_per_dim = chunks_per_dim  # captured from the enclosing create_skeletonizing_tasks scope
+        self.volume_bounds = bounds
+    
     def task(self, shape, offset):
+      # Calculate 3D chunk coordinates
+      cx = self.chunk_index % self.chunks_per_dim[0]
+      cy = (self.chunk_index // self.chunks_per_dim[0]) % self.chunks_per_dim[1]
+      cz = self.chunk_index // (self.chunks_per_dim[0] * self.chunks_per_dim[1])
+
       bbox_synapses = None
       if synapses:
         bbox_synapses = self.synapses_for_bbox(shape, offset)
 
-      return SkeletonTask(
+      task = SkeletonTask(
         cloudpath=cloudpath,
         shape=(shape + 1).clone(), # 1px overlap on the right hand side
         offset=offset.clone(),
@@ -329,7 +356,15 @@ def task(self, shape, offset):
         root_ids_cloudpath=root_ids_cloudpath,
         fill_holes=fill_holes,
         cross_sectional_area_repair_sec_per_label=int(cross_sectional_area_repair_sec_per_label),
+        # Pass chunk information
+        chunk_index=self.chunk_index,
+        chunk_coords=(cx, cy, cz),
+        global_chunks_per_dim=chunks_per_dim.tolist(),
+        volume_bounds=self.volume_bounds,
+        split_at_branches=bool(split_at_branches),
       )
+      self.chunk_index += 1  # Move to the next chunk
+      return task
 
     def synapses_for_bbox(self, shape, offset):
       """
@@ -378,7 +413,8 @@ def on_finish(self):
           'cross_sectional_area_smoothing_window': int(cross_sectional_area_smoothing_window),
           'cross_sectional_area_repair_sec_per_label': int(cross_sectional_area_repair_sec_per_label),
           'root_ids_cloudpath': root_ids_cloudpath,
-          'fill_holes': int(fill_holes)
+          'fill_holes': int(fill_holes),
+          'split_at_branches': bool(split_at_branches),
         },
         'by': operator_contact(),
         'date': strftime('%Y-%m-%d %H:%M %Z'),
diff --git a/igneous/tasks/skeleton.py b/igneous/tasks/skeleton.py
index a58de88a..a8959179 100644
--- a/igneous/tasks/skeleton.py
+++ b/igneous/tasks/skeleton.py
@@ -1,4 +1,4 @@
-from typing import Optional, Sequence, Dict, List
+from typing import Optional, Sequence, Dict, List, Tuple
 
 from functools import reduce, partial
 import itertools
@@ -88,6 +88,12 @@ def __init__(
     fix_autapses:bool = False,
     timestamp:Optional[int] = None,
     root_ids_cloudpath:Optional[str] = None,
+    # NEW: Add chunk indexing parameters
+    chunk_index:Optional[int] = None,
+    chunk_coords:Optional[Tuple[int,int,int]] = None,
+    global_chunks_per_dim:Optional[List[int]] = None,
+    volume_bounds:Optional[Bbox] = None,
+    split_at_branches:bool = False,
   ):
     super().__init__(
       cloudpath, shape, offset, mip, 
@@ -103,7 +109,17 @@ def __init__(
       bool(dry_run), bool(strip_integer_attributes),
       bool(fix_autapses), timestamp,
       root_ids_cloudpath,
+      chunk_index, chunk_coords, global_chunks_per_dim, volume_bounds,
+      bool(split_at_branches),
     )
+    # Store chunk information
+    self.chunk_index = chunk_index
+    self.chunk_coords = chunk_coords  # (cx, cy, cz)
+    self.global_chunks_per_dim = global_chunks_per_dim
+    self.volume_bounds = volume_bounds
+
+    self.split_at_branches = split_at_branches
+
     if isinstance(self.frag_path, str):
       self.frag_path = cloudfiles.paths.normalize(self.frag_path)
     self.bounds = Bbox(offset, Vec(*shape) + Vec(*offset))
@@ -219,6 +235,9 @@ def decompress_all_labels():
     for sid, skel in skeletons.items():
       skel.id = sid
 
+    if self.split_at_branches:
+      skeletons = self.split_and_reassign_ids(skeletons, vol, bbox)
+
     if self.cross_sectional_area: # This is expensive!
       skeletons = self.compute_cross_sectional_area(vol, bbox, skeletons)
 
@@ -602,6 +621,261 @@ def reprocess_skel(pts, skel):
     vol.image.fill_missing = fill_missing
 
     return skeletons
+  
+  def split_and_reassign_ids(self, skeletons, vol, bbox):
+    """
+    Split each skeleton at its branch points, then sort the pieces by surface contact.
+    Pieces touching the chunk surface are pooled into one skeleton under label 1 (to be merged later).
+    Interior pieces get unique IDs counting up from generate_base_id_for_chunk(). Returns {id: skeleton}.
+    """
+    surface_fragments = []  # Will all become label=1
+    interior_skeletons = {}  # Get unique IDs
+    
+    next_interior_id = self.generate_base_id_for_chunk()
+    print(f"DEBUG: Processing {len(skeletons)} original skeletons in chunk {self.chunk_index}")
+    print(f"DEBUG: Base ID for interior skeletons: {next_interior_id}")
+    print(f"DEBUG: Chunk bbox: {bbox}")
+    print(f"DEBUG: Volume resolution: {vol.resolution}")
+    
+    for label, skel in skeletons.items():
+        print(f"DEBUG: Processing skeleton {label} with {len(skel.vertices)} vertices")
+        
+        # Debug only: the result is printed and does not affect how the pieces are classified
+        touches_original = self.skeleton_touches_surface(skel, vol.resolution)
+        print(f"DEBUG: Original skeleton {label} touches surface: {touches_original}")
+        
+        # Split at branches
+        sub_skels = self.split_skeleton_at_branches(skel)
+        print(f"DEBUG: Split into {len(sub_skels)} sub-skeletons")
+        
+        for i, sub_skel in enumerate(sub_skels):
+            print(f"DEBUG: Sub-skeleton {i} has {len(sub_skel.vertices)} vertices")
+            # Add safety check for empty skeletons
+            if len(sub_skel.vertices) == 0 or len(sub_skel.edges) == 0:
+                print(f"DEBUG: Sub-skeleton {i} is empty, skipping")
+                continue
+            
+            # Debug vertex positions
+            vertices_voxels = sub_skel.vertices / vol.resolution
+            min_coords = np.min(vertices_voxels, axis=0)
+            max_coords = np.max(vertices_voxels, axis=0)
+            print(f"DEBUG: Sub-skeleton {i} vertex range: min={min_coords}, max={max_coords}")
+            
+            touches_surface = self.skeleton_touches_surface(sub_skel, vol.resolution)
+            print(f"DEBUG: Sub-skeleton {i} touches surface: {touches_surface}")
+            
+            if touches_surface:
+                print(f"DEBUG: Sub-skeleton {i} -> SURFACE FRAGMENT (ID=1)")
+                surface_fragments.append(sub_skel)
+            else:
+                print(f"DEBUG: Sub-skeleton {i} -> INTERIOR SKELETON (ID={next_interior_id})")
+                sub_skel.id = next_interior_id
+                interior_skeletons[next_interior_id] = sub_skel
+                next_interior_id += 1
+    
+    print(f"DEBUG: Final counts - Surface fragments: {len(surface_fragments)}, Interior skeletons: {len(interior_skeletons)}")
+    print(f"DEBUG: Interior skeleton IDs: {list(interior_skeletons.keys())}")
+    
+    # Merge all surface fragments into a single label=1 skeleton. NOTE(review): this discards each fragment's original segment label — confirm this is intended for multi-label volumes
+    result = {}
+    if surface_fragments:
+        if len(surface_fragments) == 1:
+            result[1] = surface_fragments[0]
+            result[1].id = 1
+        else:
+            # Use osteoid.Skeleton.simple_merge
+            from osteoid import Skeleton
+            merged = Skeleton.simple_merge(surface_fragments)
+            merged.id = 1
+            result[1] = merged
+    
+    # Add all interior skeletons
+    result.update(interior_skeletons)
+    
+    return result
+  
+  def split_skeleton_at_branches(self, skeleton):
+    """
+    Split skeleton at branch points by removing branch nodes and finding connected components.
+    Returns [skeleton] unchanged if it has no branches, else a list of new Skeletons (possibly empty).
+    """
+    # Get branch nodes using osteoid.Skeleton method
+    branch_nodes = skeleton.branches()
+    
+    if len(branch_nodes) == 0:
+        return [skeleton]
+    
+    # Create mask to remove branch nodes
+    mask = np.ones(len(skeleton.vertices), dtype=bool)
+    mask[branch_nodes] = False
+
+    # Create a mapping from old indices to new indices
+    old_to_new_indices = np.full(len(skeleton.vertices), -1, dtype=int)
+    old_to_new_indices[mask] = np.arange(np.sum(mask))
+
+    # Get vertices without branch nodes
+    filtered_vertices = skeleton.vertices[mask]
+    filtered_radius = skeleton.radius[mask] if skeleton.radius is not None else None
+
+    # Remove edges that contain branch nodes
+    valid_edges = skeleton.edges[~np.isin(skeleton.edges, branch_nodes).any(axis=1)]
+
+    if len(valid_edges) == 0:
+        return []
+
+    # Remap the edges to the new vertex indices
+    remapped_edges = old_to_new_indices[valid_edges]
+
+    # Find connected components in the filtered graph
+    components = self._find_connected_components(remapped_edges, len(filtered_vertices))
+
+    # Create new skeletons for each component
+    sub_skeletons = []
+    for i, component in enumerate(components):
+        if len(component) < 2:
+            continue
+            
+        # Create mapping for this component
+        component_old_to_new = {old_idx: new_idx for new_idx, old_idx in enumerate(component)}
+        
+        # Extract vertices and radius for this component
+        component_vertices = filtered_vertices[component]
+        component_radius = filtered_radius[component] if filtered_radius is not None else None
+        
+        # Extract edges for this component
+        component_edges = []
+        for edge in remapped_edges:
+            if edge[0] in component_old_to_new and edge[1] in component_old_to_new:
+                new_edge = [component_old_to_new[edge[0]], component_old_to_new[edge[1]]]
+                component_edges.append(new_edge)
+        
+        if len(component_edges) > 0:
+            # Create new osteoid.Skeleton - use the correct constructor
+            from osteoid import Skeleton
+            new_skeleton = Skeleton()
+            new_skeleton.vertices = component_vertices.copy()
+            new_skeleton.edges = np.array(component_edges, dtype=skeleton.edges.dtype)
+            if component_radius is not None:
+                new_skeleton.radius = component_radius.copy()
+            new_skeleton.id = f"{skeleton.id}_{i}" if hasattr(skeleton, 'id') else f"skel_{i}"
+            
+            # Copy other attributes if they exist
+            if hasattr(skeleton, 'vertex_types') and skeleton.vertex_types is not None:
+                try:
+                    new_skeleton.vertex_types = skeleton.vertex_types[mask][component].copy()
+                except Exception:
+                    pass  # best effort: vertex_types might not be compatible; don't swallow KeyboardInterrupt/SystemExit
+            
+            sub_skeletons.append(new_skeleton)
+    
+    return sub_skeletons
+  
+  def _find_connected_components(self, edges, num_vertices):
+    """
+    Find connected components using Union-Find (Disjoint Set Union).
+    Returns the components with 2+ vertices, each as a list of vertex indices.
+    """
+    # Every vertex starts as the root of its own singleton set
+    parent = list(range(num_vertices))
+    
+    def find(x):
+        # Iterative (path halving): a recursive find can exceed the recursion limit on long chains
+        while parent[x] != x:
+            parent[x] = parent[parent[x]]
+            x = parent[x]
+        return x
+    
+    def union(x, y):
+        root_x = find(x)
+        root_y = find(y)
+        if root_x != root_y:
+            parent[root_x] = root_y
+    
+    # Union vertices connected by edges
+    for edge in edges:
+        union(edge[0], edge[1])
+    
+    # Group vertices by their root parent
+    from collections import defaultdict
+    components_dict = defaultdict(list)
+    for vertex in range(num_vertices):
+        components_dict[find(vertex)].append(vertex)
+    
+    # Convert to list of components
+    components = list(components_dict.values())
+    # Filter out single-vertex components (isolated vertices)
+    components = [comp for comp in components if len(comp) > 1]
+    
+    return components
+    
+  def skeleton_touches_surface(self, skeleton, resolution, tolerance_voxels=1):
+    """Return True if any vertex lies within tolerance_voxels of a face of the [0, self.shape] box, in voxel units."""
+    
+    # Dividing by resolution yields voxel units — presumably the vertices are chunk-local physical coordinates here (TODO confirm)
+    vertices_voxels = skeleton.vertices / resolution
+    
+    # Get chunk shape directly
+    chunk_shape = Vec(*self.shape)
+    
+    print(f"DEBUG SURFACE: Checking {len(vertices_voxels)} vertices")
+    print(f"DEBUG SURFACE: Chunk shape: {chunk_shape}")
+    print(f"DEBUG SURFACE: Local bounds: [0,0,0] to {chunk_shape}")
+    print(f"DEBUG SURFACE: Tolerance: {tolerance_voxels} voxels")
+    
+    # Check against local chunk boundaries (0 to chunk_shape in each dimension)
+    for dim in range(3):
+        # Check if vertices touch the minimum boundary (near 0)
+        near_min = np.any(vertices_voxels[:, dim] <= tolerance_voxels)
+        # Check if vertices touch the maximum boundary (near chunk_shape)
+        near_max = np.any(vertices_voxels[:, dim] >= chunk_shape[dim] - tolerance_voxels)
+        
+        if near_min or near_max:
+            print(f"DEBUG SURFACE: SURFACE TOUCH detected in dimension {dim}")
+            return True
+    
+    print(f"DEBUG SURFACE: NO SURFACE TOUCH detected")
+    return False
+    
+  def generate_base_id_for_chunk(self):
+    """Return the first interior-skeleton ID for this chunk: (chunk_index + 1) * 1000000 + 1000, or 1000000 if chunk_index is None."""
+    print(f"DEBUG: chunk_index={self.chunk_index}, coords={self.chunk_coords}")
+    # NOTE(review): consecutive chunks' bases are 1,000,000 apart and may overlap real segment IDs — confirm uniqueness assumptions
+    if self.chunk_index is not None:
+        base_id = (self.chunk_index + 1) * 1000000 + 1000
+        print(f"DEBUG: Generated base_id={base_id}")
+        return int(base_id)
+    # NOTE(review): every task without a chunk_index shares this same base — presumably only hit in ad-hoc runs; verify
+    print("DEBUG: No chunk_index, using fallback")
+    return 1000000
+  
+  def extract_subskeleton(self, skeleton, vertex_indices):
+    """Build a new osteoid.Skeleton from the given vertex indices, keeping only edges with both endpoints selected."""
+    vertex_set = set(vertex_indices)
+    old_to_new = {old_idx: new_idx for new_idx, old_idx in enumerate(vertex_indices)}
+    
+    # Create new osteoid.Skeleton
+    from osteoid import Skeleton
+    new_skel = Skeleton()
+    new_skel.vertices = skeleton.vertices[vertex_indices].copy()
+    if skeleton.radius is not None:
+        new_skel.radius = skeleton.radius[vertex_indices].copy()
+    
+    # Extract edges with both endpoints in vertex set
+    valid_edges = []
+    for edge in skeleton.edges:
+        if edge[0] in vertex_set and edge[1] in vertex_set:
+            valid_edges.append([old_to_new[edge[0]], old_to_new[edge[1]]])
+    
+    new_skel.edges = np.array(valid_edges, dtype=skeleton.edges.dtype) if valid_edges else np.array([], dtype=skeleton.edges.dtype).reshape(0, 2)
+    
+    # Copy attributes (best effort)
+    if hasattr(skeleton, 'vertex_types') and skeleton.vertex_types is not None:
+        try:
+            new_skel.vertex_types = skeleton.vertex_types[vertex_indices].copy()
+        except Exception:
+            pass  # incompatible vertex_types are skipped; KeyboardInterrupt/SystemExit still propagate
+    
+    return new_skel
 
   def apply_global_dust_threshold(self, vol, all_labels, mapping):
     path = vol.meta.join(self.cloudpath, vol.key, 'stats', 'voxel_counts.im')
diff --git a/igneous/tasks/skeleton_mod.py b/igneous/tasks/skeleton_mod.py
new file mode 100644
index 00000000..3671987c
--- /dev/null
+++ b/igneous/tasks/skeleton_mod.py
@@ -0,0 +1,1292 @@
+from typing import Optional, Sequence, Dict, List
+
+from functools import reduce
+import itertools
+import json
+import mmap
+import pickle
+import posixpath
+import os
+import re
+from collections import defaultdict
+
+from tqdm import tqdm
+
+import numpy as np
+
+import mapbuffer
+from mapbuffer import MapBuffer, IntMap
+import cloudfiles
+from cloudfiles import CloudFiles, CloudFile
+
+import cloudvolume
+from cloudvolume import CloudVolume, Skeleton, paths
+from cloudvolume.lib import Vec, Bbox, sip, xyzrange
+from cloudvolume.datasource.precomputed.sharding import synthesize_shard_files
+
+import cc3d
+import crackle
+import fastmorph
+import fastremap
+import kimimaro
+
+from taskqueue import RegisteredTask, queueable
+
+SEGIDRE = re.compile(r'/(\d+):.*?$')
+
+def filename_to_segid(filename):
+  """Return the integer segment ID captured by SEGIDRE from a fragment filename; raise ValueError if absent."""
+  found = SEGIDRE.search(filename)
+  if found is not None:
+    return int(found.group(1))
+
+  raise ValueError("There was an issue with the fragment filename: " + filename)
+
+def strip_integer_attributes(skeletons):
+  """Drop every extra attribute that is not float32/float64 from each skeleton, in place; returns the input."""
+  float_types = ('float32', 'float64')
+  for skel in skeletons:
+    kept = [ attr for attr in skel.extra_attributes if attr['data_type'] in float_types ]
+    skel.extra_attributes = kept
+  return skeletons
+
+class SkeletonTask(RegisteredTask):
+  """
+  Stage 1 of skeletonization.
+
+  Convert chunks of segmentation into chunked skeletons and point clouds.
+  They will be merged in the stage 2 task SkeletonMergeTask.
+  """
+  def __init__(
+    self, cloudpath:str, 
+    shape:Sequence[int], offset:Sequence[int], 
+    mip:int, teasar_params:dict, will_postprocess:bool,
+    info:dict = None, 
+    object_ids:Optional[Sequence[int]] = None,
+    mask_ids:Optional[Sequence[int]] = None,
+    fix_branching:bool = True,
+    fix_borders:bool = True,
+    fix_avocados:bool = False,
+    fill_holes:int = 0,
+    dust_threshold:int = 1000, 
+    progress:bool = False,
+    parallel:int = 1,
+    fill_missing:bool = False,
+    sharded:bool = False,
+    frag_path:Optional[str] = None, 
+    spatial_index:bool = True,
+    spatial_grid_shape:Optional[Sequence[int]] = None,
+    synapses:Optional[Sequence[Sequence[float]]] = None, 
+    dust_global:bool = False,
+    cross_sectional_area:bool = False,
+    cross_sectional_area_smoothing_window:int = 1,
+    cross_sectional_area_shape_delta:int = 150,
+    dry_run:bool = False,
+    strip_integer_attributes:bool = True,
+    fix_autapses:bool = False,
+    timestamp:Optional[int] = None,
+    root_ids_cloudpath:Optional[str] = None,
+  ):
+    super().__init__(
+      cloudpath, shape, offset, mip, 
+      teasar_params, will_postprocess, 
+      info, object_ids, mask_ids,
+      fix_branching, fix_borders, 
+      fix_avocados, fill_holes,
+      dust_threshold, progress, parallel,
+      fill_missing, bool(sharded), frag_path, bool(spatial_index),
+      spatial_grid_shape, synapses, bool(dust_global),
+      bool(cross_sectional_area), int(cross_sectional_area_smoothing_window),
+      int(cross_sectional_area_shape_delta),
+      bool(dry_run), bool(strip_integer_attributes),
+      bool(fix_autapses), timestamp,
+      root_ids_cloudpath,
+    )
+    if isinstance(self.frag_path, str):
+      self.frag_path = cloudfiles.paths.normalize(self.frag_path)
+    self.bounds = Bbox(offset, Vec(*shape) + Vec(*offset))
+    self.index_bounds = Bbox(offset, Vec(*spatial_grid_shape) + Vec(*offset))
+
+    # aggressive morphological hole filling has a 1-2vx 
+    # edge effect that needs to be cropped away
+    self.hole_filling_padding = (self.fill_holes >= 3) * 2
+
+  def execute(self):
+    # For graphene volumes, if we've materialized the root IDs
+    # into a static archive, let's use that because it's way more
+    # efficient for fetching root IDs.
+    cloudpath = self.cloudpath
+    if self.root_ids_cloudpath:
+      cloudpath = self.root_ids_cloudpath
+
+    lru_bytes = 0
+    lru_encoding = 'same'
+
+    if self.cross_sectional_area:
+      lru_bytes = self.bounds.size() + 2 * self.cross_sectional_area_shape_delta
+      lru_bytes = lru_bytes[0] * lru_bytes[1] * lru_bytes[2] * 8 // 500
+      lru_encoding = 'crackle'
+
+    vol = CloudVolume(
+      cloudpath,
+      mip=self.mip,
+      bounded=(self.hole_filling_padding == 0),
+      info=self.info,
+      cdn_cache=False,
+      parallel=self.parallel,
+      fill_missing=self.fill_missing,
+      lru_bytes=lru_bytes,
+      lru_encoding=lru_encoding,
+    )
+    bbox = Bbox.clamp(self.bounds, vol.bounds)
+    index_bbox = Bbox.clamp(self.index_bounds, vol.bounds)
+
+    bbox.minpt -= self.hole_filling_padding
+    bbox.maxpt += self.hole_filling_padding
+
+    path = vol.info.get("skeletons", "skeletons")
+    if self.frag_path is None:
+      path = vol.meta.join(self.cloudpath, path)
+    else:
+      # if the path is to a volume root, follow the info instructions,
+      # otherwise place the files exactly where frag path says to
+      test_path = CloudFiles(self.frag_path).join(self.frag_path, "info")
+      test_info = CloudFile(test_path).get_json()
+      if test_info is not None and 'scales' in test_info:
+        path = CloudFiles(self.frag_path).join(self.frag_path, path)
+      else:
+        path = self.frag_path
+
+    all_labels = vol.download(
+      bbox.to_slices(), 
+      agglomerate=True, 
+      timestamp=self.timestamp
+    )
+    all_labels = all_labels[:,:,:,0]
+
+    if self.mask_ids:
+      all_labels = fastremap.mask(all_labels, self.mask_ids)
+
+    extra_targets_after = {}
+    if self.synapses:
+      extra_targets_after = kimimaro.synapses_to_targets(
+        all_labels, self.synapses
+      )
+
+    dust_threshold = self.dust_threshold
+    if self.dust_global and dust_threshold > 0:
+      dust_threshold = 0
+      all_labels = self.apply_global_dust_threshold(vol, all_labels)
+
+    if self.fill_holes and self.fix_autapses:
+      raise ValueError("fill_holes is not currently compatible with fix_autapses")
+
+    voxel_graph = None
+    if self.fix_autapses:
+      voxel_graph = self.voxel_connectivity_graph(vol, bbox, all_labels)
+
+    skeletons = self.skeletonize(
+      all_labels, 
+      vol, 
+      dust_threshold, 
+      extra_targets_after, 
+      voxel_graph,
+    )
+    del all_labels
+
+    if self.cross_sectional_area: # This is expensive!
+      skeletons = self.compute_cross_sectional_area(vol, bbox, skeletons)
+
+    # voxel centered (+0.5) and uses more accurate bounding box from mip 0
+    corrected_offset = (bbox.minpt.astype(np.float32) - vol.meta.voxel_offset(self.mip) + 0.5) * vol.meta.resolution(self.mip)
+    corrected_offset += vol.meta.voxel_offset(0) * vol.meta.resolution(0)
+
+    for segid, skel in skeletons.items():
+      skel.vertices[:] += corrected_offset
+
+    if self.synapses:
+      for segid, skel in skeletons.items():
+        terminal_nodes = skel.vertices[ skel.terminals() ]
+
+        for i, vert in enumerate(terminal_nodes):
+          vert = vert / vol.resolution - self.bounds.minpt
+          vert = tuple(np.round(vert).astype(int))
+          if vert in extra_targets_after.keys():
+            skel.vertex_types[i] = extra_targets_after[vert]
+    
+    # old versions of neuroglancer don't
+    # support int attributes
+    if self.strip_integer_attributes:
+      strip_integer_attributes(skeletons.values())
+
+    if self.dry_run:
+      return skeletons
+
+    if self.sharded:
+      self.upload_batch(vol, path, index_bbox, skeletons)
+    else:
+      self.upload_individuals(vol, path, bbox, skeletons)
+
+    if self.spatial_index:
+      self.upload_spatial_index(vol, path, index_bbox, skeletons)
+
+  def _do_operation(self, all_labels, fn):
+    if self.fill_holes > 0:
+      filled_labels, hole_labels = fastmorph.fill_holes(
+        all_labels,
+        remove_enclosed=True,
+        return_removed=True,
+        fix_borders=(self.fill_holes >= 2),
+        morphological_closing=(self.fill_holes >= 3),
+      )
+
+      if self.fill_holes >= 3:
+        hp = self.hole_filling_padding
+        all_labels = np.asfortranarray(all_labels[hp:-hp,hp:-hp,hp:-hp])
+        filled_labels= np.asfortranarray(filled_labels[hp:-hp,hp:-hp,hp:-hp])
+
+      all_labels = crackle.compress(all_labels)
+      skeletons = fn(filled_labels)
+      del filled_labels
+
+      all_labels = crackle.decompress(all_labels)
+      hole_labels = all_labels * np.isin(all_labels, list(hole_labels))
+      del all_labels
+
+      hole_skeletons = fn(hole_labels)
+      skeletons.update(hole_skeletons)
+      del hole_labels
+      del hole_skeletons
+    else:
+      skeletons = fn(all_labels)
+
+    return skeletons
+
+  def skeletonize(
+    self, 
+    all_labels:np.ndarray, 
+    vol:CloudVolume, 
+    dust_threshold:int, 
+    extra_targets_after:dict, 
+    voxel_graph:np.ndarray,
+  ) -> dict:
+    def do_skeletonize(labels):
+      return kimimaro.skeletonize(
+        labels, self.teasar_params, 
+        object_ids=self.object_ids, 
+        anisotropy=vol.resolution,
+        dust_threshold=dust_threshold, 
+        progress=self.progress, 
+        fix_branching=self.fix_branching,
+        fix_borders=self.fix_borders,
+        fix_avocados=self.fix_avocados,
+        fill_holes=False, # moved this logic into SkeletonTask / fastmorph
+        parallel=self.parallel,
+        extra_targets_after=extra_targets_after.keys(),
+        voxel_graph=voxel_graph,
+      )
+
+    return self._do_operation(all_labels, do_skeletonize)
+
+  def voxel_connectivity_graph(
+    self, 
+    vol:CloudVolume, 
+    bbox:Bbox, 
+    root_labels:np.ndarray,
+  ) -> np.ndarray:
+
+    if vol.meta.path.format != "graphene":
+      vol = CloudVolume(
+        self.cloudpath, mip=self.mip, 
+        info=self.info, cdn_cache=False,
+        parallel=self.parallel, 
+        fill_missing=self.fill_missing,
+      )
+
+    if vol.meta.path.format != "graphene":
+      raise ValueError("Can't extract a voxel connectivity graph from non-graphene volumes.")
+
+    layer_2 = vol.download(
+      bbox, 
+      stop_layer=2,
+      agglomerate=True,
+      timestamp=self.timestamp,
+    )[...,0]
+
+    graph_chunk_size = np.array(vol.meta.graph_chunk_size) / vol.meta.downsample_ratio(vol.mip)
+    graph_chunk_size = graph_chunk_size.astype(int)
+
+    shape = bbox.size()[:3]
+    sgx, sgy, sgz = list(np.ceil(shape / graph_chunk_size).astype(int))
+
+    vcg = cc3d.voxel_connectivity_graph(layer_2, connectivity=26)
+    del layer_2
+
+    # the proper way to do this would be to get the lowest the L3..LN root
+    # as needed, but the lazy way to do this is to get the root labels
+    # which will retain a few errors, but overall the error rate should be
+    # over 100x less. We need to shade in the sides of the connectivity graph
+    # with edges that represent the connections between the adjacent boxes.
+
+    root_vcg = cc3d.voxel_connectivity_graph(root_labels, connectivity=26)
+    clamp_box = Bbox([0,0,0], shape)
+
+    for gx,gy,gz in xyzrange([sgx, sgy, sgz]):
+      bbx = Bbox((gx,gy,gz), (gx+1, gy+1, gz+1))
+      bbx *= graph_chunk_size
+      bbx = Bbox.clamp(bbx, clamp_box)
+
+      slicearr = []
+      for i in range(3):
+        bbx1 = bbx.clone()
+        bbx1.maxpt[i] = bbx1.minpt[i] + 1
+        slicearr.append(bbx1)
+
+        bbx1 = bbx.clone()
+        bbx1.minpt[i] = bbx1.maxpt[i] - 1
+        slicearr.append(bbx1)
+
+      for bbx1 in slicearr:
+        vcg[bbx1.to_slices()] = root_vcg[bbx1.to_slices()] 
+
+    return vcg
+
+  def compute_cross_sectional_area(self, vol, bbox, skeletons):
+    if len(skeletons) == 0:  # nothing to measure, return the input untouched
+      return skeletons
+    # Measures cross sectional areas with kimimaro on a cutout larger than
+    # bbox. Why redownload a bigger image? In order to avoid clipping the
+    # cross sectional areas on the edges.
+    delta = int(self.cross_sectional_area_shape_delta)
+
+    big_bbox = bbox.clone()
+    big_bbox.grow(delta)
+    big_bbox = Bbox.clamp(big_bbox, vol.bounds)
+    # NOTE(review): the padding is added after the clamp, so big_bbox may leave vol.bounds
+    big_bbox.minpt -= self.hole_filling_padding
+    big_bbox.maxpt += self.hole_filling_padding
+
+    all_labels = vol[big_bbox][...,0]  # index 0 of the last axis
+    # delta is reused: from here on it is the offset of bbox inside big_bbox
+    delta = bbox.minpt - big_bbox.minpt
+
+    # place the skeletons in exactly the same position
+    # in the enlarged image
+    for skel in skeletons.values():
+      skel.vertices += delta * vol.resolution
+
+    if self.mask_ids:
+      all_labels = fastremap.mask(all_labels, self.mask_ids)
+
+    def do_cross_section(labels):  # callback handed to self._do_operation below
+      return kimimaro.cross_sectional_area(
+        labels, skeletons,
+        anisotropy=vol.resolution,
+        smoothing_window=self.cross_sectional_area_smoothing_window,
+        progress=self.progress,
+        in_place=True,
+        fill_holes=False,
+      )
+
+    skeletons = self._do_operation(all_labels, do_cross_section)
+    del all_labels
+
+    # move the vertices back to their old smaller image location
+    for skel in skeletons.values():
+      skel.vertices -= delta * vol.resolution
+    # the repair pass revisits skeletons whose contacts flag a face of bbox
+    return self.repair_cross_sectional_area_contacts(vol, bbox, skeletons)
+
+  def repair_cross_sectional_area_contacts(self, vol, bbox, skeletons):  # re-measures skeletons whose areas contacted a face of bbox
+    from dbscan import DBSCAN
+    # one flag per face of bbox: True when that face lies on the volume boundary
+    boundaries = [
+      bbox.minpt.x == vol.bounds.minpt.x,
+      bbox.maxpt.x == vol.bounds.maxpt.x,
+      bbox.minpt.y == vol.bounds.minpt.y,
+      bbox.maxpt.y == vol.bounds.maxpt.y,
+      bbox.minpt.z == vol.bounds.minpt.z,
+      bbox.maxpt.z == vol.bounds.maxpt.z,
+    ]
+
+    if all(boundaries):  # every face is a volume face, so no repair is attempted
+      return skeletons
+
+    invalid_repairs = 0
+    for i, bnd in enumerate(boundaries):
+      invalid_repairs |= (bnd << i)  # bit i mirrors boundaries[i]
+    # inverted below: the set bits then mark the faces that are NOT on the volume boundary
+    invalid_repairs = (~np.uint8(invalid_repairs)) & np.uint8(0b00111111)
+
+    # We want to repair any skeleton that has a contact with the
+    # edge except those that are contacting the volume boundary due to futility
+
+    repair_skels = []
+    for skel in skeletons.values():
+      contacts = skel.cross_sectional_area_contacts & invalid_repairs
+      if np.any(contacts):
+        repair_skels.append(skel)
+
+    delta = int(self.cross_sectional_area_shape_delta)
+
+    shape = bbox.size3()
+    # Re-measures skel in place on a newly downloaded cutout centered on pts.
+    def reprocess_skel(pts, skel):
+      pts_bbx = Bbox.from_points(pts)
+
+      pts_bbx_vol = pts_bbx + bbox.minpt  # NOTE(review): treats pts as relative to bbox.minpt -- confirm
+      center = pts_bbx_vol.center().astype(int)
+      skel_bbx = Bbox(center, center+1)
+      skel_bbx.grow(delta + shape // 2)
+
+      skel_bbx = Bbox.clamp(skel_bbx, vol.bounds)
+
+      skel_bbx.minpt -= self.hole_filling_padding
+      skel_bbx.maxpt += self.hole_filling_padding
+
+      binary_image = vol.download(
+        skel_bbx, mip=vol.mip, label=skel.id
+      )[...,0]
+
+      diff = bbox.minpt - skel_bbx.minpt
+      skel.vertices += diff * vol.resolution  # shift into the cutout; undone at the end
+
+      # we binarized the label for memory's sake, 
+      # so need to harmonize that with the skeleton ID
+      segid = skel.id
+      skel.id = 1
+
+      if self.fill_holes > 0:
+        binary_image = fastmorph.fill_holes(
+          binary_image,
+          fix_borders=(self.fill_holes >= 2),
+          morphological_closing=(self.fill_holes >= 3),
+        )
+        if self.fill_holes >= 3:
+          hp = self.hole_filling_padding
+          binary_image = np.asfortranarray(binary_image[hp:-hp,hp:-hp,hp:-hp])  # NOTE(review): empty result if hp == 0
+
+      kimimaro.cross_sectional_area(
+        binary_image, skel,
+        anisotropy=vol.resolution,
+        smoothing_window=self.cross_sectional_area_smoothing_window,
+        progress=self.progress,
+        in_place=True,
+        fill_holes=False,
+        repair_contacts=True,
+      )
+      skel.id = segid  # restore the real segment id
+      skel.vertices -= diff * vol.resolution
+
+    for skel in repair_skels:
+      verts = (skel.vertices // vol.resolution).astype(int)
+      reprocess_skel(verts, skel)  # first pass: cutout centered on the whole skeleton
+
+      pts = verts[skel.cross_sectional_area_contacts > 0]  # contacts are read after the pass above
+      if len(pts) == 0:
+        continue
+
+      labels, core_samples_mask = DBSCAN(pts, eps=5, min_samples=2)
+      uniq = fastremap.unique(labels)
+      for lbl in uniq:
+        reprocess_skel(pts[labels == lbl], skel)  # one more pass per DBSCAN label
+
+    return skeletons
+
+  def apply_global_dust_threshold(self, vol, all_labels):
+    """
+    Keep only the labels whose global voxel count reaches self.dust_threshold.
+
+    Counts are read from <cloudpath>/<vol.key>/stats/voxel_counts.im; a
+    FileNotFoundError is raised when that file does not exist.
+    """
+    counts_path = vol.meta.join(self.cloudpath, vol.key, 'stats', 'voxel_counts.im')
+    remote = CloudFile(counts_path)
+    cached = CloudFile(counts_path.replace(f"{remote.protocol}://", "mem://"))
+    if not remote.exists():
+      raise FileNotFoundError(f"Cannot apply global dust threshold without {counts_path}")
+
+    # Prefer the mem:// copy; without one, clear the in-memory store first.
+    if cached.exists():
+      payload = cached.get()
+    else:
+      payload = None
+      cloudfiles.clear_memory()
+
+    if payload is None and remote.protocol == "file":
+      payload = remote  # local files are handed to IntMap as a CloudFile
+    elif payload is None:
+      payload = remote.get()
+      cached.put(payload, compress='zstd')
+
+    voxel_counts = IntMap(payload)
+    survivors = [
+      label for label in fastremap.unique(all_labels)
+      if label != 0 and voxel_counts[label] >= self.dust_threshold
+    ]
+    return fastremap.mask_except(all_labels, survivors)
+
+  def upload_batch(self, vol, path, bbox, skeletons):
+    """Write the skeletons of this chunk as one MapBuffer file named `<bbox>.frags`."""
+    def encode(skel):
+      return skel.to_precomputed()
+
+    packed = MapBuffer(skeletons, compress="br", tobytesfn=encode)
+    destination = CloudFiles(path, progress=vol.progress)
+    destination.put(
+      path="{}.frags".format(bbox.to_filename()),
+      content=packed.tobytes(),
+      compress=None,
+      content_type="application/x-mapbuffer",
+      cache_control=False,
+    )
+
+  def upload_individuals(self, vol, path, bbox, skeletons):
+    """
+    Upload the skeletons of one chunk as individual files.
+
+    Without postprocessing the skeletons go straight through
+    vol.skeleton.upload. Otherwise each skeleton is split by
+    split_skeleton_with_boundary_info and every fragment is pickled to
+    `<fragment id>:<scaled bbox>` next to a `.boundary` pickle of its info.
+    """
+    skeletons = skeletons.values()
+    if not self.will_postprocess:
+      vol.skeleton.upload(skeletons)
+      return
+
+    pairs = [
+      pair
+      for skel in skeletons
+      for pair in split_skeleton_with_boundary_info(skel, bbox)
+    ]
+
+    # the file names carry the chunk bounds multiplied by vol.resolution
+    chunk_name = (bbox * vol.resolution).to_filename()
+    cf = CloudFiles(path, progress=vol.progress)
+
+    # two objects per fragment: the pickled fragment and its boundary info
+    uploads = []
+    for fragment, boundary_info in pairs:
+      stem = f"{fragment.id}:{chunk_name}"
+      uploads.append((stem, pickle.dumps(fragment)))
+      uploads.append((stem + ".boundary", pickle.dumps(boundary_info)))
+
+    cf.puts(uploads, compress='gzip', content_type="application/python-pickle", cache_control=False)
+
+  def upload_spatial_index(self, vol, path, bbox, skeletons):
+    """
+    Write the fragment spatial index and boundary connections of one chunk.
+
+    Two gzip-compressed JSON files named after the chunk bounds (scaled by
+    vol.resolution) are written under `path`: `<bounds>.spatial` maps each
+    fragment id to its bounding box, original segment and chunk bounds, and
+    `<bounds>.connections` holds the boundary records of every fragment
+    that has at least one boundary vertex.
+    """
+    fragment_spatial_index = {}
+    boundary_connections = {}
+
+    for skel in skeletons.values():
+      for fragment, boundary_info in split_skeleton_with_boundary_info(skel, bbox):
+        fragment_spatial_index[fragment.id] = {
+          'bbox': Bbox.from_points(fragment.vertices).to_list(),
+          # Skeletons returned unsplit carry no 'original_segment_id' entry;
+          # indexing the key directly raised KeyError for them.
+          'original_segment': boundary_info.get('original_segment_id', skel.id),
+          'chunk_bbox': boundary_info['chunk_bbox']
+        }
+
+        # Track boundary connections for merge reconstruction
+        if boundary_info['boundary_vertices']:
+          boundary_connections[fragment.id] = {
+            'boundary_vertices': boundary_info['boundary_vertices'],
+            'connections': boundary_info['connections'],
+            'chunk_bbox': boundary_info['chunk_bbox']
+          }
+
+    bbox_scaled = bbox.astype(vol.resolution.dtype) * vol.resolution
+    precision = vol.skeleton.spatial_index.precision
+    stem = bbox_scaled.to_filename(precision)
+    cf = CloudFiles(path, progress=vol.progress)
+
+    for extension, content in (
+      ('.spatial', fragment_spatial_index),
+      ('.connections', boundary_connections),
+    ):
+      cf.put_json(
+        path=f"{stem}{extension}", content=content,
+        compress='gzip', cache_control=False,
+      )
+
+class UnshardedSkeletonMergeTask(RegisteredTask):
+  """
+  Stage 2 of skeletonization.
+
+  Merge chunked TEASAR skeletons into a single skeleton.
+
+  If we parallelize using single digit prefixes ['0','1',..'9'] all skeletons will
+  be correctly processed. But if we do ['10','11',..'99'] skeletons from [0,9] won't get
+  processed and need to be handled specifically by creating tasks that will process
+  a single skeleton ['0:','1:',..'9:']
+  """
+  def __init__(
+      self, cloudpath, prefix, 
+      crop=0, dust_threshold=4000, max_cable_length=None,
+      tick_threshold=6000, delete_fragments=False
+    ):
+    super(UnshardedSkeletonMergeTask, self).__init__(
+      cloudpath, prefix, crop, 
+      dust_threshold, max_cable_length,
+      tick_threshold, delete_fragments
+    )  # presumably RegisteredTask stores these as attributes (self.crop, self.prefix, ... are read below)
+    self.max_cable_length = float(max_cable_length) if max_cable_length is not None else None
+
+  def execute(self):  # list the fragments, fuse them per segment id, upload, optionally delete the fragments
+    self.vol = CloudVolume(self.cloudpath, cdn_cache=False)
+    self.vol.mip = self.vol.skeleton.meta.mip
+
+    fragment_filenames = self.get_filenames()
+    skels = self.get_skeletons_by_segid(fragment_filenames)
+
+    skeletons = []
+    for segid, frags in skels.items():
+      skeleton = self.fuse_skeletons(frags)
+      # Post-processing is disabled: the fused skeleton is uploaded as-is. Previously:
+      #   if self.max_cable_length is None or skeleton.cable_length() <= self.max_cable_length:
+      #     skeleton = kimimaro.postprocess(skeleton, self.dust_threshold, self.tick_threshold)
+      # dust_threshold, tick_threshold and max_cable_length are therefore unused in execute().
+      skeleton.id = segid
+      skeletons.append(skeleton)
+
+    self.vol.skeleton.upload(skeletons)
+    
+    if self.delete_fragments:
+      cf = CloudFiles(self.cloudpath, progress=True)
+      cf.delete(fragment_filenames)
+
+  def get_filenames(self):  # every file under <skeleton path>/<prefix>
+    prefix = '{}/{}'.format(self.vol.skeleton.path, self.prefix)
+
+    cf = CloudFiles(self.cloudpath, progress=True)
+    return [ _ for _ in cf.list(prefix=prefix) ]
+
+  def get_skeletons_by_segid(self, filenames):  # returns { segid: [ (Bbox, unpickled fragment), ... ] }
+    cf = CloudFiles(self.cloudpath, progress=False)
+    skels = cf.get(filenames)
+
+    skeletons = defaultdict(list)
+    for skel in skels:
+      try:
+        segid = filename_to_segid(skel['path'])
+      except ValueError:
+        # Typically this is due to preexisting fully
+        # formed skeletons e.g. skeletons_mip_3/1588494
+        continue
+
+      skeletons[segid].append( 
+        (
+          Bbox.from_filename(skel['path']),
+          pickle.loads(skel['content'])  # NOTE(review): pickle.loads runs arbitrary code if the stored files are untrusted
+        )
+      )
+
+    return skeletons
+
+  def fuse_skeletons(self, skels):  # skels: list of (Bbox, Skeleton) pairs; returns one consolidated Skeleton
+    if len(skels) == 0:
+      return Skeleton()
+
+    bbxs = [ item[0] for item in skels ]
+    skeletons = [ item[1] for item in skels ]
+
+    skeletons = self.crop_skels(bbxs, skeletons)
+    skeletons = [ s for s in skeletons if not s.empty() ]
+
+    if len(skeletons) == 0:  # cropping may leave nothing behind
+      return Skeleton()
+
+    return Skeleton.simple_merge(skeletons).consolidate()
+
+  def crop_skels(self, bbxs, skeletons):  # returns clones; the inputs are not modified
+    cropped = [ s.clone() for s in skeletons ]
+
+    if self.crop <= 0:
+      return cropped
+    
+    for i in range(len(skeletons)):
+      bbx = bbxs[i]
+      bbx = bbx.astype(self.vol.resolution.dtype) 
+      bbx.minpt += self.crop * self.vol.resolution  # shrink the box by self.crop times the resolution on every side
+      bbx.maxpt -= self.crop * self.vol.resolution
+
+      if bbx.volume() <= 0:  # nothing left of the box after shrinking: keep the uncropped clone
+        continue
+
+      cropped[i] = cropped[i].crop(bbx)
+
+    return cropped
+
+class ShardedSkeletonMergeTask(RegisteredTask):
+  """Fuse the `.frags` fragments belonging to one shard and upload that shard file."""
+  def __init__(
+    self, cloudpath, shard_no, 
+    dust_threshold=4000, tick_threshold=6000, frag_path=None, cache=False,
+    spatial_index_db=None, max_cable_length=None
+  ):
+    super(ShardedSkeletonMergeTask, self).__init__(
+      cloudpath, shard_no,  
+      dust_threshold, tick_threshold, frag_path, cache, spatial_index_db,
+      max_cable_length
+    )
+    self.progress = False
+    self.max_cable_length = float(max_cable_length) if max_cable_length is not None else None
+
+  def execute(self):
+    # cache is necessary for local computation, but on GCE download is very fast
+    # so cache isn't necessary.
+    cv = CloudVolume(
+      self.cloudpath, 
+      progress=self.progress,
+      spatial_index_db=self.spatial_index_db,
+      cache=self.cache
+    )
+
+    # This looks messy because we are trying to avoid retaining
+    # unnecessary memory. In the original iteration, this was 
+    # using 50 GB+ memory on minnie65. With changes to this
+    # and the spatial_index, we are getting it down to something reasonable.
+    locations = self.locations_for_labels(
+      labels_for_shard(cv, self.shard_no, self.progress), 
+      cv
+    )
+    filenames = set(itertools.chain(*locations.values()))
+    labels = set(locations.keys())
+    del locations
+    skeletons = self.get_unfused(labels, filenames, cv, self.frag_path)
+    del labels
+    del filenames
+    skeletons = self.process_skeletons(skeletons, in_place=True)
+
+    if len(skeletons) == 0:
+      return
+
+    shard_files = synthesize_shard_files(cv.skeleton.reader.spec, skeletons)
+
+    if len(shard_files) != 1:
+      raise ValueError(
+        "Only one shard file should be generated per task. Expected: {} Got: {} ".format(
+          str(self.shard_no), ", ".join(shard_files.keys())
+      ))
+
+    cf = CloudFiles(cv.skeleton.meta.layerpath, progress=self.progress)
+    cf.puts( 
+      ( (fname, data) for fname, data in shard_files.items() ),
+      compress=False,
+      content_type='application/octet-stream',
+      cache_control='no-cache',      
+    )
+
+  def process_skeletons(self, unfused_skeletons, in_place=False):
+    """Merge the fragments of each label and return { label: precomputed bytes }."""
+    skeletons = {}
+    if in_place:
+      skeletons = unfused_skeletons
+
+    for label in tqdm(unfused_skeletons.keys(), desc="Postprocessing", disable=(not self.progress)):
+      skels = unfused_skeletons[label]
+      skel = Skeleton.simple_merge(skels)
+      skel.id = label
+      skel.extra_attributes = [ 
+        attr for attr in skel.extra_attributes \
+        if attr['data_type'] == 'float32' 
+      ]
+      skel = skel.consolidate()
+      # Post-processing is disabled: the merged skeleton is stored as-is. The removed
+      # code called kimimaro.postprocess(skel, dust_threshold=..., tick_threshold=...)
+      # unless skel.cable_length() exceeded self.max_cable_length.
+      skeletons[label] = skel.to_precomputed()
+
+    return skeletons
+
+  def get_unfused(self, labels, filenames, cv, frag_path):
+    """Scan every fragment file and return { label: [ Skeleton, ... ] } for the given labels."""
+    skeldirfn = lambda loc: cv.meta.join(cv.skeleton.meta.skeleton_path, loc)
+    filenames = [ skeldirfn(loc) for loc in filenames ]
+
+    block_size = 50
+
+    if len(filenames) < block_size:
+      blocks = [ filenames ]
+      n_blocks = 1
+    else:
+      # ceiling division: a final partial block counts too (the tqdm total was one short)
+      n_blocks = (len(filenames) + block_size - 1) // block_size
+      blocks = sip(filenames, block_size)
+
+    frag_prefix = frag_path or cv.cloudpath
+    local_input = False
+    if paths.extract(frag_prefix).protocol == "file":
+       local_input = True
+       frag_prefix = frag_prefix.replace("file://", "", 1)
+
+    all_skels = defaultdict(list)
+    for filenames_block in tqdm(blocks, desc="Filename Block", total=n_blocks, disable=(not self.progress)):
+      if local_input:
+        all_files = {}
+        for filename in filenames_block:
+          all_files[filename] = open(os.path.join(frag_prefix, filename), "rb")
+      else:
+        all_files = { 
+          filename: CloudFile(cv.meta.join(frag_prefix, filename), cache_meta=True)
+          for filename in filenames_block 
+        } 
+
+      for filename, content in tqdm(all_files.items(), desc="Scanning Fragments", disable=(not self.progress)):
+        try:
+          fragment = MapBuffer(content, frombytesfn=Skeleton.from_precomputed)
+          for label in labels:
+            try:
+              skel = fragment[label]
+            except KeyError:
+              continue
+            skel.id = label
+            all_skels[label].append(skel)
+        finally:  # release the handle even when scanning this fragment fails
+          if hasattr(content, "close"):
+            content.close()
+
+    return all_skels
+
+  def locations_for_labels(self, labels, cv):
+    """Map each label to the `.frags` file names derived from its `.spatial` index locations."""
+    SPATIAL_EXT = re.compile(r'\.spatial$')
+    index_filenames = cv.skeleton.spatial_index.file_locations_per_label(labels)
+    for label, locations in index_filenames.items():
+      for i, location in enumerate(locations):
+        bbx = Bbox.from_filename(re.sub(SPATIAL_EXT, '', location))
+        bbx /= cv.meta.resolution(cv.skeleton.meta.mip)
+        index_filenames[label][i] = bbx.to_filename() + '.frags'
+    return index_filenames
+
+def labels_for_shard(cv, shard_no, progress):
+  """
+  Return the labels stored in shard `shard_no`: the precalculated
+  `<shard_no>.labels` JSON when present, else a filter over the spatial index.
+  """
+  precomputed = CloudFiles(cv.skeleton.meta.layerpath).get_json(shard_no + '.labels')
+  if precomputed is not None:
+    return precomputed
+  # Slow path: test each label the spatial index returns for the full bounds.
+  candidates = cv.skeleton.spatial_index.query(cv.bounds * cv.resolution)
+  shard_of = cv.skeleton.reader.spec.compute_shard_location
+  matching = []
+  for lbl in tqdm(candidates, desc="Computing Shard Numbers", disable=(not progress)):
+    if shard_of(lbl).shard_number == shard_no:
+      matching.append(lbl)
+  return matching
+
+@queueable
+def ShardedFromUnshardedSkeletonMergeTask(
+  src:str,
+  dest:str,
+  shard_no:str,
+  cache_control:bool = False,
+  skel_dir:Optional[str] = None,
+  progress:bool = False,
+):
+  """
+  Build the skeleton shard `shard_no` of `dest` from the unsharded skeletons
+  of `src`. When `skel_dir` is None, the 'skeletons' entry of the source info
+  is used if present. NOTE(review): `cache_control` is never read; the shard
+  is always uploaded with cache_control='no-cache'.
+  """
+  cv_src = CloudVolume(src)
+  # Fix: this used to read `cv.info`, but no `cv` exists in this function, so a
+  # NameError was raised whenever skel_dir was None. Only cv_src is open here.
+  if skel_dir is None and 'skeletons' in cv_src.info:
+    skel_dir = cv_src.info['skeletons']
+  cv_dest = CloudVolume(dest, skel_dir=skel_dir, progress=progress)
+
+  labels = labels_for_shard(cv_dest, shard_no, progress)
+  skeletons = cv_src.skeleton.get(labels)
+  del labels
+  if len(skeletons) == 0:
+    return
+  skeletons = strip_integer_attributes(skeletons)
+  skeletons = { skel.id: skel.to_precomputed() for skel in skeletons }
+  shard_files = synthesize_shard_files(cv_dest.skeleton.reader.spec, skeletons)
+  if len(shard_files) != 1:
+    raise ValueError(
+      "Only one shard file should be generated per task. Expected: {} Got: {} ".format(
+        str(shard_no), ", ".join(shard_files.keys())
+    ))
+  cf = CloudFiles(cv_dest.skeleton.meta.layerpath, progress=progress)
+  cf.puts( 
+    ( (fname, data) for fname, data in shard_files.items() ),
+    compress=False, content_type='application/octet-stream', cache_control='no-cache',
+  )
+
+@queueable
+def DeleteSkeletonFilesTask(
+  cloudpath:str, prefix:str, skel_dir:Optional[str] = None
+):
+  """Delete the files of the skeleton layer that are listed for `prefix`."""
+  layerpath = CloudVolume(cloudpath, skel_dir=skel_dir).skeleton.meta.layerpath
+  skeleton_files = CloudFiles(layerpath)
+  doomed = skeleton_files.list(prefix=prefix)
+  skeleton_files.delete(doomed)
+
+
+@queueable
+def TransferSkeletonFilesTask(
+  src:str,
+  dest:str,
+  prefix:str,
+  skel_dir:Optional[str] = None
+):
+  """
+  Copy the files listed for `prefix` from the skeleton layer of `src` to the
+  skeleton layer of `dest`. `skel_dir` is only passed to the destination volume.
+  """
+  source_files = CloudFiles(CloudVolume(src).skeleton.meta.layerpath)
+  target_files = CloudFiles(CloudVolume(dest, skel_dir=skel_dir).skeleton.meta.layerpath)
+  source_files.transfer_to(target_files, paths=source_files.list(prefix=prefix))
+
+def split_skeleton_with_boundary_info(skeleton, chunk_bbox):
+  """
+  Split skeleton at branch points while preserving boundary connectivity information.
+
+  Paths are traced outward from every branch point (a vertex with more than
+  two neighbors). Connected components without any branch point are traced
+  from their end points so that they are not lost from the output. Each
+  traced path becomes one fragment with the id "<skeleton.id>_<n>".
+
+  Args:
+    skeleton: CloudVolume Skeleton object
+    chunk_bbox: Bounding box of the current chunk
+
+  Returns:
+    list: List of (fragment, boundary_info) tuples. Every boundary_info has
+      the keys 'boundary_vertices', 'chunk_bbox', 'connections',
+      'original_segment_id' and 'fragment_id'. A skeleton without edges or
+      without branch points is returned whole, as a single fragment.
+
+  NOTE(review): fragments are built with space='voxel' and without extra
+  attributes, and find_boundary_vertices compares the vertices with
+  chunk_bbox as given -- confirm that both use the same units. A closed
+  loop that contains no branch point still yields no fragment.
+  """
+  if skeleton is None or len(skeleton.vertices) == 0:
+    return []
+
+  vertices = skeleton.vertices
+  edges = skeleton.edges
+
+  def whole_skeleton():
+    # Result for a skeleton that is not split. It now carries the same keys as the
+    # per-fragment records; indexing 'original_segment_id' used to raise KeyError.
+    boundary_info = {
+      'boundary_vertices': find_boundary_vertices(vertices, chunk_bbox),
+      'chunk_bbox': chunk_bbox.to_list(),
+      'connections': [],
+      'original_segment_id': skeleton.id,
+      'fragment_id': skeleton.id
+    }
+    return [(skeleton, boundary_info)]
+
+  if len(edges) == 0:
+    return whole_skeleton()
+
+  # Build adjacency list
+  adjacency = defaultdict(list)
+  for edge in edges:
+    adjacency[edge[0]].append(edge[1])
+    adjacency[edge[1]].append(edge[0])
+
+  # Find branch points (degree > 2)
+  branch_points = [ v for v, nbrs in adjacency.items() if len(nbrs) > 2 ]
+
+  # If no branch points, return single fragment with boundary info
+  if len(branch_points) == 0:
+    return whole_skeleton()
+
+  branch_set = set(branch_points)  # constant time membership tests
+
+  # Seeds are (start vertex, first neighbor) pairs. Branch point seeds come
+  # first, so the numbering of fragments that touch a branch point is the
+  # same as before. End point seeds only produce a fragment in components
+  # that have no branch point; elsewhere their edge is already visited.
+  seeds = [ (bp, nbr) for bp in branch_points for nbr in adjacency[bp] ]
+  seeds += [ (v, nbrs[0]) for v, nbrs in adjacency.items() if len(nbrs) == 1 ]
+
+  has_radii = skeleton.radii is not None and len(skeleton.radii) > 0
+  has_types = skeleton.vertex_types is not None and len(skeleton.vertex_types) > 0
+
+  fragments_with_info = []
+  visited_edges = set()  # holds both orientations of every traced edge
+
+  for start, neighbor in seeds:
+    if (start, neighbor) in visited_edges:
+      continue
+
+    # Trace the path until it ends or forks
+    path_vertices = [start, neighbor]
+    on_path = {start, neighbor}  # set twin of path_vertices
+    visited_edges.add((start, neighbor))
+    visited_edges.add((neighbor, start))
+    current = neighbor
+
+    while True:
+      ahead = [ n for n in adjacency[current] if n not in on_path ]
+      if len(ahead) != 1:
+        break
+      next_vertex = ahead[0]
+      path_vertices.append(next_vertex)
+      on_path.add(next_vertex)
+      visited_edges.add((current, next_vertex))
+      visited_edges.add((next_vertex, current))
+      current = next_vertex
+
+    # A path is a chain: vertex i connects to vertex i + 1
+    fragment_vertices = vertices[path_vertices]
+    fragment_edges = [ [i, i + 1] for i in range(len(path_vertices) - 1) ]
+
+    fragment = Skeleton(
+      vertices=fragment_vertices,
+      edges=np.array(fragment_edges, dtype=np.uint32),
+      radii=skeleton.radii[path_vertices] if has_radii else None,
+      vertex_types=skeleton.vertex_types[path_vertices] if has_types else None,
+      extra_attributes=[],
+      segid=skeleton.id,
+      space='voxel'
+    )
+    # Create unique fragment ID
+    fragment.id = f"{skeleton.id}_{len(fragments_with_info)}"
+
+    # Track connections to other fragments (for merge reconstruction)
+    connections = [
+      { 'vertex_idx': end, 'connects_to': 'branch', 'branch_vertex': vertices[path_vertices[end]].tolist() }
+      for end in (0, len(path_vertices) - 1)
+      if path_vertices[end] in branch_set
+    ]
+
+    fragments_with_info.append((fragment, {
+      'boundary_vertices': find_boundary_vertices(fragment_vertices, chunk_bbox),
+      'chunk_bbox': chunk_bbox.to_list(),
+      'connections': connections,
+      'original_segment_id': skeleton.id,
+      'fragment_id': fragment.id
+    }))
+
+  return fragments_with_info if fragments_with_info else whole_skeleton()
+
+def find_boundary_vertices(vertices, chunk_bbox, tolerance=1.0):
+  """
+  Find vertices that are on or near chunk boundaries.
+
+  Args:
+    vertices: iterable of (x, y, z) rows; each row must offer .tolist()
+    chunk_bbox: object with 3-component minpt and maxpt
+    tolerance: largest |coordinate - face| distance that still counts as
+      touching a face (default 1.0, the value that used to be hard-coded)
+
+  Returns:
+    list of dicts with 'vertex_idx', 'vertex_pos' and 'boundary_faces'
+    (any of x_min, x_max, y_min, y_max, z_min, z_max, in that order).
+
+  NOTE(review): vertices and chunk_bbox are compared as given, so they
+  must share the same units -- confirm at the call sites.
+  """
+  # (axis, face name, face coordinate) triples, computed once per call
+  # instead of once per vertex.
+  faces = []
+  for axis, name in enumerate('xyz'):
+    faces.append((axis, name + '_min', chunk_bbox.minpt[axis]))
+    faces.append((axis, name + '_max', chunk_bbox.maxpt[axis]))
+
+  boundary_vertices = []
+  for i, vertex in enumerate(vertices):
+    touched = [ name for axis, name, coord in faces if abs(vertex[axis] - coord) <= tolerance ]
+    if touched:
+      boundary_vertices.append({
+        'vertex_idx': i,
+        'vertex_pos': vertex.tolist(),
+        'boundary_faces': touched
+      })
+
+  return boundary_vertices
+
+class FragmentAwareSkeletonMergeTask(RegisteredTask):
+  """
+  Modified merge task that handles pre-split skeleton fragments.
+  Reconstructs skeletons by connecting fragments across chunk boundaries
+  while maintaining branch point splits.
+  """
+  def __init__(
+    self, cloudpath, shard_no, 
+    dust_threshold=4000, tick_threshold=6000, frag_path=None, cache=False,
+    spatial_index_db=None, max_cable_length=None, target_segment_id=None
+  ):
+    super(FragmentAwareSkeletonMergeTask, self).__init__(
+      cloudpath, shard_no,  
+      dust_threshold, tick_threshold, frag_path, cache, spatial_index_db,
+      max_cable_length, target_segment_id
+    )
+    self.progress = False
+    self.max_cable_length = float(max_cable_length) if max_cable_length is not None else None
+    self.target_segment_id = target_segment_id
+
+  def execute(self):
+    cv = CloudVolume(
+      self.cloudpath, 
+      progress=self.progress,
+      spatial_index_db=self.spatial_index_db,
+      cache=self.cache
+    )
+
+    # Get fragments for the target segment
+    fragment_locations = self.get_fragment_locations_for_segment(cv, self.target_segment_id)
+
+    # Load fragments and boundary information
+    fragments_with_boundaries = self.load_fragments_with_boundaries(cv, fragment_locations)
+
+    # Group the fragments that touch across chunk boundaries
+    connected_components = self.connect_fragments_across_boundaries(fragments_with_boundaries)
+
+    # Create final skeleton trees (one per connected component)
+    final_skeletons = {}
+    for comp_id, component_fragments in connected_components.items():
+      if len(component_fragments) > 0:
+        # Each connected component becomes a separate skeleton tree
+        merged_skeleton = self.merge_connected_fragments(component_fragments)
+        final_skeletons[f"{self.target_segment_id}_{comp_id}"] = merged_skeleton.to_precomputed()
+
+    if len(final_skeletons) == 0:
+      return
+    # Store results. synthesize_shard_files is fed encoded skeletons, as in the other merge tasks.
+    # NOTE(review): the labels are "<segment>_<component>" strings -- confirm the shard spec accepts them.
+    shard_files = synthesize_shard_files(cv.skeleton.reader.spec, final_skeletons)
+    cf = CloudFiles(cv.skeleton.meta.layerpath, progress=self.progress)
+    cf.puts( 
+      ( (fname, data) for fname, data in shard_files.items() ),
+      compress=False,
+      content_type='application/octet-stream',
+      cache_control='no-cache',      
+    )
+
+  def get_fragment_locations_for_segment(self, cv, segment_id):
+    """Find all chunks containing fragments of the target segment."""
+    all_locations = []
+
+    # Query all spatial index files to find fragment locations
+    # This would need to be implemented based on your specific setup
+    # For now, assuming you have a way to query fragment locations
+    # NOTE(review): still a stub -- it returns [] and execute() then uploads nothing.
+    return all_locations
+
+  def load_fragments_with_boundaries(self, cv, fragment_locations):
+    """Load fragments and their boundary information."""
+    fragments_with_boundaries = []
+    # NOTE(review): pickle.loads runs arbitrary code if the stored files are untrusted.
+    for location in fragment_locations:
+      try:
+        # Load fragment
+        fragment_file = CloudFile(cv.meta.join(cv.cloudpath, location))
+        fragment = pickle.loads(fragment_file.get())
+
+        # Load boundary information
+        boundary_file = CloudFile(cv.meta.join(cv.cloudpath, location + ".boundary"))
+        boundary_info = pickle.loads(boundary_file.get())
+
+        fragments_with_boundaries.append((fragment, boundary_info))
+      except Exception as e:  # best effort: a fragment that cannot be loaded is reported and skipped
+        print(f"Error loading fragment {location}: {e}")
+        continue
+
+    return fragments_with_boundaries
+
+  def connect_fragments_across_boundaries(self, fragments_with_boundaries):
+    """
+    Group fragments into connected components based on boundary connections.
+    Fragments that connect across chunk boundaries are grouped together.
+
+    Returns a dict mapping a component number to the list of
+    (fragment, boundary_info) tuples of that component. Every pair of
+    fragments is tested, so the cost is quadratic in their number.
+    """
+    # networkx is only needed by this method
+    import networkx as nx
+
+    # Nodes are positions in fragments_with_boundaries rather than fragment
+    # ids: ids are numbered per chunk, so the same id can occur in several chunks.
+    G = nx.Graph()
+
+    for i, (fragment, boundary_info) in enumerate(fragments_with_boundaries):
+      G.add_node(i)
+
+      # Connect fragments that share boundary vertices
+      for other_i in range(i + 1, len(fragments_with_boundaries)):
+        other_boundary_info = fragments_with_boundaries[other_i][1]
+        if self.fragments_connect_at_boundary(boundary_info, other_boundary_info):
+          G.add_edge(i, other_i)
+
+    # Find connected components
+    connected_components = {}
+    for comp_id, component in enumerate(nx.connected_components(G)):
+      connected_components[comp_id] = [
+        fragments_with_boundaries[idx] for idx in component
+      ]
+
+    return connected_components
+
+  def fragments_connect_at_boundary(self, boundary_info1, boundary_info2):
+    """
+    Check if two fragments connect at chunk boundaries.
+
+    True when one boundary vertex of each fragment lies within `tolerance`
+    of the other and the two sit on opposite faces of the same axis
+    (e.g. x_max of one chunk against x_min of its neighbor).
+    """
+    tolerance = 2.0  # tolerance for boundary matching, in vertex_pos units
+    opposite = {
+      'x_min': 'x_max', 'x_max': 'x_min',
+      'y_min': 'y_max', 'y_max': 'y_min',
+      'z_min': 'z_max', 'z_max': 'z_min',
+    }
+    others = [
+      (np.array(bv['vertex_pos']), set(bv['boundary_faces']))
+      for bv in boundary_info2.get('boundary_vertices', [])
+    ]
+
+    for bv1 in boundary_info1.get('boundary_vertices', []):
+      pos1 = np.array(bv1['vertex_pos'])
+      wanted = { opposite[face] for face in bv1['boundary_faces'] if face in opposite }
+      for pos2, faces2 in others:
+        if np.linalg.norm(pos1 - pos2) <= tolerance and wanted & faces2:
+          return True
+
+    return False
+
+  def merge_connected_fragments(self, component_fragments):
+    """Merge fragments in a connected component into a single skeleton."""
+    fragments = [frag for frag, _ in component_fragments]
+
+    # Use simple merge for now - could be optimized for better branch handling
+    if len(fragments) == 1:
+      return fragments[0]
+
+    # Batch merge to control memory usage
+    batch_size = 50
+    while len(fragments) > 1:  # every round merges groups of up to batch_size skeletons
+      next_batch = []
+      for i in range(0, len(fragments), batch_size):
+        batch = fragments[i:i + batch_size]
+        if len(batch) == 1:
+          next_batch.append(batch[0])
+        else:
+          merged = Skeleton.simple_merge(batch)
+          next_batch.append(merged)
+      fragments = next_batch
+
+    return fragments[0]
diff --git a/igneous/tasks/skeleton_ori.py b/igneous/tasks/skeleton_ori.py
new file mode 100644
index 00000000..f3261076
--- /dev/null
+++ b/igneous/tasks/skeleton_ori.py
@@ -0,0 +1,914 @@
+from typing import Optional, Sequence, Dict, List
+
+from functools import reduce
+import itertools
+import json
+import mmap
+import pickle
+import posixpath
+import os
+import re
+from collections import defaultdict
+
+from tqdm import tqdm
+
+import numpy as np
+
+import mapbuffer
+from mapbuffer import MapBuffer, IntMap
+import cloudfiles
+from cloudfiles import CloudFiles, CloudFile
+
+import cloudvolume
+from cloudvolume import CloudVolume, Skeleton, paths
+from cloudvolume.lib import Vec, Bbox, sip, xyzrange
+from cloudvolume.datasource.precomputed.sharding import synthesize_shard_files
+
+import cc3d
+import crackle
+import fastmorph
+import fastremap
+import kimimaro
+
+from taskqueue import RegisteredTask, queueable
+
+SEGIDRE = re.compile(r'/(\d+):.*?$')
+
+def filename_to_segid(filename):
+  """Extract the integer segid from a '.../<segid>:<suffix>' fragment path."""
+  found = SEGIDRE.search(filename)
+  if found is not None:
+    return int(found.group(1))
+
+  raise ValueError("There was an issue with the fragment filename: " + filename)
+
+def strip_integer_attributes(skeletons):
+  """Drop every extra attribute that is not float32/float64, in place."""
+  float_types = ('float32', 'float64')
+  for skel in skeletons:
+    # rebinds the list; the attribute dicts themselves are untouched
+    skel.extra_attributes = [ a for a in skel.extra_attributes if a['data_type'] in float_types ]
+  return skeletons
+
+class SkeletonTask(RegisteredTask):
+  """
+  Stage 1 of skeletonization.
+
+  Convert chunks of segmentation into chunked skeletons and point clouds.
+  They will be merged in the stage 2 task SkeletonMergeTask.
+  """
+  def __init__(
+    self, cloudpath:str,
+    shape:Sequence[int], offset:Sequence[int],
+    mip:int, teasar_params:dict, will_postprocess:bool,
+    info:Optional[dict] = None,
+    object_ids:Optional[Sequence[int]] = None,
+    mask_ids:Optional[Sequence[int]] = None,
+    fix_branching:bool = True, fix_borders:bool = True,
+    fix_avocados:bool = False, fill_holes:int = 0,
+    dust_threshold:int = 1000,
+    progress:bool = False, parallel:int = 1,
+    fill_missing:bool = False, sharded:bool = False,
+    frag_path:Optional[str] = None,
+    spatial_index:bool = True,
+    spatial_grid_shape:Optional[Sequence[int]] = None,
+    synapses:Optional[Sequence[Sequence[float]]] = None,
+    dust_global:bool = False,
+    cross_sectional_area:bool = False,
+    cross_sectional_area_smoothing_window:int = 1,
+    cross_sectional_area_shape_delta:int = 150,
+    dry_run:bool = False,
+    strip_integer_attributes:bool = True,
+    fix_autapses:bool = False,
+    timestamp:Optional[int] = None,
+    root_ids_cloudpath:Optional[str] = None,
+  ):
+    """
+    Store the task arguments and derive bounds, index_bounds and the
+    hole filling crop padding from them.
+    """
+    super().__init__(
+      cloudpath, shape, offset, mip,
+      teasar_params, will_postprocess,
+      info, object_ids, mask_ids,
+      fix_branching, fix_borders,
+      fix_avocados, fill_holes,
+      dust_threshold, progress, parallel,
+      fill_missing, bool(sharded), frag_path, bool(spatial_index),
+      spatial_grid_shape, synapses, bool(dust_global),
+      bool(cross_sectional_area), int(cross_sectional_area_smoothing_window),
+      int(cross_sectional_area_shape_delta),
+      bool(dry_run), bool(strip_integer_attributes),
+      bool(fix_autapses), timestamp,
+      root_ids_cloudpath,
+    )
+    if isinstance(self.frag_path, str):
+      self.frag_path = cloudfiles.paths.normalize(self.frag_path)
+    self.bounds = Bbox(offset, Vec(*shape) + Vec(*offset))
+    # the default of None cannot be unpacked by Vec(*...); index on the task shape instead
+    grid_shape = shape if spatial_grid_shape is None else spatial_grid_shape
+    self.index_bounds = Bbox(offset, Vec(*grid_shape) + Vec(*offset))
+    # aggressive morphological hole filling has a 1-2vx edge effect that needs to be cropped away
+    self.hole_filling_padding = (self.fill_holes >= 3) * 2
+
+  def execute(self):
+    """
+    Skeletonize the task's cutout and upload the resulting fragments.
+    Returns the dict of segid to skeleton when dry_run is set, otherwise None.
+    """
+    # For graphene volumes, a materialized static archive of root IDs is far more efficient to query.
+    cloudpath = self.root_ids_cloudpath or self.cloudpath
+
+    lru_bytes = 0
+    lru_encoding = 'same'
+
+    if self.cross_sectional_area:
+      lru_bytes = self.bounds.size() + 2 * self.cross_sectional_area_shape_delta
+      lru_bytes = lru_bytes[0] * lru_bytes[1] * lru_bytes[2] * 8 // 500
+      lru_encoding = 'crackle'
+
+    vol = CloudVolume(
+      cloudpath,
+      mip=self.mip,
+      bounded=(self.hole_filling_padding == 0),
+      info=self.info,
+      cdn_cache=False,
+      parallel=self.parallel,
+      fill_missing=self.fill_missing,
+      lru_bytes=lru_bytes,
+      lru_encoding=lru_encoding,
+    )
+    bbox = Bbox.clamp(self.bounds, vol.bounds)
+    index_bbox = Bbox.clamp(self.index_bounds, vol.bounds)
+
+    bbox.minpt -= self.hole_filling_padding
+    bbox.maxpt += self.hole_filling_padding
+
+    path = vol.info.get("skeletons", "skeletons")
+    if self.frag_path is None:
+      path = vol.meta.join(self.cloudpath, path)
+    else:
+      # if the path is to a volume root, follow the info instructions,
+      # otherwise place the files exactly where frag path says to
+      test_path = CloudFiles(self.frag_path).join(self.frag_path, "info")
+      test_info = CloudFile(test_path).get_json()
+      if test_info is not None and 'scales' in test_info:
+        path = CloudFiles(self.frag_path).join(self.frag_path, path)
+      else:
+        path = self.frag_path
+
+    all_labels = vol.download(
+      bbox.to_slices(),
+      agglomerate=True,
+      timestamp=self.timestamp
+    )
+    all_labels = all_labels[:,:,:,0]
+
+    if self.mask_ids:
+      all_labels = fastremap.mask(all_labels, self.mask_ids)
+
+    extra_targets_after = {}
+    if self.synapses:
+      extra_targets_after = kimimaro.synapses_to_targets(
+        all_labels, self.synapses
+      )
+
+    dust_threshold = self.dust_threshold
+    if self.dust_global and dust_threshold > 0:
+      dust_threshold = 0
+      all_labels = self.apply_global_dust_threshold(vol, all_labels)
+
+    if self.fill_holes and self.fix_autapses:
+      raise ValueError("fill_holes is not currently compatible with fix_autapses")
+
+    voxel_graph = None
+    if self.fix_autapses:
+      voxel_graph = self.voxel_connectivity_graph(vol, bbox, all_labels)
+
+    skeletons = self.skeletonize(
+      all_labels,
+      vol,
+      dust_threshold,
+      extra_targets_after,
+      voxel_graph,
+    )
+    del all_labels
+
+    if self.cross_sectional_area: # This is expensive!
+      skeletons = self.compute_cross_sectional_area(vol, bbox, skeletons)
+
+    # voxel centered (+0.5) and uses more accurate bounding box from mip 0
+    corrected_offset = (bbox.minpt.astype(np.float32) - vol.meta.voxel_offset(self.mip) + 0.5) * vol.meta.resolution(self.mip)
+    corrected_offset += vol.meta.voxel_offset(0) * vol.meta.resolution(0)
+
+    for segid, skel in skeletons.items():
+      skel.vertices[:] += corrected_offset
+
+    if self.synapses:
+      for segid, skel in skeletons.items():
+        # terminals() yields vertex indices; vertex_types must be indexed with
+        # those, not with the position inside the list of terminals
+        for vert_id in skel.terminals():
+          vert = skel.vertices[vert_id] / vol.resolution - self.bounds.minpt
+          vert = tuple(np.round(vert).astype(int))
+          if vert in extra_targets_after.keys():
+            skel.vertex_types[vert_id] = extra_targets_after[vert]
+
+    # old versions of neuroglancer don't
+    # support int attributes
+    if self.strip_integer_attributes:
+      strip_integer_attributes(skeletons.values())
+
+    if self.dry_run:
+      return skeletons
+
+    if self.sharded:
+      self.upload_batch(vol, path, index_bbox, skeletons)
+    else:
+      self.upload_individuals(vol, path, bbox, skeletons)
+
+    if self.spatial_index:
+      self.upload_spatial_index(vol, path, index_bbox, skeletons)
+
+  def _do_operation(self, all_labels, fn):
+    """Apply fn to the labels; with fill_holes > 0, once on the filled image and once on the removed holes."""
+    if self.fill_holes > 0:
+      filled_labels, hole_labels = fastmorph.fill_holes(
+        all_labels,
+        remove_enclosed=True,
+        return_removed=True,
+        fix_borders=(self.fill_holes >= 2),
+        morphological_closing=(self.fill_holes >= 3),
+      )
+      # crop hole_filling_padding voxels off every side of both images
+      if self.fill_holes >= 3:
+        hp = self.hole_filling_padding
+        all_labels = np.asfortranarray(all_labels[hp:-hp,hp:-hp,hp:-hp])
+        filled_labels= np.asfortranarray(filled_labels[hp:-hp,hp:-hp,hp:-hp])
+      # the unfilled labels stay compressed while fn works on the filled copy
+      all_labels = crackle.compress(all_labels)
+      skeletons = fn(filled_labels)
+      del filled_labels
+      # keep only the voxels whose label was reported as removed by fill_holes
+      all_labels = crackle.decompress(all_labels)
+      hole_labels = all_labels * np.isin(all_labels, list(hole_labels))
+      del all_labels
+      hole_skeletons = fn(hole_labels)
+      skeletons.update(hole_skeletons)
+      del hole_labels
+      del hole_skeletons
+    else:
+      skeletons = fn(all_labels)
+
+    return skeletons
+
+  def skeletonize(
+    self,
+    all_labels:np.ndarray,
+    vol:CloudVolume,
+    dust_threshold:int,
+    extra_targets_after:dict,
+    voxel_graph:np.ndarray,
+  ) -> dict:
+    """Skeletonize all_labels with kimimaro, routed through _do_operation."""
+    options = dict(
+      object_ids=self.object_ids,
+      anisotropy=vol.resolution,
+      dust_threshold=dust_threshold,
+      progress=self.progress,
+      fix_branching=self.fix_branching,
+      fix_borders=self.fix_borders,
+      fix_avocados=self.fix_avocados,
+      fill_holes=False, # moved this logic into SkeletonTask / fastmorph
+      parallel=self.parallel,
+      extra_targets_after=extra_targets_after.keys(),
+      voxel_graph=voxel_graph,
+    )
+    def run(labels):
+      return kimimaro.skeletonize(labels, self.teasar_params, **options)
+    return self._do_operation(all_labels, run)
+
+  def voxel_connectivity_graph(
+    self, 
+    vol:CloudVolume, 
+    bbox:Bbox, 
+    root_labels:np.ndarray,
+  ) -> np.ndarray:
+    """Return a 26-connected voxel connectivity graph of graphene layer 2 labels whose graph chunk faces come from root_labels."""
+    if vol.meta.path.format != "graphene":
+      vol = CloudVolume(
+        self.cloudpath, mip=self.mip, 
+        info=self.info, cdn_cache=False,
+        parallel=self.parallel, 
+        fill_missing=self.fill_missing,
+      )
+
+    if vol.meta.path.format != "graphene":
+      raise ValueError("Can't extract a voxel connectivity graph from non-graphene volumes.")
+
+    layer_2 = vol.download(
+      bbox, 
+      stop_layer=2,
+      agglomerate=True,
+      timestamp=self.timestamp,
+    )[...,0]
+
+    graph_chunk_size = np.array(vol.meta.graph_chunk_size) / vol.meta.downsample_ratio(vol.mip)
+    graph_chunk_size = graph_chunk_size.astype(int)
+
+    shape = bbox.size()[:3]
+    sgx, sgy, sgz = list(np.ceil(shape / graph_chunk_size).astype(int))
+
+    vcg = cc3d.voxel_connectivity_graph(layer_2, connectivity=26)
+    del layer_2
+
+    # the proper way to do this would be to get the lowest L3..LN root
+    # as needed, but the lazy way to do this is to get the root labels
+    # which will retain a few errors, but overall the error rate should be
+    # over 100x less. We need to shade in the sides of the connectivity graph
+    # with edges that represent the connections between the adjacent boxes.
+
+    root_vcg = cc3d.voxel_connectivity_graph(root_labels, connectivity=26)
+    clamp_box = Bbox([0,0,0], shape)
+
+    for gx,gy,gz in xyzrange([sgx, sgy, sgz]):
+      bbx = Bbox((gx,gy,gz), (gx+1, gy+1, gz+1))
+      bbx *= graph_chunk_size
+      bbx = Bbox.clamp(bbx, clamp_box)
+      # collect the one voxel thick slab at the min and max end of each axis
+      slicearr = []
+      for i in range(3):
+        bbx1 = bbx.clone()
+        bbx1.maxpt[i] = bbx1.minpt[i] + 1
+        slicearr.append(bbx1)
+
+        bbx1 = bbx.clone()
+        bbx1.minpt[i] = bbx1.maxpt[i] - 1
+        slicearr.append(bbx1)
+
+      for bbx1 in slicearr:
+        vcg[bbx1.to_slices()] = root_vcg[bbx1.to_slices()] 
+
+    return vcg
+
+  def compute_cross_sectional_area(self, vol, bbox, skeletons):
+    """Compute cross sectional areas on an enlarged cutout, then hand the result to repair_cross_sectional_area_contacts."""
+    if len(skeletons) == 0:
+      return skeletons
+    # Why redownload a bigger image? In order to avoid clipping the
+    # cross sectional areas on the edges.
+    delta = int(self.cross_sectional_area_shape_delta)
+
+    big_bbox = bbox.clone()
+    big_bbox.grow(delta)
+    big_bbox = Bbox.clamp(big_bbox, vol.bounds)
+
+    big_bbox.minpt -= self.hole_filling_padding
+    big_bbox.maxpt += self.hole_filling_padding
+
+    all_labels = vol[big_bbox][...,0]
+    # delta is reused: from here on it is the offset of bbox inside big_bbox
+    delta = bbox.minpt - big_bbox.minpt
+
+    # place the skeletons in exactly the same position
+    # in the enlarged image
+    for skel in skeletons.values():
+      skel.vertices += delta * vol.resolution
+
+    if self.mask_ids:
+      all_labels = fastremap.mask(all_labels, self.mask_ids)
+
+    def do_cross_section(labels):
+      return kimimaro.cross_sectional_area(
+        labels, skeletons,
+        anisotropy=vol.resolution,
+        smoothing_window=self.cross_sectional_area_smoothing_window,
+        progress=self.progress,
+        in_place=True,
+        fill_holes=False,
+      )
+
+    skeletons = self._do_operation(all_labels, do_cross_section)
+    del all_labels
+
+    # move the vertices back to their old smaller image location
+    for skel in skeletons.values():
+      skel.vertices -= delta * vol.resolution
+
+    return self.repair_cross_sectional_area_contacts(vol, bbox, skeletons)
+
+  def repair_cross_sectional_area_contacts(self, vol, bbox, skeletons):
+    """Recompute cross sections of skeletons whose contacts touch a face of bbox that is not a volume boundary."""
+    from dbscan import DBSCAN
+    boundaries = [
+      bbox.minpt.x == vol.bounds.minpt.x,
+      bbox.maxpt.x == vol.bounds.maxpt.x,
+      bbox.minpt.y == vol.bounds.minpt.y,
+      bbox.maxpt.y == vol.bounds.maxpt.y,
+      bbox.minpt.z == vol.bounds.minpt.z,
+      bbox.maxpt.z == vol.bounds.maxpt.z,
+    ]
+
+    if all(boundaries):
+      return skeletons
+    # bit i is set when face i of bbox lies on the volume boundary
+    invalid_repairs = 0
+    for i, bnd in enumerate(boundaries):
+      invalid_repairs |= (bnd << i)
+    # inverted within 6 bits: the faces that are NOT on the volume boundary
+    invalid_repairs = (~np.uint8(invalid_repairs)) & np.uint8(0b00111111)
+
+    # We want to repair any skeleton that has a contact with the
+    # edge except those that are contacting the volume boundary due to futility
+
+    repair_skels = []
+    for skel in skeletons.values():
+      contacts = skel.cross_sectional_area_contacts & invalid_repairs
+      if np.any(contacts):
+        repair_skels.append(skel)
+
+    delta = int(self.cross_sectional_area_shape_delta)
+
+    shape = bbox.size3()
+    
+    def reprocess_skel(pts, skel):
+      pts_bbx = Bbox.from_points(pts)
+
+      pts_bbx_vol = pts_bbx + bbox.minpt
+      center = pts_bbx_vol.center().astype(int)
+      skel_bbx = Bbox(center, center+1)
+      skel_bbx.grow(delta + shape // 2)
+
+      skel_bbx = Bbox.clamp(skel_bbx, vol.bounds)
+
+      skel_bbx.minpt -= self.hole_filling_padding
+      skel_bbx.maxpt += self.hole_filling_padding
+
+      binary_image = vol.download(
+        skel_bbx, mip=vol.mip, label=skel.id
+      )[...,0]
+
+      diff = bbox.minpt - skel_bbx.minpt
+      skel.vertices += diff * vol.resolution
+
+      # we binarized the label for memory's sake, 
+      # so need to harmonize that with the skeleton ID
+      segid = skel.id
+      skel.id = 1
+
+      if self.fill_holes > 0:
+        binary_image = fastmorph.fill_holes(
+          binary_image,
+          fix_borders=(self.fill_holes >= 2),
+          morphological_closing=(self.fill_holes >= 3),
+        )
+        if self.fill_holes >= 3:
+          hp = self.hole_filling_padding
+          binary_image = np.asfortranarray(binary_image[hp:-hp,hp:-hp,hp:-hp])
+
+      kimimaro.cross_sectional_area(
+        binary_image, skel,
+        anisotropy=vol.resolution,
+        smoothing_window=self.cross_sectional_area_smoothing_window,
+        progress=self.progress,
+        in_place=True,
+        fill_holes=False,
+        repair_contacts=True,
+      )
+      skel.id = segid
+      skel.vertices -= diff * vol.resolution
+
+    for skel in repair_skels:
+      verts = (skel.vertices // vol.resolution).astype(int)
+      reprocess_skel(verts, skel)
+
+      pts = verts[skel.cross_sectional_area_contacts > 0]
+      if len(pts) == 0:
+        continue
+
+      labels, core_samples_mask = DBSCAN(pts, eps=5, min_samples=2)
+      uniq = fastremap.unique(labels)
+      for lbl in uniq:
+        reprocess_skel(pts[labels == lbl], skel)
+
+    return skeletons
+
+  def apply_global_dust_threshold(self, vol, all_labels):
+    """
+    Mask out labels whose global voxel count is below dust_threshold.
+
+    Counts are read from the 'stats/voxel_counts.im' IntMap of the
+    volume and cached in cloudfiles' mem:// storage for non-file
+    protocols. Label 0 is never kept.
+
+    Raises FileNotFoundError if the voxel counts file does not exist.
+    """
+    path = vol.meta.join(self.cloudpath, vol.key, 'stats', 'voxel_counts.im')
+    cf = CloudFile(path)
+    memcf = CloudFile(path.replace(f"{cf.protocol}://", "mem://"))
+    if not cf.exists():
+      raise FileNotFoundError(f"Cannot apply global dust threshold without {path}")
+
+    cached = memcf.exists()
+    buf = memcf.get() if cached else None
+    if not cached:
+      cloudfiles.clear_memory()
+    if buf is None and cf.protocol == "file":
+      buf = cf
+    elif buf is None:
+      buf = cf.get()
+      memcf.put(buf, compress='zstd')
+
+    mb = IntMap(buf)
+    valid_objects = [
+      label for label in fastremap.unique(all_labels)
+      if label != 0 and mb[label] >= self.dust_threshold
+    ]
+    return fastremap.mask_except(all_labels, valid_objects)
+
+  def upload_batch(self, vol, path, bbox, skeletons):
+    """Write all skeletons as one 'br' compressed MapBuffer named '<bbox>.frags'."""
+    def encode(skel):
+      return skel.to_precomputed()
+
+    fragments = MapBuffer(skeletons, compress="br", tobytesfn=encode)
+    # the MapBuffer compresses its own entries, so the file is uploaded as is
+    CloudFiles(path, progress=vol.progress).put(
+      path=f"{bbox.to_filename()}.frags",
+      content=fragments.tobytes(),
+      compress=None,
+      content_type="application/x-mapbuffer",
+      cache_control=False,
+    )
+
+  def upload_individuals(self, vol, path, bbox, skeletons):
+    """
+    Upload each skeleton as its own file.
+
+    Without postprocessing the skeletons go straight through
+    vol.skeleton.upload. Otherwise each one is pickled under path as
+    '<skel.id>:<bbox scaled by vol.resolution>'.
+    """
+    if not self.will_postprocess:
+      vol.skeleton.upload(skeletons.values())
+      return
+
+    physical_bbox = bbox * vol.resolution
+    files = (
+      (f"{skel.id}:{physical_bbox.to_filename()}", pickle.dumps(skel))
+      for skel in skeletons.values()
+    )
+    CloudFiles(path, progress=vol.progress).puts(
+      files, compress='gzip',
+      content_type="application/python-pickle", cache_control=False,
+    )
+
+  def upload_spatial_index(self, vol, path, bbox, skeletons):
+    """Write '<bbox>.spatial': a JSON map of segid to the bounding box of its skeleton's vertices."""
+    labeled = tqdm(skeletons.items(), disable=(not vol.progress), desc="Extracting Bounding Boxes")
+    boxes = { segid: Bbox.from_points(skel.vertices).to_list() for segid, skel in labeled }
+
+    # the filename is the bbox scaled by vol.resolution at the index's precision
+    physical_bbox = bbox.astype(vol.resolution.dtype) * vol.resolution
+    filename = physical_bbox.to_filename(vol.skeleton.spatial_index.precision)
+
+    CloudFiles(path, progress=vol.progress).put_json(
+      path=f"{filename}.spatial",
+      content=boxes,
+      compress='gzip',
+      cache_control=False,
+    )
+
+class UnshardedSkeletonMergeTask(RegisteredTask):
+  """
+  Stage 2 of skeletonization.
+
+  Merge chunked TEASAR skeletons into a single skeleton.
+
+  If we parallelize using single digit prefixes ['0','1',..'9'], all skeletons will
+  be correctly processed. But if we do ['10','11',..'99'], the skeletons of segids 0-9
+  won't get processed and need to be handled specifically by creating tasks that each
+  process a single segid: ['0:','1:',..'9:'].
+  """
+  def __init__(
+    self, cloudpath, prefix,
+    crop=0, dust_threshold=4000, max_cable_length=None,
+    tick_threshold=6000, delete_fragments=False
+  ):
+    """Store the task arguments; a given max_cable_length is coerced to float."""
+    super().__init__(
+      cloudpath, prefix, crop, dust_threshold,
+      max_cable_length, tick_threshold, delete_fragments
+    )
+    self.max_cable_length = None if max_cable_length is None else float(max_cable_length)
+
+  def execute(self):
+    """Fuse the fragments of every segid found under prefix and upload the results; postprocessing is currently disabled."""
+    self.vol = CloudVolume(self.cloudpath, cdn_cache=False)
+    self.vol.mip = self.vol.skeleton.meta.mip
+    fragment_filenames = self.get_filenames()
+    skels = self.get_skeletons_by_segid(fragment_filenames)
+
+    skeletons = []
+    for segid, frags in skels.items():
+      skeleton = self.fuse_skeletons(frags)
+      # if self.max_cable_length is None or skeleton.cable_length() <= self.max_cable_length:
+      #   skeleton = kimimaro.postprocess(
+      #     skeleton, self.dust_threshold, self.tick_threshold
+      #   )
+      skeleton.id = segid
+      skeletons.append(skeleton)
+
+    self.vol.skeleton.upload(skeletons)
+    
+    if self.delete_fragments:
+      cf = CloudFiles(self.cloudpath, progress=True)
+      cf.delete(fragment_filenames)
+
+  def get_filenames(self):
+    """List every file in the skeleton directory whose name starts with self.prefix."""
+    search = f"{self.vol.skeleton.path}/{self.prefix}"
+    cf = CloudFiles(self.cloudpath, progress=True)
+    return list(cf.list(prefix=search))
+
+  def get_skeletons_by_segid(self, filenames):
+    """
+    Download the fragment files and group them by segid.
+
+    Returns: { segid: [ (Bbox parsed from the filename, unpickled fragment), ... ] }
+    """
+    cf = CloudFiles(self.cloudpath, progress=False)
+    by_segid = defaultdict(list)
+
+    for downloaded in cf.get(filenames):
+      filepath = downloaded['path']
+      try:
+        segid = filename_to_segid(filepath)
+      except ValueError:
+        # Typically this is due to preexisting fully
+        # formed skeletons e.g. skeletons_mip_3/1588494
+        continue
+      # NOTE: pickle.loads can execute arbitrary code; fragments must come from a trusted location
+      bbx = Bbox.from_filename(filepath)
+      by_segid[segid].append( (bbx, pickle.loads(downloaded['content'])) )
+    return by_segid
+
+  def fuse_skeletons(self, skels):
+    """
+    Crop the (bbox, skeleton) fragments of one segid and merge the
+    non-empty ones; returns an empty Skeleton if nothing remains.
+    """
+    if len(skels) == 0:
+      return Skeleton()
+
+    bboxes = [ pair[0] for pair in skels ]
+    cropped = self.crop_skels(bboxes, [ pair[1] for pair in skels ])
+    survivors = [ frag for frag in cropped if not frag.empty() ]
+    if len(survivors) == 0:
+      return Skeleton()
+    return Skeleton.simple_merge(survivors).consolidate()
+
+  def crop_skels(self, bbxs, skeletons):
+    """
+    Return clones of the skeletons, each cropped to its bounding box
+    shrunk by self.crop * vol.resolution on every side. A box that
+    shrinks to zero volume or less leaves its clone uncropped.
+    """
+    cropped = [ s.clone() for s in skeletons ]
+    if self.crop <= 0:
+      return cropped
+
+    margin = self.crop * self.vol.resolution
+    for i, clone in enumerate(cropped):
+      shrunk = bbxs[i].astype(self.vol.resolution.dtype)
+      shrunk.minpt += margin
+      shrunk.maxpt -= margin
+      if shrunk.volume() > 0:
+        cropped[i] = clone.crop(shrunk)
+    return cropped
+
+class ShardedSkeletonMergeTask(RegisteredTask):
+  def __init__(
+    self, cloudpath, shard_no,
+    dust_threshold=4000, tick_threshold=6000, frag_path=None, cache=False,
+    spatial_index_db=None, max_cable_length=None
+  ):
+    """Store the task arguments; progress is switched off and a given max_cable_length is coerced to float."""
+    super().__init__(
+      cloudpath, shard_no, dust_threshold, tick_threshold,
+      frag_path, cache, spatial_index_db, max_cable_length
+    )
+    self.progress = False
+    self.max_cable_length = None if max_cable_length is None else float(max_cable_length)
+
+  def execute(self):
+    """Gather the fragments of every label in shard shard_no, merge them and upload the single resulting shard file."""
+    # cache is necessary for local computation, but on GCE download is very fast
+    # so cache isn't necessary.
+    cv = CloudVolume(
+      self.cloudpath, 
+      progress=self.progress,
+      spatial_index_db=self.spatial_index_db,
+      cache=self.cache
+    )
+
+    # This looks messy because we are trying to avoid retaining
+    # unnecessary memory. In the original iteration, this was 
+    # using 50 GB+ memory on minnie65. With changes to this
+    # and the spatial_index, we are getting it down to something reasonable.
+    locations = self.locations_for_labels(
+      labels_for_shard(cv, self.shard_no, self.progress), 
+      cv
+    )
+    filenames = set(itertools.chain(*locations.values()))
+    labels = set(locations.keys())
+    del locations
+    skeletons = self.get_unfused(labels, filenames, cv, self.frag_path)
+    del labels
+    del filenames
+    skeletons = self.process_skeletons(skeletons, in_place=True)
+    if len(skeletons) == 0:
+      return
+
+    shard_files = synthesize_shard_files(cv.skeleton.reader.spec, skeletons)
+
+    if len(shard_files) != 1:
+      raise ValueError(
+        "Only one shard file should be generated per task. Expected: {} Got: {} ".format(
+          str(self.shard_no), ", ".join(shard_files.keys())
+      ))
+
+    cf = CloudFiles(cv.skeleton.meta.layerpath, progress=self.progress)
+    cf.puts( 
+      ( (fname, data) for fname, data in shard_files.items() ),
+      compress=False,
+      content_type='application/octet-stream',
+      cache_control='no-cache',      
+    )
+
+  def process_skeletons(self, unfused_skeletons, in_place=False):
+    """Merge the fragments of each label into precomputed bytes; in_place overwrites the values of the input dict."""
+    skeletons = {}
+    if in_place:
+      skeletons = unfused_skeletons
+    for label in tqdm(unfused_skeletons.keys(), desc="Postprocessing", disable=(not self.progress)):
+      skels = unfused_skeletons[label]
+      skel = Skeleton.simple_merge(skels)
+      skel.id = label
+      skel.extra_attributes = [ 
+        attr for attr in skel.extra_attributes \
+        if attr['data_type'] == 'float32' 
+      ]
+      skel = skel.consolidate()
+      # if self.max_cable_length is not None and skel.cable_length() > self.max_cable_length:
+      #   skeletons[label] = skel.to_precomputed()
+      # else:
+      #   skeletons[label] = kimimaro.postprocess(
+      #     skel, 
+      #     dust_threshold=self.dust_threshold, # voxels 
+      #     tick_threshold=self.tick_threshold, # nm
+      #   ).to_precomputed()
+      skeletons[label] = skel.to_precomputed()
+
+    return skeletons
+
+  def get_unfused(self, labels, filenames, cv, frag_path):
+    """
+    Read the fragment files and collect the skeleton pieces of each label.
+
+    frag_path overrides cv.cloudpath as the location of the fragments.
+    Returns: { label: [ Skeleton, ... ] } for labels found in some file
+    """
+    filenames = [
+      cv.meta.join(cv.skeleton.meta.skeleton_path, loc) for loc in filenames
+    ]
+
+    block_size = 50
+    if len(filenames) < block_size:
+      blocks = [ filenames ]
+    else:
+      blocks = sip(filenames, block_size)
+    # round up so that a trailing partial block is counted in the progress total
+    n_blocks = max((len(filenames) + block_size - 1) // block_size, 1)
+
+    frag_prefix = frag_path or cv.cloudpath
+    local_input = paths.extract(frag_prefix).protocol == "file"
+    if local_input:
+      frag_prefix = frag_prefix.replace("file://", "", 1)
+
+    all_skels = defaultdict(list)
+    for filenames_block in tqdm(blocks, desc="Filename Block", total=n_blocks, disable=(not self.progress)):
+      for filename in tqdm(filenames_block, desc="Scanning Fragments", disable=(not self.progress)):
+        if local_input:
+          content = open(os.path.join(frag_prefix, filename), "rb")
+        else:
+          content = CloudFile(cv.meta.join(frag_prefix, filename), cache_meta=True)
+        # one handle at a time, released even if a fragment fails to parse
+        try:
+          fragment = MapBuffer(content, frombytesfn=Skeleton.from_precomputed)
+          for label in labels:
+            try:
+              skel = fragment[label]
+            except KeyError:
+              continue
+            skel.id = label
+            all_skels[label].append(skel)
+        finally:
+          if hasattr(content, "close"):
+            content.close()
+
+    return all_skels
+
+  def locations_for_labels(self, labels, cv):
+    """Map each label to '.frags' filenames derived from its '.spatial' index files (bbox divided by the skeleton mip resolution)."""
+    index_filenames = cv.skeleton.spatial_index.file_locations_per_label(labels)
+    for locations in index_filenames.values():
+      for i, location in enumerate(locations):
+        bbx = Bbox.from_filename(re.sub(r'\.spatial$', '', location))
+        bbx /= cv.meta.resolution(cv.skeleton.meta.mip)
+        locations[i] = bbx.to_filename() + '.frags'
+    return index_filenames
+
+def labels_for_shard(cv, shard_no, progress):
+  """
+  Return the labels that belong to shard `shard_no`.
+
+  Uses the precalculated `<shard_no>.labels` file when present (faster).
+  Otherwise every label in the spatial index is tested against the
+  shard specification (much slower).
+  """
+  precalculated = CloudFiles(cv.skeleton.meta.layerpath).get_json(shard_no + '.labels')
+  if precalculated is not None:
+    return precalculated
+
+  candidates = cv.skeleton.spatial_index.query(cv.bounds * cv.resolution)
+  spec = cv.skeleton.reader.spec
+  candidates = tqdm(candidates, desc="Computing Shard Numbers", disable=(not progress))
+  return [ lbl for lbl in candidates if spec.compute_shard_location(lbl).shard_number == shard_no ]
+
+@queueable
+def ShardedFromUnshardedSkeletonMergeTask(
+  src:str,
+  dest:str,
+  shard_no:str,
+  cache_control:bool = False,
+  skel_dir:Optional[str] = None,
+  progress:bool = False,
+):
+  """
+  Build shard `shard_no` of dest from the unsharded skeletons of src.
+  skel_dir defaults to the 'skeletons' entry of the src info, if present.
+  """
+  cv_src = CloudVolume(src)
+  if skel_dir is None and 'skeletons' in cv_src.info:
+    skel_dir = cv_src.info['skeletons']
+  cv_dest = CloudVolume(dest, skel_dir=skel_dir, progress=progress)
+  labels = labels_for_shard(cv_dest, shard_no, progress)
+  skeletons = cv_src.skeleton.get(labels)
+  del labels
+
+  if len(skeletons) == 0:
+    return
+
+  skeletons = strip_integer_attributes(skeletons)
+  skeletons = { skel.id: skel.to_precomputed() for skel in skeletons }
+  shard_files = synthesize_shard_files(cv_dest.skeleton.reader.spec, skeletons)
+
+  if len(shard_files) != 1:
+    raise ValueError(
+      "Only one shard file should be generated per task. Expected: {} Got: {} ".format(
+        str(shard_no), ", ".join(shard_files.keys())
+    ))
+  cf = CloudFiles(cv_dest.skeleton.meta.layerpath, progress=progress)
+  cf.puts(
+    ( (fname, data) for fname, data in shard_files.items() ),
+    compress=False,
+    content_type='application/octet-stream',
+    cache_control='no-cache',
+  )
+
+@queueable
+def DeleteSkeletonFilesTask(
+  cloudpath:str,
+  prefix:str,
+  skel_dir:Optional[str] = None
+):
+  """Delete every file under the skeleton layer path whose name starts with prefix."""
+  skeleton_files = CloudFiles(CloudVolume(cloudpath, skel_dir=skel_dir).skeleton.meta.layerpath)
+  skeleton_files.delete(skeleton_files.list(prefix=prefix))
+
+
+@queueable
+def TransferSkeletonFilesTask(
+  src:str,
+  dest:str,
+  prefix:str,
+  skel_dir:Optional[str] = None
+):
+  """
+  Copy the skeleton files of src whose names start with prefix into
+  the skeleton layer path of dest (skel_dir applies to dest only).
+  """
+  source = CloudFiles(CloudVolume(src).skeleton.meta.layerpath)
+  target = CloudFiles(CloudVolume(dest, skel_dir=skel_dir).skeleton.meta.layerpath)
+  source.transfer_to(target, paths=source.list(prefix=prefix))
diff --git a/igneous_cli/cli.py b/igneous_cli/cli.py
index 5a17e87f..c6688f6d 100644
--- a/igneous_cli/cli.py
+++ b/igneous_cli/cli.py
@@ -1302,6 +1302,7 @@ def skeletongroup():
 @click.option('--timestamp', type=int, default=None, help="(graphene) Use the proofreading state at this UNIX timestamp.", show_default=True)
 @click.option('--root-ids', type=CloudPath(), default=None, help="(graphene) If you have a materialization of graphene root ids for this timepoint, it's more efficient to use it than making requests to the graphene server.", show_default=True)
 @click.option('--progress', is_flag=True, default=False, help="Print progress bars.", show_default=True)
+@click.option('--split-at-branches', is_flag=True, default=False, help="Split skeletons at branch points. Surface-touching fragments get original IDs and will be merged across chunks. Interior skeletons get unique IDs and are finalized.", show_default=True)
 @click.pass_context
 def skeleton_forge(
   ctx, path, queue, mip, shape, 
@@ -1310,7 +1311,7 @@ def skeleton_forge(
   fill_holes, scale, const, soma_detect, soma_accept,
   soma_scale, soma_const, max_paths, sharded, labels,
   cross_section, output, timestamp, root_ids, progress,
-  cross_section_label_repair_sec,
+  cross_section_label_repair_sec, split_at_branches,
 ):
   """
   (1) Synthesize skeletons from segmentation cutouts.
@@ -1358,6 +1359,7 @@ def skeleton_forge(
     frag_path=output, fix_autapses=fix_autapses,
     timestamp=timestamp, root_ids_cloudpath=root_ids,
     cross_sectional_area_repair_sec_per_label=cross_section_label_repair_sec,
+    split_at_branches=split_at_branches,
   )
 
   enqueue_tasks(ctx, queue, tasks)

From e0cce011f9fe050320aec19cb82f57af5833570c Mon Sep 17 00:00:00 2001
From: Wan-Qing Yu <wanqing.yu@alleninstitute.org>
Date: Tue, 7 Oct 2025 11:21:22 -0700
Subject: [PATCH 3/6] fix a typo in skel xfer task

---
 .dockerignore                             |   0
 .github/workflows/docker-image.yml        |   0
 .github/workflows/test-suite.yml          |   0
 CITATION.cff                              |   0
 LICENSE                                   |   0
 igneous/shards.py                         |   0
 igneous/task_creation/__init__.py         |   0
 igneous/task_creation/common.py           |   0
 igneous/task_creation/image.py            |   0
 igneous/task_creation/mesh.py             |   0
 igneous/task_creation/obsolete.py         |   0
 igneous/task_creation/skeleton.py         |   0
 igneous/tasks/__init__.py                 |   0
 igneous/tasks/image/__init__.py           |   0
 igneous/tasks/image/ccl.py                |   0
 igneous/tasks/image/obsolete.py           |   0
 igneous/tasks/mesh/__init__.py            |   0
 igneous/tasks/mesh/draco.py               |   0
 igneous/tasks/mesh/mesh.py                |   0
 igneous/tasks/mesh/mesh_graphene_remap.py |   0
 igneous/tasks/mesh/multires.py            |   0
 igneous/tasks/skeleton.py                 |   4 ++--
 igneous/tasks/skeleton_mod.py             |   0
 igneous/tasks/skeleton_ori.py             |   0
 igneous/tasks/spatial_index.py            |   0
 igneous/types.py                          |   0
 igneous_cli/LICENSE                       |   0
 igneous_cli/__init__.py                   |   0
 igneous_cli/cli.py                        |   0
 igneous_cli/humanbytes.py                 |   0
 pyproject.toml                            |   0
 test/connectomics.npy.ckl.gz              | Bin
 test/test_ccl_tasks.py                    |   0
 test/test_shards.py                       |   0
 test/test_transfer_tasks.py               |   0
 35 files changed, 2 insertions(+), 2 deletions(-)
 mode change 100644 => 100755 .dockerignore
 mode change 100644 => 100755 .github/workflows/docker-image.yml
 mode change 100644 => 100755 .github/workflows/test-suite.yml
 mode change 100644 => 100755 CITATION.cff
 mode change 100644 => 100755 LICENSE
 mode change 100644 => 100755 igneous/shards.py
 mode change 100644 => 100755 igneous/task_creation/__init__.py
 mode change 100644 => 100755 igneous/task_creation/common.py
 mode change 100644 => 100755 igneous/task_creation/image.py
 mode change 100644 => 100755 igneous/task_creation/mesh.py
 mode change 100644 => 100755 igneous/task_creation/obsolete.py
 mode change 100644 => 100755 igneous/task_creation/skeleton.py
 mode change 100644 => 100755 igneous/tasks/__init__.py
 mode change 100644 => 100755 igneous/tasks/image/__init__.py
 mode change 100644 => 100755 igneous/tasks/image/ccl.py
 mode change 100644 => 100755 igneous/tasks/image/obsolete.py
 mode change 100644 => 100755 igneous/tasks/mesh/__init__.py
 mode change 100644 => 100755 igneous/tasks/mesh/draco.py
 mode change 100644 => 100755 igneous/tasks/mesh/mesh.py
 mode change 100644 => 100755 igneous/tasks/mesh/mesh_graphene_remap.py
 mode change 100644 => 100755 igneous/tasks/mesh/multires.py
 mode change 100644 => 100755 igneous/tasks/skeleton.py
 mode change 100644 => 100755 igneous/tasks/skeleton_mod.py
 mode change 100644 => 100755 igneous/tasks/skeleton_ori.py
 mode change 100644 => 100755 igneous/tasks/spatial_index.py
 mode change 100644 => 100755 igneous/types.py
 mode change 100644 => 100755 igneous_cli/LICENSE
 mode change 100644 => 100755 igneous_cli/__init__.py
 mode change 100644 => 100755 igneous_cli/cli.py
 mode change 100644 => 100755 igneous_cli/humanbytes.py
 mode change 100644 => 100755 pyproject.toml
 mode change 100644 => 100755 test/connectomics.npy.ckl.gz
 mode change 100644 => 100755 test/test_ccl_tasks.py
 mode change 100644 => 100755 test/test_shards.py
 mode change 100644 => 100755 test/test_transfer_tasks.py

diff --git a/.dockerignore b/.dockerignore
old mode 100644
new mode 100755
diff --git a/.github/workflows/docker-image.yml b/.github/workflows/docker-image.yml
old mode 100644
new mode 100755
diff --git a/.github/workflows/test-suite.yml b/.github/workflows/test-suite.yml
old mode 100644
new mode 100755
diff --git a/CITATION.cff b/CITATION.cff
old mode 100644
new mode 100755
diff --git a/LICENSE b/LICENSE
old mode 100644
new mode 100755
diff --git a/igneous/shards.py b/igneous/shards.py
old mode 100644
new mode 100755
diff --git a/igneous/task_creation/__init__.py b/igneous/task_creation/__init__.py
old mode 100644
new mode 100755
diff --git a/igneous/task_creation/common.py b/igneous/task_creation/common.py
old mode 100644
new mode 100755
diff --git a/igneous/task_creation/image.py b/igneous/task_creation/image.py
old mode 100644
new mode 100755
diff --git a/igneous/task_creation/mesh.py b/igneous/task_creation/mesh.py
old mode 100644
new mode 100755
diff --git a/igneous/task_creation/obsolete.py b/igneous/task_creation/obsolete.py
old mode 100644
new mode 100755
diff --git a/igneous/task_creation/skeleton.py b/igneous/task_creation/skeleton.py
old mode 100644
new mode 100755
diff --git a/igneous/tasks/__init__.py b/igneous/tasks/__init__.py
old mode 100644
new mode 100755
diff --git a/igneous/tasks/image/__init__.py b/igneous/tasks/image/__init__.py
old mode 100644
new mode 100755
diff --git a/igneous/tasks/image/ccl.py b/igneous/tasks/image/ccl.py
old mode 100644
new mode 100755
diff --git a/igneous/tasks/image/obsolete.py b/igneous/tasks/image/obsolete.py
old mode 100644
new mode 100755
diff --git a/igneous/tasks/mesh/__init__.py b/igneous/tasks/mesh/__init__.py
old mode 100644
new mode 100755
diff --git a/igneous/tasks/mesh/draco.py b/igneous/tasks/mesh/draco.py
old mode 100644
new mode 100755
diff --git a/igneous/tasks/mesh/mesh.py b/igneous/tasks/mesh/mesh.py
old mode 100644
new mode 100755
diff --git a/igneous/tasks/mesh/mesh_graphene_remap.py b/igneous/tasks/mesh/mesh_graphene_remap.py
old mode 100644
new mode 100755
diff --git a/igneous/tasks/mesh/multires.py b/igneous/tasks/mesh/multires.py
old mode 100644
new mode 100755
diff --git a/igneous/tasks/skeleton.py b/igneous/tasks/skeleton.py
old mode 100644
new mode 100755
index a8959179..5267de32
--- a/igneous/tasks/skeleton.py
+++ b/igneous/tasks/skeleton.py
@@ -1258,8 +1258,8 @@ def ShardedFromUnshardedSkeletonMergeTask(
 ):
   cv_src = CloudVolume(src)
 
-  if skel_dir is None and 'skeletons' in cv.info:
-    skel_dir = cv.info['skeletons']
+  if skel_dir is None and 'skeletons' in cv_src.info:
+    skel_dir = cv_src.info['skeletons']
 
   cv_dest = CloudVolume(dest, skel_dir=skel_dir, progress=progress)
 
diff --git a/igneous/tasks/skeleton_mod.py b/igneous/tasks/skeleton_mod.py
old mode 100644
new mode 100755
diff --git a/igneous/tasks/skeleton_ori.py b/igneous/tasks/skeleton_ori.py
old mode 100644
new mode 100755
diff --git a/igneous/tasks/spatial_index.py b/igneous/tasks/spatial_index.py
old mode 100644
new mode 100755
diff --git a/igneous/types.py b/igneous/types.py
old mode 100644
new mode 100755
diff --git a/igneous_cli/LICENSE b/igneous_cli/LICENSE
old mode 100644
new mode 100755
diff --git a/igneous_cli/__init__.py b/igneous_cli/__init__.py
old mode 100644
new mode 100755
diff --git a/igneous_cli/cli.py b/igneous_cli/cli.py
old mode 100644
new mode 100755
diff --git a/igneous_cli/humanbytes.py b/igneous_cli/humanbytes.py
old mode 100644
new mode 100755
diff --git a/pyproject.toml b/pyproject.toml
old mode 100644
new mode 100755
diff --git a/test/connectomics.npy.ckl.gz b/test/connectomics.npy.ckl.gz
old mode 100644
new mode 100755
diff --git a/test/test_ccl_tasks.py b/test/test_ccl_tasks.py
old mode 100644
new mode 100755
diff --git a/test/test_shards.py b/test/test_shards.py
old mode 100644
new mode 100755
diff --git a/test/test_transfer_tasks.py b/test/test_transfer_tasks.py
old mode 100644
new mode 100755

From 5f344e3ee8f95da3f8db6a47d20a6769d70095fb Mon Sep 17 00:00:00 2001
From: Wan-Qing Yu <wanqing.yu@alleninstitute.org>
Date: Wed, 8 Oct 2025 18:59:39 -0700
Subject: [PATCH 4/6] update connected component and only keep skeletons that
 touch interior surfaces

---
 igneous/tasks/skeleton.py | 283 ++++++++++++++++++--------------------
 1 file changed, 134 insertions(+), 149 deletions(-)

diff --git a/igneous/tasks/skeleton.py b/igneous/tasks/skeleton.py
index 5267de32..dd2f0568 100755
--- a/igneous/tasks/skeleton.py
+++ b/igneous/tasks/skeleton.py
@@ -175,6 +175,7 @@ def execute(self):
       else:
         path = self.frag_path
 
+    # to do: needs to handle corrupted data gracefully
     all_labels, mapping = vol.download(           
       bbox.to_slices(), 
       agglomerate=True, 
@@ -625,215 +626,199 @@ def reprocess_skel(pts, skel):
   def split_and_reassign_ids(self, skeletons, vol, bbox):
     """
     Split skeletons at branch points.
-    Keep label=1 for surface-touching fragments (need merging).
-    Assign unique IDs to interior skeletons (finalized).
+    Keep label=1 for INTERIOR-surface-touching fragments (need merging).
+    Assign unique IDs to other skeletons (finalized).
     """
-    surface_fragments = []  # Will all become label=1
-    interior_skeletons = {}  # Get unique IDs
+    surface_fragments = []
+    interior_skeletons = {}
     
     next_interior_id = self.generate_base_id_for_chunk()
-    print(f"DEBUG: Processing {len(skeletons)} original skeletons in chunk {self.chunk_index}")
-    print(f"DEBUG: Base ID for interior skeletons: {next_interior_id}")
-    print(f"DEBUG: Chunk bbox: {bbox}")
-    print(f"DEBUG: Volume resolution: {vol.resolution}")
     
-    for label, skel in skeletons.items():
-        print(f"DEBUG: Processing skeleton {label} with {len(skel.vertices)} vertices")
-        
-        # Debug: Check original skeleton boundary touching
-        touches_original = self.skeleton_touches_surface(skel, vol.resolution)
-        print(f"DEBUG: Original skeleton {label} touches surface: {touches_original}")
+    if self.progress:
+        print(f"Processing {len(skeletons)} skeletons in chunk {self.chunk_index}")
+        print(f"Base ID for interior skeletons: {next_interior_id}")
         
+        # Debug: show which faces are interior
+        interior_faces = self.get_interior_faces(vol)
+        face_names = ['min_x', 'max_x', 'min_y', 'max_y', 'min_z', 'max_z']
+        interior_face_names = [name for name, is_interior in zip(face_names, interior_faces) if is_interior]
+        print(f"Interior faces for this chunk: {interior_face_names}")
+    
+    for label, skel in skeletons.items():
+        if len(skel.vertices) == 0 or len(skel.edges) == 0:
+            if self.progress:
+                print(f"Skipping empty skeleton {label}")
+            continue
+            
         # Split at branches
         sub_skels = self.split_skeleton_at_branches(skel)
-        print(f"DEBUG: Split into {len(sub_skels)} sub-skeletons")
         
         for i, sub_skel in enumerate(sub_skels):
-            print(f"DEBUG: Sub-skeleton {i} has {len(sub_skel.vertices)} vertices")
-            # Add safety check for empty skeletons
             if len(sub_skel.vertices) == 0 or len(sub_skel.edges) == 0:
-                print(f"DEBUG: Sub-skeleton {i} is empty, skipping")
                 continue
             
-            # Debug vertex positions
-            vertices_voxels = sub_skel.vertices / vol.resolution
-            min_coords = np.min(vertices_voxels, axis=0)
-            max_coords = np.max(vertices_voxels, axis=0)
-            print(f"DEBUG: Sub-skeleton {i} vertex range: min={min_coords}, max={max_coords}")
+            # Check if touches INTERIOR surfaces only
+            touches_interior_surface = self.skeleton_touches_interior_surface(
+                sub_skel, vol.resolution, vol
+            )
             
-            touches_surface = self.skeleton_touches_surface(sub_skel, vol.resolution)
-            print(f"DEBUG: Sub-skeleton {i} touches surface: {touches_surface}")
-            
-            if touches_surface:
-                print(f"DEBUG: Sub-skeleton {i} -> SURFACE FRAGMENT (ID=1)")
+            if touches_interior_surface:
+                if self.progress:
+                    print(f"Sub-skeleton {i} -> SURFACE FRAGMENT (ID=1) - touches interior boundary")
                 surface_fragments.append(sub_skel)
             else:
-                print(f"DEBUG: Sub-skeleton {i} -> INTERIOR SKELETON (ID={next_interior_id})")
+                if self.progress:
+                    print(f"Sub-skeleton {i} -> INTERIOR SKELETON (ID={next_interior_id}) - no interior boundary contact")
                 sub_skel.id = next_interior_id
                 interior_skeletons[next_interior_id] = sub_skel
                 next_interior_id += 1
     
-    print(f"DEBUG: Final counts - Surface fragments: {len(surface_fragments)}, Interior skeletons: {len(interior_skeletons)}")
-    print(f"DEBUG: Interior skeleton IDs: {list(interior_skeletons.keys())}")
-    
-    # Merge all surface fragments into single label=1 skeleton
+    # Merge surface fragments and return result
     result = {}
     if surface_fragments:
         if len(surface_fragments) == 1:
             result[1] = surface_fragments[0]
             result[1].id = 1
         else:
-            # Use osteoid.Skeleton.simple_merge
             from osteoid import Skeleton
             merged = Skeleton.simple_merge(surface_fragments)
             merged.id = 1
             result[1] = merged
     
-    # Add all interior skeletons
     result.update(interior_skeletons)
-    
     return result
   
   def split_skeleton_at_branches(self, skeleton):
     """
-    Split skeleton at branch points by removing branch nodes and finding connected components.
-    Works with osteoid.Skeleton objects from Kimimaro.
+    Split skeleton at branch points using osteoid.Skeleton's components() method.
     """
-    # Get branch nodes using osteoid.Skeleton method
+    # Get branch nodes
     branch_nodes = skeleton.branches()
     
     if len(branch_nodes) == 0:
         return [skeleton]
     
-    # Create mask to remove branch nodes
-    mask = np.ones(len(skeleton.vertices), dtype=bool)
+    # Create a copy without branch nodes
+    from osteoid import Skeleton
+    temp_skeleton = skeleton.clone()
+    
+    # Remove branch nodes (this should disconnect the skeleton)
+    mask = np.ones(len(temp_skeleton.vertices), dtype=bool)
     mask[branch_nodes] = False
-
-    # Create a mapping from old indices to new indices
-    old_to_new_indices = np.full(len(skeleton.vertices), -1, dtype=int)
-    old_to_new_indices[mask] = np.arange(np.sum(mask))
-
-    # Get vertices without branch nodes
-    filtered_vertices = skeleton.vertices[mask]
-    filtered_radius = skeleton.radius[mask] if skeleton.radius is not None else None
-
-    # Remove edges that contain branch nodes
-    valid_edges = skeleton.edges[~np.isin(skeleton.edges, branch_nodes).any(axis=1)]
-
-    if len(valid_edges) == 0:
-        return []
-
-    # Remap the edges to the new vertex indices
-    remapped_edges = old_to_new_indices[valid_edges]
-
-    # Find connected components in the filtered graph
-    components = self._find_connected_components(remapped_edges, len(filtered_vertices))
-
-    # Create new skeletons for each component
-    sub_skeletons = []
-    for i, component in enumerate(components):
-        if len(component) < 2:
-            continue
-            
-        # Create mapping for this component
-        component_old_to_new = {old_idx: new_idx for new_idx, old_idx in enumerate(component)}
-        
-        # Extract vertices and radius for this component
-        component_vertices = filtered_vertices[component]
-        component_radius = filtered_radius[component] if filtered_radius is not None else None
-        
-        # Extract edges for this component
-        component_edges = []
-        for edge in remapped_edges:
-            if edge[0] in component_old_to_new and edge[1] in component_old_to_new:
-                new_edge = [component_old_to_new[edge[0]], component_old_to_new[edge[1]]]
-                component_edges.append(new_edge)
-        
-        if len(component_edges) > 0:
-            # Create new osteoid.Skeleton - use the correct constructor
-            from osteoid import Skeleton
-            new_skeleton = Skeleton()
-            new_skeleton.vertices = component_vertices.copy()
-            new_skeleton.edges = np.array(component_edges, dtype=skeleton.edges.dtype)
-            if component_radius is not None:
-                new_skeleton.radius = component_radius.copy()
-            new_skeleton.id = f"{skeleton.id}_{i}" if hasattr(skeleton, 'id') else f"skel_{i}"
-            
-            # Copy other attributes if they exist
-            if hasattr(skeleton, 'vertex_types') and skeleton.vertex_types is not None:
-                try:
-                    new_skeleton.vertex_types = skeleton.vertex_types[mask][component].copy()
-                except:
-                    pass  # vertex_types might not be compatible
-            
-            sub_skeletons.append(new_skeleton)
     
-    return sub_skeletons if sub_skeletons else []
-  
-  def _find_connected_components(self, edges, num_vertices):
+    # Filter vertices and edges
+    temp_skeleton.vertices = temp_skeleton.vertices[mask]
+    if temp_skeleton.radius is not None:
+        temp_skeleton.radius = temp_skeleton.radius[mask]
+    
+    # Remove edges containing branch nodes
+    valid_edges = temp_skeleton.edges[~np.isin(temp_skeleton.edges, branch_nodes).any(axis=1)]
+    
+    # Remap edge indices
+    old_to_new = np.full(len(skeleton.vertices), -1, dtype=int)
+    old_to_new[mask] = np.arange(np.sum(mask))
+    temp_skeleton.edges = old_to_new[valid_edges]
+    
+    # Use components() to get disconnected parts
+    components = temp_skeleton.components()
+    
+    # Filter and return valid components
+    return [comp for comp in components if len(comp.vertices) >= 2 and len(comp.edges) > 0]
+
+  def get_interior_faces_from_coords(self):
     """
-    Find connected components using Union-Find (Disjoint Set Union).
-    Returns list of components, where each component is a list of vertex indices.
+    Determine interior faces using chunk coordinates (more reliable if available).
     """
-    # Initialize Union-Find structure
-    parent = list(range(num_vertices))
+    if (self.chunk_coords is None or 
+        self.global_chunks_per_dim is None):
+        return None
     
-    def find(x):
-        if parent[x] != x:
-            parent[x] = find(parent[x])  # Path compression
-        return parent[x]
+    cx, cy, cz = self.chunk_coords
+    chunks_x, chunks_y, chunks_z = self.global_chunks_per_dim
     
-    def union(x, y):
-        root_x = find(x)
-        root_y = find(y)
-        if root_x != root_y:
-            parent[root_x] = root_y
-    
-    # Union vertices connected by edges
-    for edge in edges:
-        union(edge[0], edge[1])
+    interior_faces = [
+        cx > 0,                    # min_x face is interior
+        cx < chunks_x - 1,         # max_x face is interior
+        cy > 0,                    # min_y face is interior  
+        cy < chunks_y - 1,         # max_y face is interior
+        cz > 0,                    # min_z face is interior
+        cz < chunks_z - 1,         # max_z face is interior
+    ]
     
-    # Group vertices by their root parent
-    from collections import defaultdict
-    components_dict = defaultdict(list)
-    for vertex in range(num_vertices):
-        root = find(vertex)
-        components_dict[root].append(vertex)
+    return interior_faces
+
+  def get_interior_faces(self, vol):
+    """
+    Determine which chunk faces are interior with fallback methods.
+    """
+    # Try coordinate-based method first (more reliable)
+    interior_faces = self.get_interior_faces_from_coords()
+    if interior_faces is not None:
+        return interior_faces
     
-    # Convert to list of components
-    components = list(components_dict.values())
+    # Fallback to bbox comparison
+    chunk_bbox = self.bounds
     
-    # Filter out single-vertex components (isolated vertices)
-    components = [comp for comp in components if len(comp) > 1]
+    # Parse volume_bounds if it's a string
+    if isinstance(self.volume_bounds, str):
+        import json
+        volume_bounds_dict = json.loads(self.volume_bounds)
+        from cloudvolume.lib import Bbox, Vec
+        volume_bbox = Bbox(
+            Vec(*volume_bounds_dict['minpt']),
+            Vec(*volume_bounds_dict['maxpt'])
+        )
+    elif self.volume_bounds is not None:
+        volume_bbox = self.volume_bounds
+    else:
+        volume_bbox = vol.bounds
     
-    return components
+    # Add small epsilon to handle floating point precision
+    epsilon = vol.resolution.min() * 0.1
     
-  def skeleton_touches_surface(self, skeleton, resolution, tolerance_voxels=1):
-    """Check if any vertex touches the chunk boundary in LOCAL VOXEL space."""
+    interior_faces = [
+        chunk_bbox.minpt.x > volume_bbox.minpt.x + epsilon,
+        chunk_bbox.maxpt.x < volume_bbox.maxpt.x - epsilon,
+        chunk_bbox.minpt.y > volume_bbox.minpt.y + epsilon,
+        chunk_bbox.maxpt.y < volume_bbox.maxpt.y - epsilon,
+        chunk_bbox.minpt.z > volume_bbox.minpt.z + epsilon,
+        chunk_bbox.maxpt.z < volume_bbox.maxpt.z - epsilon,
+    ]
     
-    # Vertices are already in local voxel coordinates at this point
+    return interior_faces
+  
+  def skeleton_touches_interior_surface(self, skeleton, resolution, vol, tolerance_voxels=1):
+    """
+    Check if skeleton touches any INTERIOR chunk boundary (excludes volume boundaries).
+    """
     vertices_voxels = skeleton.vertices / resolution
-    
-    # Get chunk shape directly
     chunk_shape = Vec(*self.shape)
     
-    print(f"DEBUG SURFACE: Checking {len(vertices_voxels)} vertices")
-    print(f"DEBUG SURFACE: Chunk shape: {chunk_shape}")
-    print(f"DEBUG SURFACE: Local bounds: [0,0,0] to {chunk_shape}")
-    print(f"DEBUG SURFACE: Tolerance: {tolerance_voxels} voxels")
+    # Get which faces are interior (connect to other chunks)
+    interior_faces = self.get_interior_faces(vol)
+    
+    print(f"DEBUG SURFACE: Interior faces: {interior_faces}")
+    print(f"DEBUG SURFACE: [min_x, max_x, min_y, max_y, min_z, max_z]")
     
-    # Check against local chunk boundaries (0 to chunk_shape in each dimension)
+    # Check each dimension, but only interior faces
     for dim in range(3):
-        # Check if vertices touch the minimum boundary (near 0)
-        near_min = np.any(vertices_voxels[:, dim] <= tolerance_voxels)
-        # Check if vertices touch the maximum boundary (near chunk_shape)
-        near_max = np.any(vertices_voxels[:, dim] >= chunk_shape[dim] - tolerance_voxels)
+        min_face_idx = dim * 2      # 0, 2, 4 for x, y, z min faces
+        max_face_idx = dim * 2 + 1  # 1, 3, 5 for x, y, z max faces
         
-        if near_min or near_max:
-            print(f"DEBUG SURFACE: SURFACE TOUCH detected in dimension {dim}")
-            return True
+        # Only check interior faces
+        if interior_faces[min_face_idx]:  # min face is interior
+            near_min = np.any(vertices_voxels[:, dim] <= tolerance_voxels)
+            if near_min:
+                print(f"DEBUG SURFACE: INTERIOR SURFACE TOUCH detected at min face of dimension {dim}")
+                return True
+                
+        if interior_faces[max_face_idx]:  # max face is interior  
+            near_max = np.any(vertices_voxels[:, dim] >= chunk_shape[dim] - tolerance_voxels)
+            if near_max:
+                print(f"DEBUG SURFACE: INTERIOR SURFACE TOUCH detected at max face of dimension {dim}")
+                return True
     
-    print(f"DEBUG SURFACE: NO SURFACE TOUCH detected")
+    print(f"DEBUG SURFACE: NO INTERIOR SURFACE TOUCH detected")
     return False
     
   def generate_base_id_for_chunk(self):

From 79cd074aa76e1ca51c957b82512f3376d26d4616 Mon Sep 17 00:00:00 2001
From: Wan-Qing Yu <wanqing.yu@alleninstitute.org>
Date: Wed, 8 Oct 2025 19:06:25 -0700
Subject: [PATCH 5/6] remove temp files

---
 igneous/tasks/skeleton_mod.py | 1292 ---------------------------------
 igneous/tasks/skeleton_ori.py |  914 -----------------------
 2 files changed, 2206 deletions(-)
 delete mode 100755 igneous/tasks/skeleton_mod.py
 delete mode 100755 igneous/tasks/skeleton_ori.py

diff --git a/igneous/tasks/skeleton_mod.py b/igneous/tasks/skeleton_mod.py
deleted file mode 100755
index 3671987c..00000000
--- a/igneous/tasks/skeleton_mod.py
+++ /dev/null
@@ -1,1292 +0,0 @@
-from typing import Optional, Sequence, Dict, List
-
-from functools import reduce
-import itertools
-import json
-import mmap
-import pickle
-import posixpath
-import os
-import re
-from collections import defaultdict
-
-from tqdm import tqdm
-
-import numpy as np
-
-import mapbuffer
-from mapbuffer import MapBuffer, IntMap
-import cloudfiles
-from cloudfiles import CloudFiles, CloudFile
-
-import cloudvolume
-from cloudvolume import CloudVolume, Skeleton, paths
-from cloudvolume.lib import Vec, Bbox, sip, xyzrange
-from cloudvolume.datasource.precomputed.sharding import synthesize_shard_files
-
-import cc3d
-import crackle
-import fastmorph
-import fastremap
-import kimimaro
-
-from taskqueue import RegisteredTask, queueable
-
-SEGIDRE = re.compile(r'/(\d+):.*?$')
-
-def filename_to_segid(filename):
-  matches = SEGIDRE.search(filename)
-  if matches is None:
-    raise ValueError("There was an issue with the fragment filename: " + filename)
-
-  segid, = matches.groups()
-  return int(segid)
-
-def strip_integer_attributes(skeletons):
-  for skel in skeletons:
-    skel.extra_attributes = [ 
-    attr for attr in skel.extra_attributes 
-    if attr['data_type'] in ('float32', 'float64')
-  ]
-  return skeletons
-
-class SkeletonTask(RegisteredTask):
-  """
-  Stage 1 of skeletonization.
-
-  Convert chunks of segmentation into chunked skeletons and point clouds.
-  They will be merged in the stage 2 task SkeletonMergeTask.
-  """
-  def __init__(
-    self, cloudpath:str, 
-    shape:Sequence[int], offset:Sequence[int], 
-    mip:int, teasar_params:dict, will_postprocess:bool,
-    info:dict = None, 
-    object_ids:Optional[Sequence[int]] = None,
-    mask_ids:Optional[Sequence[int]] = None,
-    fix_branching:bool = True,
-    fix_borders:bool = True,
-    fix_avocados:bool = False,
-    fill_holes:int = 0,
-    dust_threshold:int = 1000, 
-    progress:bool = False,
-    parallel:int = 1,
-    fill_missing:bool = False,
-    sharded:bool = False,
-    frag_path:Optional[str] = None, 
-    spatial_index:bool = True,
-    spatial_grid_shape:Optional[Sequence[int]] = None,
-    synapses:Optional[Sequence[Sequence[float]]] = None, 
-    dust_global:bool = False,
-    cross_sectional_area:bool = False,
-    cross_sectional_area_smoothing_window:int = 1,
-    cross_sectional_area_shape_delta:int = 150,
-    dry_run:bool = False,
-    strip_integer_attributes:bool = True,
-    fix_autapses:bool = False,
-    timestamp:Optional[int] = None,
-    root_ids_cloudpath:Optional[str] = None,
-  ):
-    super().__init__(
-      cloudpath, shape, offset, mip, 
-      teasar_params, will_postprocess, 
-      info, object_ids, mask_ids,
-      fix_branching, fix_borders, 
-      fix_avocados, fill_holes,
-      dust_threshold, progress, parallel,
-      fill_missing, bool(sharded), frag_path, bool(spatial_index),
-      spatial_grid_shape, synapses, bool(dust_global),
-      bool(cross_sectional_area), int(cross_sectional_area_smoothing_window),
-      int(cross_sectional_area_shape_delta),
-      bool(dry_run), bool(strip_integer_attributes),
-      bool(fix_autapses), timestamp,
-      root_ids_cloudpath,
-    )
-    if isinstance(self.frag_path, str):
-      self.frag_path = cloudfiles.paths.normalize(self.frag_path)
-    self.bounds = Bbox(offset, Vec(*shape) + Vec(*offset))
-    self.index_bounds = Bbox(offset, Vec(*spatial_grid_shape) + Vec(*offset))
-
-    # aggressive morphological hole filling has a 1-2vx 
-    # edge effect that needs to be cropped away
-    self.hole_filling_padding = (self.fill_holes >= 3) * 2
-
-  def execute(self):
-    # For graphene volumes, if we've materialized the root IDs
-    # into a static archive, let's use that because it's way more
-    # efficient for fetching root IDs.
-    cloudpath = self.cloudpath
-    if self.root_ids_cloudpath:
-      cloudpath = self.root_ids_cloudpath
-
-    lru_bytes = 0
-    lru_encoding = 'same'
-
-    if self.cross_sectional_area:
-      lru_bytes = self.bounds.size() + 2 * self.cross_sectional_area_shape_delta
-      lru_bytes = lru_bytes[0] * lru_bytes[1] * lru_bytes[2] * 8 // 500
-      lru_encoding = 'crackle'
-
-    vol = CloudVolume(
-      cloudpath,
-      mip=self.mip,
-      bounded=(self.hole_filling_padding == 0),
-      info=self.info,
-      cdn_cache=False,
-      parallel=self.parallel,
-      fill_missing=self.fill_missing,
-      lru_bytes=lru_bytes,
-      lru_encoding=lru_encoding,
-    )
-    bbox = Bbox.clamp(self.bounds, vol.bounds)
-    index_bbox = Bbox.clamp(self.index_bounds, vol.bounds)
-
-    bbox.minpt -= self.hole_filling_padding
-    bbox.maxpt += self.hole_filling_padding
-
-    path = vol.info.get("skeletons", "skeletons")
-    if self.frag_path is None:
-      path = vol.meta.join(self.cloudpath, path)
-    else:
-      # if the path is to a volume root, follow the info instructions,
-      # otherwise place the files exactly where frag path says to
-      test_path = CloudFiles(self.frag_path).join(self.frag_path, "info")
-      test_info = CloudFile(test_path).get_json()
-      if test_info is not None and 'scales' in test_info:
-        path = CloudFiles(self.frag_path).join(self.frag_path, path)
-      else:
-        path = self.frag_path
-
-    all_labels = vol.download(
-      bbox.to_slices(), 
-      agglomerate=True, 
-      timestamp=self.timestamp
-    )
-    all_labels = all_labels[:,:,:,0]
-
-    if self.mask_ids:
-      all_labels = fastremap.mask(all_labels, self.mask_ids)
-
-    extra_targets_after = {}
-    if self.synapses:
-      extra_targets_after = kimimaro.synapses_to_targets(
-        all_labels, self.synapses
-      )
-
-    dust_threshold = self.dust_threshold
-    if self.dust_global and dust_threshold > 0:
-      dust_threshold = 0
-      all_labels = self.apply_global_dust_threshold(vol, all_labels)
-
-    if self.fill_holes and self.fix_autapses:
-      raise ValueError("fill_holes is not currently compatible with fix_autapses")
-
-    voxel_graph = None
-    if self.fix_autapses:
-      voxel_graph = self.voxel_connectivity_graph(vol, bbox, all_labels)
-
-    skeletons = self.skeletonize(
-      all_labels, 
-      vol, 
-      dust_threshold, 
-      extra_targets_after, 
-      voxel_graph,
-    )
-    del all_labels
-
-    if self.cross_sectional_area: # This is expensive!
-      skeletons = self.compute_cross_sectional_area(vol, bbox, skeletons)
-
-    # voxel centered (+0.5) and uses more accurate bounding box from mip 0
-    corrected_offset = (bbox.minpt.astype(np.float32) - vol.meta.voxel_offset(self.mip) + 0.5) * vol.meta.resolution(self.mip)
-    corrected_offset += vol.meta.voxel_offset(0) * vol.meta.resolution(0)
-
-    for segid, skel in skeletons.items():
-      skel.vertices[:] += corrected_offset
-
-    if self.synapses:
-      for segid, skel in skeletons.items():
-        terminal_nodes = skel.vertices[ skel.terminals() ]
-
-        for i, vert in enumerate(terminal_nodes):
-          vert = vert / vol.resolution - self.bounds.minpt
-          vert = tuple(np.round(vert).astype(int))
-          if vert in extra_targets_after.keys():
-            skel.vertex_types[i] = extra_targets_after[vert]
-    
-    # old versions of neuroglancer don't
-    # support int attributes
-    if self.strip_integer_attributes:
-      strip_integer_attributes(skeletons.values())
-
-    if self.dry_run:
-      return skeletons
-
-    if self.sharded:
-      self.upload_batch(vol, path, index_bbox, skeletons)
-    else:
-      self.upload_individuals(vol, path, bbox, skeletons)
-
-    if self.spatial_index:
-      self.upload_spatial_index(vol, path, index_bbox, skeletons)
-
-  def _do_operation(self, all_labels, fn):
-    if self.fill_holes > 0:
-      filled_labels, hole_labels = fastmorph.fill_holes(
-        all_labels,
-        remove_enclosed=True,
-        return_removed=True,
-        fix_borders=(self.fill_holes >= 2),
-        morphological_closing=(self.fill_holes >= 3),
-      )
-
-      if self.fill_holes >= 3:
-        hp = self.hole_filling_padding
-        all_labels = np.asfortranarray(all_labels[hp:-hp,hp:-hp,hp:-hp])
-        filled_labels= np.asfortranarray(filled_labels[hp:-hp,hp:-hp,hp:-hp])
-
-      all_labels = crackle.compress(all_labels)
-      skeletons = fn(filled_labels)
-      del filled_labels
-
-      all_labels = crackle.decompress(all_labels)
-      hole_labels = all_labels * np.isin(all_labels, list(hole_labels))
-      del all_labels
-
-      hole_skeletons = fn(hole_labels)
-      skeletons.update(hole_skeletons)
-      del hole_labels
-      del hole_skeletons
-    else:
-      skeletons = fn(all_labels)
-
-    return skeletons
-
-  def skeletonize(
-    self, 
-    all_labels:np.ndarray, 
-    vol:CloudVolume, 
-    dust_threshold:int, 
-    extra_targets_after:dict, 
-    voxel_graph:np.ndarray,
-  ) -> dict:
-    def do_skeletonize(labels):
-      return kimimaro.skeletonize(
-        labels, self.teasar_params, 
-        object_ids=self.object_ids, 
-        anisotropy=vol.resolution,
-        dust_threshold=dust_threshold, 
-        progress=self.progress, 
-        fix_branching=self.fix_branching,
-        fix_borders=self.fix_borders,
-        fix_avocados=self.fix_avocados,
-        fill_holes=False, # moved this logic into SkeletonTask / fastmorph
-        parallel=self.parallel,
-        extra_targets_after=extra_targets_after.keys(),
-        voxel_graph=voxel_graph,
-      )
-
-    return self._do_operation(all_labels, do_skeletonize)
-
-  def voxel_connectivity_graph(
-    self, 
-    vol:CloudVolume, 
-    bbox:Bbox, 
-    root_labels:np.ndarray,
-  ) -> np.ndarray:
-
-    if vol.meta.path.format != "graphene":
-      vol = CloudVolume(
-        self.cloudpath, mip=self.mip, 
-        info=self.info, cdn_cache=False,
-        parallel=self.parallel, 
-        fill_missing=self.fill_missing,
-      )
-
-    if vol.meta.path.format != "graphene":
-      raise ValueError("Can't extract a voxel connectivity graph from non-graphene volumes.")
-
-    layer_2 = vol.download(
-      bbox, 
-      stop_layer=2,
-      agglomerate=True,
-      timestamp=self.timestamp,
-    )[...,0]
-
-    graph_chunk_size = np.array(vol.meta.graph_chunk_size) / vol.meta.downsample_ratio(vol.mip)
-    graph_chunk_size = graph_chunk_size.astype(int)
-
-    shape = bbox.size()[:3]
-    sgx, sgy, sgz = list(np.ceil(shape / graph_chunk_size).astype(int))
-
-    vcg = cc3d.voxel_connectivity_graph(layer_2, connectivity=26)
-    del layer_2
-
-    # the proper way to do this would be to get the lowest the L3..LN root
-    # as needed, but the lazy way to do this is to get the root labels
-    # which will retain a few errors, but overall the error rate should be
-    # over 100x less. We need to shade in the sides of the connectivity graph
-    # with edges that represent the connections between the adjacent boxes.
-
-    root_vcg = cc3d.voxel_connectivity_graph(root_labels, connectivity=26)
-    clamp_box = Bbox([0,0,0], shape)
-
-    for gx,gy,gz in xyzrange([sgx, sgy, sgz]):
-      bbx = Bbox((gx,gy,gz), (gx+1, gy+1, gz+1))
-      bbx *= graph_chunk_size
-      bbx = Bbox.clamp(bbx, clamp_box)
-
-      slicearr = []
-      for i in range(3):
-        bbx1 = bbx.clone()
-        bbx1.maxpt[i] = bbx1.minpt[i] + 1
-        slicearr.append(bbx1)
-
-        bbx1 = bbx.clone()
-        bbx1.minpt[i] = bbx1.maxpt[i] - 1
-        slicearr.append(bbx1)
-
-      for bbx1 in slicearr:
-        vcg[bbx1.to_slices()] = root_vcg[bbx1.to_slices()] 
-
-    return vcg
-
-  def compute_cross_sectional_area(self, vol, bbox, skeletons):
-    if len(skeletons) == 0:
-      return skeletons
-
-    # Why redownload a bigger image? In order to avoid clipping the
-    # cross sectional areas on the edges.
-    delta = int(self.cross_sectional_area_shape_delta)
-
-    big_bbox = bbox.clone()
-    big_bbox.grow(delta)
-    big_bbox = Bbox.clamp(big_bbox, vol.bounds)
-
-    big_bbox.minpt -= self.hole_filling_padding
-    big_bbox.maxpt += self.hole_filling_padding
-
-    all_labels = vol[big_bbox][...,0]
-
-    delta = bbox.minpt - big_bbox.minpt
-
-    # place the skeletons in exactly the same position
-    # in the enlarged image
-    for skel in skeletons.values():
-      skel.vertices += delta * vol.resolution
-
-    if self.mask_ids:
-      all_labels = fastremap.mask(all_labels, self.mask_ids)
-
-    def do_cross_section(labels):
-      return kimimaro.cross_sectional_area(
-        labels, skeletons,
-        anisotropy=vol.resolution,
-        smoothing_window=self.cross_sectional_area_smoothing_window,
-        progress=self.progress,
-        in_place=True,
-        fill_holes=False,
-      )
-
-    skeletons = self._do_operation(all_labels, do_cross_section)
-    del all_labels
-
-    # move the vertices back to their old smaller image location
-    for skel in skeletons.values():
-      skel.vertices -= delta * vol.resolution
-
-    return self.repair_cross_sectional_area_contacts(vol, bbox, skeletons)
-
-  def repair_cross_sectional_area_contacts(self, vol, bbox, skeletons):
-    from dbscan import DBSCAN
-
-    boundaries = [
-      bbox.minpt.x == vol.bounds.minpt.x,
-      bbox.maxpt.x == vol.bounds.maxpt.x,
-      bbox.minpt.y == vol.bounds.minpt.y,
-      bbox.maxpt.y == vol.bounds.maxpt.y,
-      bbox.minpt.z == vol.bounds.minpt.z,
-      bbox.maxpt.z == vol.bounds.maxpt.z,
-    ]
-
-    if all(boundaries):
-      return skeletons
-
-    invalid_repairs = 0
-    for i, bnd in enumerate(boundaries):
-      invalid_repairs |= (bnd << i)
-
-    invalid_repairs = (~np.uint8(invalid_repairs)) & np.uint8(0b00111111)
-
-    # We want to repair any skeleton that has a contact with the
-    # edge except those that are contacting the volume boundary due to futility
-
-    repair_skels = []
-    for skel in skeletons.values():
-      contacts = skel.cross_sectional_area_contacts & invalid_repairs
-      if np.any(contacts):
-        repair_skels.append(skel)
-
-    delta = int(self.cross_sectional_area_shape_delta)
-
-    shape = bbox.size3()
-    
-    def reprocess_skel(pts, skel):
-      pts_bbx = Bbox.from_points(pts)
-
-      pts_bbx_vol = pts_bbx + bbox.minpt
-      center = pts_bbx_vol.center().astype(int)
-      skel_bbx = Bbox(center, center+1)
-      skel_bbx.grow(delta + shape // 2)
-
-      skel_bbx = Bbox.clamp(skel_bbx, vol.bounds)
-
-      skel_bbx.minpt -= self.hole_filling_padding
-      skel_bbx.maxpt += self.hole_filling_padding
-
-      binary_image = vol.download(
-        skel_bbx, mip=vol.mip, label=skel.id
-      )[...,0]
-
-      diff = bbox.minpt - skel_bbx.minpt
-      skel.vertices += diff * vol.resolution
-
-      # we binarized the label for memory's sake, 
-      # so need to harmonize that with the skeleton ID
-      segid = skel.id
-      skel.id = 1
-
-      if self.fill_holes > 0:
-        binary_image = fastmorph.fill_holes(
-          binary_image,
-          fix_borders=(self.fill_holes >= 2),
-          morphological_closing=(self.fill_holes >= 3),
-        )
-        if self.fill_holes >= 3:
-          hp = self.hole_filling_padding
-          binary_image = np.asfortranarray(binary_image[hp:-hp,hp:-hp,hp:-hp])
-
-      kimimaro.cross_sectional_area(
-        binary_image, skel,
-        anisotropy=vol.resolution,
-        smoothing_window=self.cross_sectional_area_smoothing_window,
-        progress=self.progress,
-        in_place=True,
-        fill_holes=False,
-        repair_contacts=True,
-      )
-      skel.id = segid
-      skel.vertices -= diff * vol.resolution
-
-    for skel in repair_skels:
-      verts = (skel.vertices // vol.resolution).astype(int)
-      reprocess_skel(verts, skel)
-
-      pts = verts[skel.cross_sectional_area_contacts > 0]
-      if len(pts) == 0:
-        continue
-
-      labels, core_samples_mask = DBSCAN(pts, eps=5, min_samples=2)
-      uniq = fastremap.unique(labels)
-      for lbl in uniq:
-        reprocess_skel(pts[labels == lbl], skel)
-
-    return skeletons
-
-  def apply_global_dust_threshold(self, vol, all_labels):
-    path = vol.meta.join(self.cloudpath, vol.key, 'stats', 'voxel_counts.im')
-    cf = CloudFile(path)
-    memcf = CloudFile(path.replace(f"{cf.protocol}://", "mem://"))
-
-    if not cf.exists():
-      raise FileNotFoundError(f"Cannot apply global dust threshold without {path}")
-
-    buf = None
-    if memcf.exists():
-      buf = memcf.get()
-    else:
-      cloudfiles.clear_memory()
-
-    if buf is None:
-      if cf.protocol != "file":
-        buf = cf.get()
-        memcf.put(buf, compress='zstd')
-      else:
-        buf = cf
-
-    mb = IntMap(buf)
-    uniq = fastremap.unique(all_labels)
-
-    valid_objects = []
-    for label in uniq:
-      if label == 0:
-        continue
-      if mb[label] >= self.dust_threshold:
-        valid_objects.append(label)
-
-    return fastremap.mask_except(all_labels, valid_objects)
-
-  def upload_batch(self, vol, path, bbox, skeletons):
-    mbuf = MapBuffer(
-      skeletons, compress="br", 
-      tobytesfn=lambda skel: skel.to_precomputed()
-    )
-
-    cf = CloudFiles(path, progress=vol.progress)
-    cf.put(
-      path="{}.frags".format(bbox.to_filename()),
-      content=mbuf.tobytes(),
-      compress=None,
-      content_type="application/x-mapbuffer",
-      cache_control=False,
-    )
-
-  def upload_individuals(self, vol, path, bbox, skeletons):
-    skeletons = skeletons.values()
-
-    if not self.will_postprocess:
-      vol.skeleton.upload(skeletons)
-      return 
-
-    # Split skeletons at branch points with boundary information
-    all_fragments = []
-    all_boundary_info = []
-    
-    for skel in skeletons:
-      fragments_with_info = split_skeleton_with_boundary_info(skel, bbox)
-      for fragment, boundary_info in fragments_with_info:
-        all_fragments.append(fragment)
-        all_boundary_info.append(boundary_info)
-
-    bbox_scaled = bbox * vol.resolution
-    cf = CloudFiles(path, progress=vol.progress)
-    
-    # Store fragments with their boundary information
-    uploads = []
-    for fragment, boundary_info in zip(all_fragments, all_boundary_info):
-      # Store the fragment
-      fragment_filename = f"{fragment.id}:{bbox_scaled.to_filename()}"
-      uploads.append((fragment_filename, pickle.dumps(fragment)))
-      
-      # Store boundary information separately for merge reconstruction
-      boundary_filename = f"{fragment.id}:{bbox_scaled.to_filename()}.boundary"
-      uploads.append((boundary_filename, pickle.dumps(boundary_info)))
-    
-    cf.puts(uploads, compress='gzip', content_type="application/python-pickle", cache_control=False)
-
-  def upload_spatial_index(self, vol, path, bbox, skeletons):
-    # Create fragment-based spatial index
-    fragment_spatial_index = {}
-    boundary_connections = {}
-    
-    for skel in skeletons.values():
-      fragments_with_info = split_skeleton_with_boundary_info(skel, bbox)
-      
-      for fragment, boundary_info in fragments_with_info:
-        # Index fragment location
-        fragment_bbox = Bbox.from_points(fragment.vertices)
-        fragment_spatial_index[fragment.id] = {
-          'bbox': fragment_bbox.to_list(),
-          'original_segment': boundary_info['original_segment_id'],
-          'chunk_bbox': boundary_info['chunk_bbox']
-        }
-        
-        # Track boundary connections for merge reconstruction
-        if boundary_info['boundary_vertices']:
-          boundary_connections[fragment.id] = {
-            'boundary_vertices': boundary_info['boundary_vertices'],
-            'connections': boundary_info['connections'],
-            'chunk_bbox': boundary_info['chunk_bbox']
-          }
-
-    bbox_scaled = bbox.astype(vol.resolution.dtype) * vol.resolution
-    precision = vol.skeleton.spatial_index.precision
-    cf = CloudFiles(path, progress=vol.progress)
-    
-    # Store fragment spatial index
-    cf.put_json(
-      path=f"{bbox_scaled.to_filename(precision)}.spatial",
-      content=fragment_spatial_index,
-      compress='gzip',
-      cache_control=False,
-    )
-    
-    # Store boundary connection information for merge
-    cf.put_json(
-      path=f"{bbox_scaled.to_filename(precision)}.connections",
-      content=boundary_connections,
-      compress='gzip',
-      cache_control=False,
-    )
-
-class UnshardedSkeletonMergeTask(RegisteredTask):
-  """
-  Stage 2 of skeletonization.
-
-  Merge chunked TEASAR skeletons into a single skeleton.
-
-  If we parallelize using prefixes single digit prefixes ['0','1',..'9'] all meshes will
-  be correctly processed. But if we do ['10','11',..'99'] meshes from [0,9] won't get
-  processed and need to be handle specifically by creating tasks that will process
-  a single mesh ['0:','1:',..'9:']
-  """
-  def __init__(
-      self, cloudpath, prefix, 
-      crop=0, dust_threshold=4000, max_cable_length=None,
-      tick_threshold=6000, delete_fragments=False
-    ):
-    super(UnshardedSkeletonMergeTask, self).__init__(
-      cloudpath, prefix, crop, 
-      dust_threshold, max_cable_length,
-      tick_threshold, delete_fragments
-    )
-    self.max_cable_length = float(max_cable_length) if max_cable_length is not None else None
-
-  def execute(self):
-    self.vol = CloudVolume(self.cloudpath, cdn_cache=False)
-    self.vol.mip = self.vol.skeleton.meta.mip
-
-    fragment_filenames = self.get_filenames()
-    skels = self.get_skeletons_by_segid(fragment_filenames)
-
-    skeletons = []
-    for segid, frags in skels.items():
-      skeleton = self.fuse_skeletons(frags)
-      # if self.max_cable_length is None or skeleton.cable_length() <= self.max_cable_length:
-      #   skeleton = kimimaro.postprocess(
-      #     skeleton, self.dust_threshold, self.tick_threshold
-      #   )
-      skeleton.id = segid
-      skeletons.append(skeleton)
-
-    self.vol.skeleton.upload(skeletons)
-    
-    if self.delete_fragments:
-      cf = CloudFiles(self.cloudpath, progress=True)
-      cf.delete(fragment_filenames)
-
-  def get_filenames(self):
-    prefix = '{}/{}'.format(self.vol.skeleton.path, self.prefix)
-
-    cf = CloudFiles(self.cloudpath, progress=True)
-    return [ _ for _ in cf.list(prefix=prefix) ]
-
-  def get_skeletons_by_segid(self, filenames):
-    cf = CloudFiles(self.cloudpath, progress=False)
-    skels = cf.get(filenames)
-
-    skeletons = defaultdict(list)
-    for skel in skels:
-      try:
-        segid = filename_to_segid(skel['path'])
-      except ValueError:
-        # Typically this is due to preexisting fully
-        # formed skeletons e.g. skeletons_mip_3/1588494
-        continue
-
-      skeletons[segid].append( 
-        (
-          Bbox.from_filename(skel['path']),
-          pickle.loads(skel['content'])
-        )
-      )
-
-    return skeletons
-
-  def fuse_skeletons(self, skels):
-    if len(skels) == 0:
-      return Skeleton()
-
-    bbxs = [ item[0] for item in skels ]
-    skeletons = [ item[1] for item in skels ]
-
-    skeletons = self.crop_skels(bbxs, skeletons)
-    skeletons = [ s for s in skeletons if not s.empty() ]
-
-    if len(skeletons) == 0:
-      return Skeleton()
-
-    return Skeleton.simple_merge(skeletons).consolidate()
-
-  def crop_skels(self, bbxs, skeletons):
-    cropped = [ s.clone() for s in skeletons ]
-
-    if self.crop <= 0:
-      return cropped
-    
-    for i in range(len(skeletons)):
-      bbx = bbxs[i]
-      bbx = bbx.astype(self.vol.resolution.dtype) 
-      bbx.minpt += self.crop * self.vol.resolution
-      bbx.maxpt -= self.crop * self.vol.resolution
-
-      if bbx.volume() <= 0:
-        continue
-
-      cropped[i] = cropped[i].crop(bbx)
-
-    return cropped
-
-class ShardedSkeletonMergeTask(RegisteredTask):
-  def __init__(
-    self, cloudpath, shard_no, 
-    dust_threshold=4000, tick_threshold=6000, frag_path=None, cache=False,
-    spatial_index_db=None, max_cable_length=None
-  ):
-    super(ShardedSkeletonMergeTask, self).__init__(
-      cloudpath, shard_no,  
-      dust_threshold, tick_threshold, frag_path, cache, spatial_index_db,
-      max_cable_length
-    )
-    self.progress = False
-    self.max_cable_length = float(max_cable_length) if max_cable_length is not None else None
-
-  def execute(self):
-    # cache is necessary for local computation, but on GCE download is very fast
-    # so cache isn't necessary.
-    cv = CloudVolume(
-      self.cloudpath, 
-      progress=self.progress,
-      spatial_index_db=self.spatial_index_db,
-      cache=self.cache
-    )
-
-    # This looks messy because we are trying to avoid retaining
-    # unnecessary memory. In the original iteration, this was 
-    # using 50 GB+ memory on minnie65. With changes to this
-    # and the spatial_index, we are getting it down to something reasonable.
-    locations = self.locations_for_labels(
-      labels_for_shard(cv, self.shard_no, self.progress), 
-      cv
-    )
-    filenames = set(itertools.chain(*locations.values()))
-    labels = set(locations.keys())
-    del locations
-    skeletons = self.get_unfused(labels, filenames, cv, self.frag_path)
-    del labels
-    del filenames
-    skeletons = self.process_skeletons(skeletons, in_place=True)
-
-    if len(skeletons) == 0:
-      return
-
-    shard_files = synthesize_shard_files(cv.skeleton.reader.spec, skeletons)
-
-    if len(shard_files) != 1:
-      raise ValueError(
-        "Only one shard file should be generated per task. Expected: {} Got: {} ".format(
-          str(self.shard_no), ", ".join(shard_files.keys())
-      ))
-
-    cf = CloudFiles(cv.skeleton.meta.layerpath, progress=self.progress)
-    cf.puts( 
-      ( (fname, data) for fname, data in shard_files.items() ),
-      compress=False,
-      content_type='application/octet-stream',
-      cache_control='no-cache',      
-    )
-
-  def process_skeletons(self, unfused_skeletons, in_place=False):
-    skeletons = {}
-    if in_place:
-      skeletons = unfused_skeletons
-
-    for label in tqdm(unfused_skeletons.keys(), desc="Postprocessing", disable=(not self.progress)):
-      skels = unfused_skeletons[label]
-      skel = Skeleton.simple_merge(skels)
-      skel.id = label
-      skel.extra_attributes = [ 
-        attr for attr in skel.extra_attributes \
-        if attr['data_type'] == 'float32' 
-      ]
-      skel = skel.consolidate()
-      # if self.max_cable_length is not None and skel.cable_length() > self.max_cable_length:
-      #   skeletons[label] = skel.to_precomputed()
-      # else:
-      #   skeletons[label] = kimimaro.postprocess(
-      #     skel, 
-      #     dust_threshold=self.dust_threshold, # voxels 
-      #     tick_threshold=self.tick_threshold, # nm
-      #   ).to_precomputed()
-      skeletons[label] = skel.to_precomputed()
-
-    return skeletons
-
-  def get_unfused(self, labels, filenames, cv, frag_path):
-    skeldirfn = lambda loc: cv.meta.join(cv.skeleton.meta.skeleton_path, loc)
-    filenames = [ skeldirfn(loc) for loc in filenames ]
-
-    block_size = 50
-
-    if len(filenames) < block_size:
-      blocks = [ filenames ]
-      n_blocks = 1
-    else:
-      n_blocks = max(len(filenames) // block_size, 1)
-      blocks = sip(filenames, block_size)
-
-    frag_prefix = frag_path or cv.cloudpath
-    local_input = False
-    if paths.extract(frag_prefix).protocol == "file":
-       local_input = True
-       frag_prefix = frag_prefix.replace("file://", "", 1)
-
-    all_skels = defaultdict(list)
-    for filenames_block in tqdm(blocks, desc="Filename Block", total=n_blocks, disable=(not self.progress)):
-      if local_input:
-        all_files = {}
-        for filename in filenames_block:
-          all_files[filename] = open(os.path.join(frag_prefix, filename), "rb")
-      else:
-        all_files = { 
-          filename: CloudFile(cv.meta.join(frag_prefix, filename), cache_meta=True)
-          for filename in filenames_block 
-        } 
-      
-      for filename, content in tqdm(all_files.items(), desc="Scanning Fragments", disable=(not self.progress)):
-        fragment = MapBuffer(content, frombytesfn=Skeleton.from_precomputed)
-
-        for label in labels:
-          try:
-            skel = fragment[label]
-            skel.id = label
-            all_skels[label].append(skel)
-          except KeyError:
-            continue
-
-        if hasattr(content, "close"):
-          content.close()
-
-    return all_skels
-
-  def locations_for_labels(self, labels, cv):
-    SPATIAL_EXT = re.compile(r'\.spatial$')
-    index_filenames = cv.skeleton.spatial_index.file_locations_per_label(labels)
-    for label, locations in index_filenames.items():
-      for i, location in enumerate(locations):
-        bbx = Bbox.from_filename(re.sub(SPATIAL_EXT, '', location))
-        bbx /= cv.meta.resolution(cv.skeleton.meta.mip)
-        index_filenames[label][i] = bbx.to_filename() + '.frags'
-    return index_filenames
-
-def labels_for_shard(cv, shard_no, progress):
-  """
-  Try to fetch precalculated labels from `$shardno.labels` (faster) otherwise, 
-  compute which labels are applicable to this shard from the shard index (much slower).
-  """
-  labels = CloudFiles(cv.skeleton.meta.layerpath).get_json(shard_no + '.labels')
-  if labels is not None:
-    return labels
-
-  labels = cv.skeleton.spatial_index.query(cv.bounds * cv.resolution)
-  spec = cv.skeleton.reader.spec
-
-  return [ 
-    lbl for lbl in tqdm(labels, desc="Computing Shard Numbers", disable=(not progress))  \
-    if spec.compute_shard_location(lbl).shard_number == shard_no 
-  ]
-
-@queueable
-def ShardedFromUnshardedSkeletonMergeTask(
-  src:str,
-  dest:str,
-  shard_no:str,
-  cache_control:bool = False,
-  skel_dir:Optional[str] = None,
-  progress:bool = False,
-):
-  cv_src = CloudVolume(src)
-
-  if skel_dir is None and 'skeletons' in cv.info:
-    skel_dir = cv.info['skeletons']
-
-  cv_dest = CloudVolume(dest, skel_dir=skel_dir, progress=progress)
-
-  labels = labels_for_shard(cv_dest, shard_no, progress)
-  skeletons = cv_src.skeleton.get(labels)
-  del labels
-
-  if len(skeletons) == 0:
-    return
-
-  skeletons = strip_integer_attributes(skeletons)
-  skeletons = { skel.id: skel.to_precomputed() for skel in skeletons }
-  shard_files = synthesize_shard_files(cv_dest.skeleton.reader.spec, skeletons)
-
-  if len(shard_files) != 1:
-    raise ValueError(
-      "Only one shard file should be generated per task. Expected: {} Got: {} ".format(
-        str(shard_no), ", ".join(shard_files.keys())
-    ))
-
-  cf = CloudFiles(cv_dest.skeleton.meta.layerpath, progress=progress)
-  cf.puts( 
-    ( (fname, data) for fname, data in shard_files.items() ),
-    compress=False,
-    content_type='application/octet-stream',
-    cache_control='no-cache',      
-  )
-
-@queueable
-def DeleteSkeletonFilesTask(
-  cloudpath:str,
-  prefix:str,
-  skel_dir:Optional[str] = None
-):
-  cv = CloudVolume(cloudpath, skel_dir=skel_dir)
-  cf = CloudFiles(cv.skeleton.meta.layerpath)
-  cf.delete(cf.list(prefix=prefix))
-
-
-@queueable
-def TransferSkeletonFilesTask(
-  src:str,
-  dest:str,
-  prefix:str,
-  skel_dir:Optional[str] = None
-):
-  cv_src = CloudVolume(src)
-  cv_dest = CloudVolume(dest, skel_dir=skel_dir)
-
-  cf_src = CloudFiles(cv_src.skeleton.meta.layerpath)
-  cf_dest = CloudFiles(cv_dest.skeleton.meta.layerpath)
-
-  cf_src.transfer_to(cf_dest, paths=cf_src.list(prefix=prefix))
-
-def split_skeleton_with_boundary_info(skeleton, chunk_bbox):
-  """
-  Split skeleton at branch points while preserving boundary connectivity information.
-  
-  Args:
-    skeleton: CloudVolume Skeleton object
-    chunk_bbox: Bounding box of the current chunk
-    
-  Returns:
-    list: List of (fragment, boundary_info) tuples
-  """
-  if skeleton is None or len(skeleton.vertices) == 0:
-    return []
-    
-  vertices = skeleton.vertices
-  edges = skeleton.edges
-  
-  if len(edges) == 0:
-    boundary_vertices = find_boundary_vertices(vertices, chunk_bbox)
-    boundary_info = {
-      'boundary_vertices': boundary_vertices,
-      'chunk_bbox': chunk_bbox.to_list(),
-      'connections': []
-    }
-    return [(skeleton, boundary_info)]
-  
-  # Build adjacency list
-  adjacency = defaultdict(list)
-  for edge in edges:
-    adjacency[edge[0]].append(edge[1])
-    adjacency[edge[1]].append(edge[0])
-  
-  # Find branch points (degree > 2) and boundary vertices
-  branch_points = []
-  boundary_vertices = find_boundary_vertices(vertices, chunk_bbox)
-  
-  for vertex_idx, neighbors in adjacency.items():
-    if len(neighbors) > 2:
-      branch_points.append(vertex_idx)
-  
-  # If no branch points, return single fragment with boundary info
-  if len(branch_points) == 0:
-    boundary_info = {
-      'boundary_vertices': boundary_vertices,
-      'chunk_bbox': chunk_bbox.to_list(),
-      'connections': []
-    }
-    return [(skeleton, boundary_info)]
-  
-  # Split at branch points and create fragments with boundary tracking
-  fragments_with_info = []
-  visited_edges = set()
-  fragment_id = 0
-  
-  for branch_point in branch_points:
-    neighbors = adjacency[branch_point]
-    
-    for neighbor in neighbors:
-      if (branch_point, neighbor) in visited_edges or (neighbor, branch_point) in visited_edges:
-        continue
-        
-      # Trace path from branch point
-      path_vertices = [branch_point, neighbor]
-      current = neighbor
-      visited_edges.add((branch_point, neighbor))
-      visited_edges.add((neighbor, branch_point))
-      
-      while True:
-        current_neighbors = [n for n in adjacency[current] if n not in path_vertices]
-        if len(current_neighbors) != 1:
-          break
-        next_vertex = current_neighbors[0]
-        path_vertices.append(next_vertex)
-        visited_edges.add((current, next_vertex))
-        visited_edges.add((next_vertex, current))
-        current = next_vertex
-      
-      if len(path_vertices) >= 2:
-        # Create fragment
-        fragment_vertices = vertices[path_vertices]
-        fragment_edges = []
-        for i in range(len(path_vertices) - 1):
-          fragment_edges.append([i, i + 1])
-        
-        fragment = Skeleton(
-          vertices=fragment_vertices,
-          edges=np.array(fragment_edges, dtype=np.uint32) if fragment_edges else np.array([], dtype=np.uint32).reshape(0, 2),
-          radii=skeleton.radii[path_vertices] if skeleton.radii is not None and len(skeleton.radii) > 0 else None,
-          vertex_types=skeleton.vertex_types[path_vertices] if skeleton.vertex_types is not None and len(skeleton.vertex_types) > 0 else None,
-          extra_attributes=[],
-          segid=skeleton.id,
-          space='voxel'
-        )
-        
-        # Create unique fragment ID
-        fragment.id = f"{skeleton.id}_{fragment_id}"
-        fragment_id += 1
-        
-        # Track boundary information for this fragment
-        fragment_boundary_vertices = find_boundary_vertices(fragment_vertices, chunk_bbox)
-        
-        # Track connections to other fragments (for merge reconstruction)
-        connections = []
-        if path_vertices[0] in branch_points:  # Start at branch point
-          connections.append({
-            'vertex_idx': 0,
-            'connects_to': 'branch',
-            'branch_vertex': vertices[path_vertices[0]].tolist()
-          })
-        if path_vertices[-1] in branch_points:  # End at branch point
-          connections.append({
-            'vertex_idx': len(path_vertices) - 1,
-            'connects_to': 'branch',
-            'branch_vertex': vertices[path_vertices[-1]].tolist()
-          })
-        
-        boundary_info = {
-          'boundary_vertices': fragment_boundary_vertices,
-          'chunk_bbox': chunk_bbox.to_list(),
-          'connections': connections,
-          'original_segment_id': skeleton.id,
-          'fragment_id': fragment.id
-        }
-        
-        fragments_with_info.append((fragment, boundary_info))
-  
-  return fragments_with_info if fragments_with_info else [(skeleton, {'boundary_vertices': boundary_vertices, 'chunk_bbox': chunk_bbox.to_list(), 'connections': []})]
-
-def find_boundary_vertices(vertices, chunk_bbox):
-  """Find vertices that are on or near chunk boundaries."""
-  boundary_vertices = []
-  tolerance = 1.0  # 1 voxel tolerance
-  
-  for i, vertex in enumerate(vertices):
-    x, y, z = vertex
-    minx, miny, minz = chunk_bbox.minpt
-    maxx, maxy, maxz = chunk_bbox.maxpt
-    
-    # Check if vertex is within tolerance of any boundary
-    if (abs(x - minx) <= tolerance or abs(x - maxx) <= tolerance or
-        abs(y - miny) <= tolerance or abs(y - maxy) <= tolerance or
-        abs(z - minz) <= tolerance or abs(z - maxz) <= tolerance):
-      boundary_vertices.append({
-        'vertex_idx': i,
-        'vertex_pos': vertex.tolist(),
-        'boundary_faces': []
-      })
-      
-      # Track which faces this vertex is near
-      if abs(x - minx) <= tolerance:
-        boundary_vertices[-1]['boundary_faces'].append('x_min')
-      if abs(x - maxx) <= tolerance:
-        boundary_vertices[-1]['boundary_faces'].append('x_max')
-      if abs(y - miny) <= tolerance:
-        boundary_vertices[-1]['boundary_faces'].append('y_min')
-      if abs(y - maxy) <= tolerance:
-        boundary_vertices[-1]['boundary_faces'].append('y_max')
-      if abs(z - minz) <= tolerance:
-        boundary_vertices[-1]['boundary_faces'].append('z_min')
-      if abs(z - maxz) <= tolerance:
-        boundary_vertices[-1]['boundary_faces'].append('z_max')
-  
-  return boundary_vertices
-
-class FragmentAwareSkeletonMergeTask(RegisteredTask):
-  """
-  Modified merge task that handles pre-split skeleton fragments.
-  Reconstructs skeletons by connecting fragments across chunk boundaries
-  while maintaining branch point splits.
-  """
-  def __init__(
-    self, cloudpath, shard_no, 
-    dust_threshold=4000, tick_threshold=6000, frag_path=None, cache=False,
-    spatial_index_db=None, max_cable_length=None, target_segment_id=None
-  ):
-    super(FragmentAwareSkeletonMergeTask, self).__init__(
-      cloudpath, shard_no,  
-      dust_threshold, tick_threshold, frag_path, cache, spatial_index_db,
-      max_cable_length, target_segment_id
-    )
-    self.progress = False
-    self.max_cable_length = float(max_cable_length) if max_cable_length is not None else None
-    self.target_segment_id = target_segment_id
-
-  def execute(self):
-    cv = CloudVolume(
-      self.cloudpath, 
-      progress=self.progress,
-      spatial_index_db=self.spatial_index_db,
-      cache=self.cache
-    )
-
-    # Get fragments for the target segment
-    fragment_locations = self.get_fragment_locations_for_segment(cv, self.target_segment_id)
-    
-    # Load fragments and boundary information
-    fragments_with_boundaries = self.load_fragments_with_boundaries(cv, fragment_locations)
-    
-    # Process fragments in batches to manage memory
-    connected_components = self.connect_fragments_across_boundaries(fragments_with_boundaries)
-    
-    # Create final skeleton trees (one per connected component)
-    final_skeletons = {}
-    for comp_id, component_fragments in connected_components.items():
-      if len(component_fragments) > 0:
-        # Each connected component becomes a separate skeleton tree
-        merged_skeleton = self.merge_connected_fragments(component_fragments)
-        final_skeletons[f"{self.target_segment_id}_{comp_id}"] = merged_skeleton
-
-    if len(final_skeletons) == 0:
-      return
-
-    # Store results
-    shard_files = synthesize_shard_files(cv.skeleton.reader.spec, final_skeletons)
-    cf = CloudFiles(cv.skeleton.meta.layerpath, progress=self.progress)
-    cf.puts( 
-      ( (fname, data) for fname, data in shard_files.items() ),
-      compress=False,
-      content_type='application/octet-stream',
-      cache_control='no-cache',      
-    )
-
-  def get_fragment_locations_for_segment(self, cv, segment_id):
-    """Find all chunks containing fragments of the target segment."""
-    all_locations = []
-    
-    # Query all spatial index files to find fragment locations
-    # This would need to be implemented based on your specific setup
-    # For now, assuming you have a way to query fragment locations
-    
-    return all_locations
-
-  def load_fragments_with_boundaries(self, cv, fragment_locations):
-    """Load fragments and their boundary information."""
-    fragments_with_boundaries = []
-    
-    for location in fragment_locations:
-      try:
-        # Load fragment
-        fragment_file = CloudFile(cv.meta.join(cv.cloudpath, location))
-        fragment = pickle.loads(fragment_file.get())
-        
-        # Load boundary information
-        boundary_file = CloudFile(cv.meta.join(cv.cloudpath, location + ".boundary"))
-        boundary_info = pickle.loads(boundary_file.get())
-        
-        fragments_with_boundaries.append((fragment, boundary_info))
-      except Exception as e:
-        print(f"Error loading fragment {location}: {e}")
-        continue
-    
-    return fragments_with_boundaries
-
-  def connect_fragments_across_boundaries(self, fragments_with_boundaries):
-    """
-    Group fragments into connected components based on boundary connections.
-    Fragments that connect across chunk boundaries are grouped together.
-    """
-    from collections import defaultdict
-    import networkx as nx
-    
-    # Build connectivity graph
-    G = nx.Graph()
-    fragment_map = {}
-    
-    for i, (fragment, boundary_info) in enumerate(fragments_with_boundaries):
-      fragment_id = fragment.id
-      G.add_node(fragment_id)
-      fragment_map[fragment_id] = (fragment, boundary_info)
-      
-      # Connect fragments that share boundary vertices
-      for other_i, (other_fragment, other_boundary_info) in enumerate(fragments_with_boundaries):
-        if i >= other_i:
-          continue
-          
-        if self.fragments_connect_at_boundary(boundary_info, other_boundary_info):
-          G.add_edge(fragment_id, other_fragment.id)
-    
-    # Find connected components
-    connected_components = {}
-    for comp_id, component in enumerate(nx.connected_components(G)):
-      connected_components[comp_id] = [
-        fragment_map[frag_id] for frag_id in component
-      ]
-    
-    return connected_components
-
-  def fragments_connect_at_boundary(self, boundary_info1, boundary_info2):
-    """Check if two fragments connect at chunk boundaries."""
-    tolerance = 2.0  # voxel tolerance for boundary matching
-    
-    for bv1 in boundary_info1.get('boundary_vertices', []):
-      for bv2 in boundary_info2.get('boundary_vertices', []):
-        pos1 = np.array(bv1['vertex_pos'])
-        pos2 = np.array(bv2['vertex_pos'])
-        
-        if np.linalg.norm(pos1 - pos2) <= tolerance:
-          # Check if they're on adjacent chunk boundaries
-          faces1 = set(bv1['boundary_faces'])
-          faces2 = set(bv2['boundary_faces'])
-          
-          # Adjacent faces (e.g., x_max connects to x_min)
-          adjacent_pairs = [
-            ('x_max', 'x_min'), ('x_min', 'x_max'),
-            ('y_max', 'y_min'), ('y_min', 'y_max'),
-            ('z_max', 'z_min'), ('z_min', 'z_max')
-          ]
-          
-          for face1 in faces1:
-            for face2 in faces2:
-              if (face1, face2) in adjacent_pairs:
-                return True
-    
-    return False
-
-  def merge_connected_fragments(self, component_fragments):
-    """Merge fragments in a connected component into a single skeleton."""
-    fragments = [frag for frag, _ in component_fragments]
-    
-    # Use simple merge for now - could be optimized for better branch handling
-    if len(fragments) == 1:
-      return fragments[0]
-    
-    # Batch merge to control memory usage
-    batch_size = 50
-    while len(fragments) > 1:
-      next_batch = []
-      for i in range(0, len(fragments), batch_size):
-        batch = fragments[i:i + batch_size]
-        if len(batch) == 1:
-          next_batch.append(batch[0])
-        else:
-          merged = Skeleton.simple_merge(batch)
-          next_batch.append(merged)
-      fragments = next_batch
-    
-    return fragments[0]
diff --git a/igneous/tasks/skeleton_ori.py b/igneous/tasks/skeleton_ori.py
deleted file mode 100755
index f3261076..00000000
--- a/igneous/tasks/skeleton_ori.py
+++ /dev/null
@@ -1,914 +0,0 @@
-from typing import Optional, Sequence, Dict, List
-
-from functools import reduce
-import itertools
-import json
-import mmap
-import pickle
-import posixpath
-import os
-import re
-from collections import defaultdict
-
-from tqdm import tqdm
-
-import numpy as np
-
-import mapbuffer
-from mapbuffer import MapBuffer, IntMap
-import cloudfiles
-from cloudfiles import CloudFiles, CloudFile
-
-import cloudvolume
-from cloudvolume import CloudVolume, Skeleton, paths
-from cloudvolume.lib import Vec, Bbox, sip, xyzrange
-from cloudvolume.datasource.precomputed.sharding import synthesize_shard_files
-
-import cc3d
-import crackle
-import fastmorph
-import fastremap
-import kimimaro
-
-from taskqueue import RegisteredTask, queueable
-
-SEGIDRE = re.compile(r'/(\d+):.*?$')
-
-def filename_to_segid(filename):
-  matches = SEGIDRE.search(filename)
-  if matches is None:
-    raise ValueError("There was an issue with the fragment filename: " + filename)
-
-  segid, = matches.groups()
-  return int(segid)
-
-def strip_integer_attributes(skeletons):
-  for skel in skeletons:
-    skel.extra_attributes = [ 
-    attr for attr in skel.extra_attributes 
-    if attr['data_type'] in ('float32', 'float64')
-  ]
-  return skeletons
-
-class SkeletonTask(RegisteredTask):
-  """
-  Stage 1 of skeletonization.
-
-  Convert chunks of segmentation into chunked skeletons and point clouds.
-  They will be merged in the stage 2 task SkeletonMergeTask.
-  """
-  def __init__(
-    self, cloudpath:str, 
-    shape:Sequence[int], offset:Sequence[int], 
-    mip:int, teasar_params:dict, will_postprocess:bool,
-    info:dict = None, 
-    object_ids:Optional[Sequence[int]] = None,
-    mask_ids:Optional[Sequence[int]] = None,
-    fix_branching:bool = True,
-    fix_borders:bool = True,
-    fix_avocados:bool = False,
-    fill_holes:int = 0,
-    dust_threshold:int = 1000, 
-    progress:bool = False,
-    parallel:int = 1,
-    fill_missing:bool = False,
-    sharded:bool = False,
-    frag_path:Optional[str] = None, 
-    spatial_index:bool = True,
-    spatial_grid_shape:Optional[Sequence[int]] = None,
-    synapses:Optional[Sequence[Sequence[float]]] = None, 
-    dust_global:bool = False,
-    cross_sectional_area:bool = False,
-    cross_sectional_area_smoothing_window:int = 1,
-    cross_sectional_area_shape_delta:int = 150,
-    dry_run:bool = False,
-    strip_integer_attributes:bool = True,
-    fix_autapses:bool = False,
-    timestamp:Optional[int] = None,
-    root_ids_cloudpath:Optional[str] = None,
-  ):
-    super().__init__(
-      cloudpath, shape, offset, mip, 
-      teasar_params, will_postprocess, 
-      info, object_ids, mask_ids,
-      fix_branching, fix_borders, 
-      fix_avocados, fill_holes,
-      dust_threshold, progress, parallel,
-      fill_missing, bool(sharded), frag_path, bool(spatial_index),
-      spatial_grid_shape, synapses, bool(dust_global),
-      bool(cross_sectional_area), int(cross_sectional_area_smoothing_window),
-      int(cross_sectional_area_shape_delta),
-      bool(dry_run), bool(strip_integer_attributes),
-      bool(fix_autapses), timestamp,
-      root_ids_cloudpath,
-    )
-    if isinstance(self.frag_path, str):
-      self.frag_path = cloudfiles.paths.normalize(self.frag_path)
-    self.bounds = Bbox(offset, Vec(*shape) + Vec(*offset))
-    self.index_bounds = Bbox(offset, Vec(*spatial_grid_shape) + Vec(*offset))
-
-    # aggressive morphological hole filling has a 1-2vx 
-    # edge effect that needs to be cropped away
-    self.hole_filling_padding = (self.fill_holes >= 3) * 2
-
-  def execute(self):
-    # For graphene volumes, if we've materialized the root IDs
-    # into a static archive, let's use that because it's way more
-    # efficient for fetching root IDs.
-    cloudpath = self.cloudpath
-    if self.root_ids_cloudpath:
-      cloudpath = self.root_ids_cloudpath
-
-    lru_bytes = 0
-    lru_encoding = 'same'
-
-    if self.cross_sectional_area:
-      lru_bytes = self.bounds.size() + 2 * self.cross_sectional_area_shape_delta
-      lru_bytes = lru_bytes[0] * lru_bytes[1] * lru_bytes[2] * 8 // 500
-      lru_encoding = 'crackle'
-
-    vol = CloudVolume(
-      cloudpath,
-      mip=self.mip,
-      bounded=(self.hole_filling_padding == 0),
-      info=self.info,
-      cdn_cache=False,
-      parallel=self.parallel,
-      fill_missing=self.fill_missing,
-      lru_bytes=lru_bytes,
-      lru_encoding=lru_encoding,
-    )
-    bbox = Bbox.clamp(self.bounds, vol.bounds)
-    index_bbox = Bbox.clamp(self.index_bounds, vol.bounds)
-
-    bbox.minpt -= self.hole_filling_padding
-    bbox.maxpt += self.hole_filling_padding
-
-    path = vol.info.get("skeletons", "skeletons")
-    if self.frag_path is None:
-      path = vol.meta.join(self.cloudpath, path)
-    else:
-      # if the path is to a volume root, follow the info instructions,
-      # otherwise place the files exactly where frag path says to
-      test_path = CloudFiles(self.frag_path).join(self.frag_path, "info")
-      test_info = CloudFile(test_path).get_json()
-      if test_info is not None and 'scales' in test_info:
-        path = CloudFiles(self.frag_path).join(self.frag_path, path)
-      else:
-        path = self.frag_path
-
-    all_labels = vol.download(
-      bbox.to_slices(), 
-      agglomerate=True, 
-      timestamp=self.timestamp
-    )
-    all_labels = all_labels[:,:,:,0]
-
-    if self.mask_ids:
-      all_labels = fastremap.mask(all_labels, self.mask_ids)
-
-    extra_targets_after = {}
-    if self.synapses:
-      extra_targets_after = kimimaro.synapses_to_targets(
-        all_labels, self.synapses
-      )
-
-    dust_threshold = self.dust_threshold
-    if self.dust_global and dust_threshold > 0:
-      dust_threshold = 0
-      all_labels = self.apply_global_dust_threshold(vol, all_labels)
-
-    if self.fill_holes and self.fix_autapses:
-      raise ValueError("fill_holes is not currently compatible with fix_autapses")
-
-    voxel_graph = None
-    if self.fix_autapses:
-      voxel_graph = self.voxel_connectivity_graph(vol, bbox, all_labels)
-
-    skeletons = self.skeletonize(
-      all_labels, 
-      vol, 
-      dust_threshold, 
-      extra_targets_after, 
-      voxel_graph,
-    )
-    del all_labels
-
-    if self.cross_sectional_area: # This is expensive!
-      skeletons = self.compute_cross_sectional_area(vol, bbox, skeletons)
-
-    # voxel centered (+0.5) and uses more accurate bounding box from mip 0
-    corrected_offset = (bbox.minpt.astype(np.float32) - vol.meta.voxel_offset(self.mip) + 0.5) * vol.meta.resolution(self.mip)
-    corrected_offset += vol.meta.voxel_offset(0) * vol.meta.resolution(0)
-
-    for segid, skel in skeletons.items():
-      skel.vertices[:] += corrected_offset
-
-    if self.synapses:
-      for segid, skel in skeletons.items():
-        terminal_nodes = skel.vertices[ skel.terminals() ]
-
-        for i, vert in enumerate(terminal_nodes):
-          vert = vert / vol.resolution - self.bounds.minpt
-          vert = tuple(np.round(vert).astype(int))
-          if vert in extra_targets_after.keys():
-            skel.vertex_types[i] = extra_targets_after[vert]
-    
-    # old versions of neuroglancer don't
-    # support int attributes
-    if self.strip_integer_attributes:
-      strip_integer_attributes(skeletons.values())
-
-    if self.dry_run:
-      return skeletons
-
-    if self.sharded:
-      self.upload_batch(vol, path, index_bbox, skeletons)
-    else:
-      self.upload_individuals(vol, path, bbox, skeletons)
-
-    if self.spatial_index:
-      self.upload_spatial_index(vol, path, index_bbox, skeletons)
-
-  def _do_operation(self, all_labels, fn):
-    if self.fill_holes > 0:
-      filled_labels, hole_labels = fastmorph.fill_holes(
-        all_labels,
-        remove_enclosed=True,
-        return_removed=True,
-        fix_borders=(self.fill_holes >= 2),
-        morphological_closing=(self.fill_holes >= 3),
-      )
-
-      if self.fill_holes >= 3:
-        hp = self.hole_filling_padding
-        all_labels = np.asfortranarray(all_labels[hp:-hp,hp:-hp,hp:-hp])
-        filled_labels= np.asfortranarray(filled_labels[hp:-hp,hp:-hp,hp:-hp])
-
-      all_labels = crackle.compress(all_labels)
-      skeletons = fn(filled_labels)
-      del filled_labels
-
-      all_labels = crackle.decompress(all_labels)
-      hole_labels = all_labels * np.isin(all_labels, list(hole_labels))
-      del all_labels
-
-      hole_skeletons = fn(hole_labels)
-      skeletons.update(hole_skeletons)
-      del hole_labels
-      del hole_skeletons
-    else:
-      skeletons = fn(all_labels)
-
-    return skeletons
-
-  def skeletonize(
-    self, 
-    all_labels:np.ndarray, 
-    vol:CloudVolume, 
-    dust_threshold:int, 
-    extra_targets_after:dict, 
-    voxel_graph:np.ndarray,
-  ) -> dict:
-    def do_skeletonize(labels):
-      return kimimaro.skeletonize(
-        labels, self.teasar_params, 
-        object_ids=self.object_ids, 
-        anisotropy=vol.resolution,
-        dust_threshold=dust_threshold, 
-        progress=self.progress, 
-        fix_branching=self.fix_branching,
-        fix_borders=self.fix_borders,
-        fix_avocados=self.fix_avocados,
-        fill_holes=False, # moved this logic into SkeletonTask / fastmorph
-        parallel=self.parallel,
-        extra_targets_after=extra_targets_after.keys(),
-        voxel_graph=voxel_graph,
-      )
-
-    return self._do_operation(all_labels, do_skeletonize)
-
-  def voxel_connectivity_graph(
-    self, 
-    vol:CloudVolume, 
-    bbox:Bbox, 
-    root_labels:np.ndarray,
-  ) -> np.ndarray:
-
-    if vol.meta.path.format != "graphene":
-      vol = CloudVolume(
-        self.cloudpath, mip=self.mip, 
-        info=self.info, cdn_cache=False,
-        parallel=self.parallel, 
-        fill_missing=self.fill_missing,
-      )
-
-    if vol.meta.path.format != "graphene":
-      raise ValueError("Can't extract a voxel connectivity graph from non-graphene volumes.")
-
-    layer_2 = vol.download(
-      bbox, 
-      stop_layer=2,
-      agglomerate=True,
-      timestamp=self.timestamp,
-    )[...,0]
-
-    graph_chunk_size = np.array(vol.meta.graph_chunk_size) / vol.meta.downsample_ratio(vol.mip)
-    graph_chunk_size = graph_chunk_size.astype(int)
-
-    shape = bbox.size()[:3]
-    sgx, sgy, sgz = list(np.ceil(shape / graph_chunk_size).astype(int))
-
-    vcg = cc3d.voxel_connectivity_graph(layer_2, connectivity=26)
-    del layer_2
-
-    # the proper way to do this would be to get the lowest the L3..LN root
-    # as needed, but the lazy way to do this is to get the root labels
-    # which will retain a few errors, but overall the error rate should be
-    # over 100x less. We need to shade in the sides of the connectivity graph
-    # with edges that represent the connections between the adjacent boxes.
-
-    root_vcg = cc3d.voxel_connectivity_graph(root_labels, connectivity=26)
-    clamp_box = Bbox([0,0,0], shape)
-
-    for gx,gy,gz in xyzrange([sgx, sgy, sgz]):
-      bbx = Bbox((gx,gy,gz), (gx+1, gy+1, gz+1))
-      bbx *= graph_chunk_size
-      bbx = Bbox.clamp(bbx, clamp_box)
-
-      slicearr = []
-      for i in range(3):
-        bbx1 = bbx.clone()
-        bbx1.maxpt[i] = bbx1.minpt[i] + 1
-        slicearr.append(bbx1)
-
-        bbx1 = bbx.clone()
-        bbx1.minpt[i] = bbx1.maxpt[i] - 1
-        slicearr.append(bbx1)
-
-      for bbx1 in slicearr:
-        vcg[bbx1.to_slices()] = root_vcg[bbx1.to_slices()] 
-
-    return vcg
-
-  def compute_cross_sectional_area(self, vol, bbox, skeletons):
-    if len(skeletons) == 0:
-      return skeletons
-
-    # Why redownload a bigger image? In order to avoid clipping the
-    # cross sectional areas on the edges.
-    delta = int(self.cross_sectional_area_shape_delta)
-
-    big_bbox = bbox.clone()
-    big_bbox.grow(delta)
-    big_bbox = Bbox.clamp(big_bbox, vol.bounds)
-
-    big_bbox.minpt -= self.hole_filling_padding
-    big_bbox.maxpt += self.hole_filling_padding
-
-    all_labels = vol[big_bbox][...,0]
-
-    delta = bbox.minpt - big_bbox.minpt
-
-    # place the skeletons in exactly the same position
-    # in the enlarged image
-    for skel in skeletons.values():
-      skel.vertices += delta * vol.resolution
-
-    if self.mask_ids:
-      all_labels = fastremap.mask(all_labels, self.mask_ids)
-
-    def do_cross_section(labels):
-      return kimimaro.cross_sectional_area(
-        labels, skeletons,
-        anisotropy=vol.resolution,
-        smoothing_window=self.cross_sectional_area_smoothing_window,
-        progress=self.progress,
-        in_place=True,
-        fill_holes=False,
-      )
-
-    skeletons = self._do_operation(all_labels, do_cross_section)
-    del all_labels
-
-    # move the vertices back to their old smaller image location
-    for skel in skeletons.values():
-      skel.vertices -= delta * vol.resolution
-
-    return self.repair_cross_sectional_area_contacts(vol, bbox, skeletons)
-
-  def repair_cross_sectional_area_contacts(self, vol, bbox, skeletons):
-    from dbscan import DBSCAN
-
-    boundaries = [
-      bbox.minpt.x == vol.bounds.minpt.x,
-      bbox.maxpt.x == vol.bounds.maxpt.x,
-      bbox.minpt.y == vol.bounds.minpt.y,
-      bbox.maxpt.y == vol.bounds.maxpt.y,
-      bbox.minpt.z == vol.bounds.minpt.z,
-      bbox.maxpt.z == vol.bounds.maxpt.z,
-    ]
-
-    if all(boundaries):
-      return skeletons
-
-    invalid_repairs = 0
-    for i, bnd in enumerate(boundaries):
-      invalid_repairs |= (bnd << i)
-
-    invalid_repairs = (~np.uint8(invalid_repairs)) & np.uint8(0b00111111)
-
-    # We want to repair any skeleton that has a contact with the
-    # edge except those that are contacting the volume boundary due to futility
-
-    repair_skels = []
-    for skel in skeletons.values():
-      contacts = skel.cross_sectional_area_contacts & invalid_repairs
-      if np.any(contacts):
-        repair_skels.append(skel)
-
-    delta = int(self.cross_sectional_area_shape_delta)
-
-    shape = bbox.size3()
-    
-    def reprocess_skel(pts, skel):
-      pts_bbx = Bbox.from_points(pts)
-
-      pts_bbx_vol = pts_bbx + bbox.minpt
-      center = pts_bbx_vol.center().astype(int)
-      skel_bbx = Bbox(center, center+1)
-      skel_bbx.grow(delta + shape // 2)
-
-      skel_bbx = Bbox.clamp(skel_bbx, vol.bounds)
-
-      skel_bbx.minpt -= self.hole_filling_padding
-      skel_bbx.maxpt += self.hole_filling_padding
-
-      binary_image = vol.download(
-        skel_bbx, mip=vol.mip, label=skel.id
-      )[...,0]
-
-      diff = bbox.minpt - skel_bbx.minpt
-      skel.vertices += diff * vol.resolution
-
-      # we binarized the label for memory's sake, 
-      # so need to harmonize that with the skeleton ID
-      segid = skel.id
-      skel.id = 1
-
-      if self.fill_holes > 0:
-        binary_image = fastmorph.fill_holes(
-          binary_image,
-          fix_borders=(self.fill_holes >= 2),
-          morphological_closing=(self.fill_holes >= 3),
-        )
-        if self.fill_holes >= 3:
-          hp = self.hole_filling_padding
-          binary_image = np.asfortranarray(binary_image[hp:-hp,hp:-hp,hp:-hp])
-
-      kimimaro.cross_sectional_area(
-        binary_image, skel,
-        anisotropy=vol.resolution,
-        smoothing_window=self.cross_sectional_area_smoothing_window,
-        progress=self.progress,
-        in_place=True,
-        fill_holes=False,
-        repair_contacts=True,
-      )
-      skel.id = segid
-      skel.vertices -= diff * vol.resolution
-
-    for skel in repair_skels:
-      verts = (skel.vertices // vol.resolution).astype(int)
-      reprocess_skel(verts, skel)
-
-      pts = verts[skel.cross_sectional_area_contacts > 0]
-      if len(pts) == 0:
-        continue
-
-      labels, core_samples_mask = DBSCAN(pts, eps=5, min_samples=2)
-      uniq = fastremap.unique(labels)
-      for lbl in uniq:
-        reprocess_skel(pts[labels == lbl], skel)
-
-    return skeletons
-
-  def apply_global_dust_threshold(self, vol, all_labels):
-    path = vol.meta.join(self.cloudpath, vol.key, 'stats', 'voxel_counts.im')
-    cf = CloudFile(path)
-    memcf = CloudFile(path.replace(f"{cf.protocol}://", "mem://"))
-
-    if not cf.exists():
-      raise FileNotFoundError(f"Cannot apply global dust threshold without {path}")
-
-    buf = None
-    if memcf.exists():
-      buf = memcf.get()
-    else:
-      cloudfiles.clear_memory()
-
-    if buf is None:
-      if cf.protocol != "file":
-        buf = cf.get()
-        memcf.put(buf, compress='zstd')
-      else:
-        buf = cf
-
-    mb = IntMap(buf)
-    uniq = fastremap.unique(all_labels)
-
-    valid_objects = []
-    for label in uniq:
-      if label == 0:
-        continue
-      if mb[label] >= self.dust_threshold:
-        valid_objects.append(label)
-
-    return fastremap.mask_except(all_labels, valid_objects)
-
-  def upload_batch(self, vol, path, bbox, skeletons):
-    mbuf = MapBuffer(
-      skeletons, compress="br", 
-      tobytesfn=lambda skel: skel.to_precomputed()
-    )
-
-    cf = CloudFiles(path, progress=vol.progress)
-    cf.put(
-      path="{}.frags".format(bbox.to_filename()),
-      content=mbuf.tobytes(),
-      compress=None,
-      content_type="application/x-mapbuffer",
-      cache_control=False,
-    )
-
-  def upload_individuals(self, vol, path, bbox, skeletons):
-    skeletons = skeletons.values()
-
-    if not self.will_postprocess:
-      vol.skeleton.upload(skeletons)
-      return 
-
-    bbox = bbox * vol.resolution
-    cf = CloudFiles(path, progress=vol.progress)
-    cf.puts(
-      (
-        (
-          f"{skel.id}:{bbox.to_filename()}",
-          pickle.dumps(skel)
-        )
-        for skel in skeletons
-      ),
-      compress='gzip',
-      content_type="application/python-pickle",
-      cache_control=False,
-    )
-
-  def upload_spatial_index(self, vol, path, bbox, skeletons):
-    spatial_index = {}
-    for segid, skel in tqdm(skeletons.items(), disable=(not vol.progress), desc="Extracting Bounding Boxes"):
-      segid_bbx = Bbox.from_points( skel.vertices )
-      spatial_index[segid] = segid_bbx.to_list()
-
-    bbox = bbox.astype(vol.resolution.dtype) * vol.resolution
-    precision = vol.skeleton.spatial_index.precision
-    cf = CloudFiles(path, progress=vol.progress)
-    cf.put_json(
-      path=f"{bbox.to_filename(precision)}.spatial",
-      content=spatial_index,
-      compress='gzip',
-      cache_control=False,
-    )
-
-class UnshardedSkeletonMergeTask(RegisteredTask):
-  """
-  Stage 2 of skeletonization.
-
-  Merge chunked TEASAR skeletons into a single skeleton.
-
-  If we parallelize using prefixes single digit prefixes ['0','1',..'9'] all meshes will
-  be correctly processed. But if we do ['10','11',..'99'] meshes from [0,9] won't get
-  processed and need to be handle specifically by creating tasks that will process
-  a single mesh ['0:','1:',..'9:']
-  """
-  def __init__(
-      self, cloudpath, prefix, 
-      crop=0, dust_threshold=4000, max_cable_length=None,
-      tick_threshold=6000, delete_fragments=False
-    ):
-    super(UnshardedSkeletonMergeTask, self).__init__(
-      cloudpath, prefix, crop, 
-      dust_threshold, max_cable_length,
-      tick_threshold, delete_fragments
-    )
-    self.max_cable_length = float(max_cable_length) if max_cable_length is not None else None
-
-  def execute(self):
-    self.vol = CloudVolume(self.cloudpath, cdn_cache=False)
-    self.vol.mip = self.vol.skeleton.meta.mip
-
-    fragment_filenames = self.get_filenames()
-    skels = self.get_skeletons_by_segid(fragment_filenames)
-
-    skeletons = []
-    for segid, frags in skels.items():
-      skeleton = self.fuse_skeletons(frags)
-      # if self.max_cable_length is None or skeleton.cable_length() <= self.max_cable_length:
-      #   skeleton = kimimaro.postprocess(
-      #     skeleton, self.dust_threshold, self.tick_threshold
-      #   )
-      skeleton.id = segid
-      skeletons.append(skeleton)
-
-    self.vol.skeleton.upload(skeletons)
-    
-    if self.delete_fragments:
-      cf = CloudFiles(self.cloudpath, progress=True)
-      cf.delete(fragment_filenames)
-
-  def get_filenames(self):
-    prefix = '{}/{}'.format(self.vol.skeleton.path, self.prefix)
-
-    cf = CloudFiles(self.cloudpath, progress=True)
-    return [ _ for _ in cf.list(prefix=prefix) ]
-
-  def get_skeletons_by_segid(self, filenames):
-    cf = CloudFiles(self.cloudpath, progress=False)
-    skels = cf.get(filenames)
-
-    skeletons = defaultdict(list)
-    for skel in skels:
-      try:
-        segid = filename_to_segid(skel['path'])
-      except ValueError:
-        # Typically this is due to preexisting fully
-        # formed skeletons e.g. skeletons_mip_3/1588494
-        continue
-
-      skeletons[segid].append( 
-        (
-          Bbox.from_filename(skel['path']),
-          pickle.loads(skel['content'])
-        )
-      )
-
-    return skeletons
-
-  def fuse_skeletons(self, skels):
-    if len(skels) == 0:
-      return Skeleton()
-
-    bbxs = [ item[0] for item in skels ]
-    skeletons = [ item[1] for item in skels ]
-
-    skeletons = self.crop_skels(bbxs, skeletons)
-    skeletons = [ s for s in skeletons if not s.empty() ]
-
-    if len(skeletons) == 0:
-      return Skeleton()
-
-    return Skeleton.simple_merge(skeletons).consolidate()
-
-  def crop_skels(self, bbxs, skeletons):
-    cropped = [ s.clone() for s in skeletons ]
-
-    if self.crop <= 0:
-      return cropped
-    
-    for i in range(len(skeletons)):
-      bbx = bbxs[i]
-      bbx = bbx.astype(self.vol.resolution.dtype) 
-      bbx.minpt += self.crop * self.vol.resolution
-      bbx.maxpt -= self.crop * self.vol.resolution
-
-      if bbx.volume() <= 0:
-        continue
-
-      cropped[i] = cropped[i].crop(bbx)
-
-    return cropped
-
-class ShardedSkeletonMergeTask(RegisteredTask):
-  def __init__(
-    self, cloudpath, shard_no, 
-    dust_threshold=4000, tick_threshold=6000, frag_path=None, cache=False,
-    spatial_index_db=None, max_cable_length=None
-  ):
-    super(ShardedSkeletonMergeTask, self).__init__(
-      cloudpath, shard_no,  
-      dust_threshold, tick_threshold, frag_path, cache, spatial_index_db,
-      max_cable_length
-    )
-    self.progress = False
-    self.max_cable_length = float(max_cable_length) if max_cable_length is not None else None
-
-  def execute(self):
-    # cache is necessary for local computation, but on GCE download is very fast
-    # so cache isn't necessary.
-    cv = CloudVolume(
-      self.cloudpath, 
-      progress=self.progress,
-      spatial_index_db=self.spatial_index_db,
-      cache=self.cache
-    )
-
-    # This looks messy because we are trying to avoid retaining
-    # unnecessary memory. In the original iteration, this was 
-    # using 50 GB+ memory on minnie65. With changes to this
-    # and the spatial_index, we are getting it down to something reasonable.
-    locations = self.locations_for_labels(
-      labels_for_shard(cv, self.shard_no, self.progress), 
-      cv
-    )
-    filenames = set(itertools.chain(*locations.values()))
-    labels = set(locations.keys())
-    del locations
-    skeletons = self.get_unfused(labels, filenames, cv, self.frag_path)
-    del labels
-    del filenames
-    skeletons = self.process_skeletons(skeletons, in_place=True)
-
-    if len(skeletons) == 0:
-      return
-
-    shard_files = synthesize_shard_files(cv.skeleton.reader.spec, skeletons)
-
-    if len(shard_files) != 1:
-      raise ValueError(
-        "Only one shard file should be generated per task. Expected: {} Got: {} ".format(
-          str(self.shard_no), ", ".join(shard_files.keys())
-      ))
-
-    cf = CloudFiles(cv.skeleton.meta.layerpath, progress=self.progress)
-    cf.puts( 
-      ( (fname, data) for fname, data in shard_files.items() ),
-      compress=False,
-      content_type='application/octet-stream',
-      cache_control='no-cache',      
-    )
-
-  def process_skeletons(self, unfused_skeletons, in_place=False):
-    skeletons = {}
-    if in_place:
-      skeletons = unfused_skeletons
-
-    for label in tqdm(unfused_skeletons.keys(), desc="Postprocessing", disable=(not self.progress)):
-      skels = unfused_skeletons[label]
-      skel = Skeleton.simple_merge(skels)
-      skel.id = label
-      skel.extra_attributes = [ 
-        attr for attr in skel.extra_attributes \
-        if attr['data_type'] == 'float32' 
-      ]
-      skel = skel.consolidate()
-      # if self.max_cable_length is not None and skel.cable_length() > self.max_cable_length:
-      #   skeletons[label] = skel.to_precomputed()
-      # else:
-      #   skeletons[label] = kimimaro.postprocess(
-      #     skel, 
-      #     dust_threshold=self.dust_threshold, # voxels 
-      #     tick_threshold=self.tick_threshold, # nm
-      #   ).to_precomputed()
-      skeletons[label] = skel.to_precomputed()
-
-    return skeletons
-
-  def get_unfused(self, labels, filenames, cv, frag_path):
-    skeldirfn = lambda loc: cv.meta.join(cv.skeleton.meta.skeleton_path, loc)
-    filenames = [ skeldirfn(loc) for loc in filenames ]
-
-    block_size = 50
-
-    if len(filenames) < block_size:
-      blocks = [ filenames ]
-      n_blocks = 1
-    else:
-      n_blocks = max(len(filenames) // block_size, 1)
-      blocks = sip(filenames, block_size)
-
-    frag_prefix = frag_path or cv.cloudpath
-    local_input = False
-    if paths.extract(frag_prefix).protocol == "file":
-       local_input = True
-       frag_prefix = frag_prefix.replace("file://", "", 1)
-
-    all_skels = defaultdict(list)
-    for filenames_block in tqdm(blocks, desc="Filename Block", total=n_blocks, disable=(not self.progress)):
-      if local_input:
-        all_files = {}
-        for filename in filenames_block:
-          all_files[filename] = open(os.path.join(frag_prefix, filename), "rb")
-      else:
-        all_files = { 
-          filename: CloudFile(cv.meta.join(frag_prefix, filename), cache_meta=True)
-          for filename in filenames_block 
-        } 
-      
-      for filename, content in tqdm(all_files.items(), desc="Scanning Fragments", disable=(not self.progress)):
-        fragment = MapBuffer(content, frombytesfn=Skeleton.from_precomputed)
-
-        for label in labels:
-          try:
-            skel = fragment[label]
-            skel.id = label
-            all_skels[label].append(skel)
-          except KeyError:
-            continue
-
-        if hasattr(content, "close"):
-          content.close()
-
-    return all_skels
-
-  def locations_for_labels(self, labels, cv):
-    SPATIAL_EXT = re.compile(r'\.spatial$')
-    index_filenames = cv.skeleton.spatial_index.file_locations_per_label(labels)
-    for label, locations in index_filenames.items():
-      for i, location in enumerate(locations):
-        bbx = Bbox.from_filename(re.sub(SPATIAL_EXT, '', location))
-        bbx /= cv.meta.resolution(cv.skeleton.meta.mip)
-        index_filenames[label][i] = bbx.to_filename() + '.frags'
-    return index_filenames
-
-def labels_for_shard(cv, shard_no, progress):
-  """
-  Try to fetch precalculated labels from `$shardno.labels` (faster) otherwise, 
-  compute which labels are applicable to this shard from the shard index (much slower).
-  """
-  labels = CloudFiles(cv.skeleton.meta.layerpath).get_json(shard_no + '.labels')
-  if labels is not None:
-    return labels
-
-  labels = cv.skeleton.spatial_index.query(cv.bounds * cv.resolution)
-  spec = cv.skeleton.reader.spec
-
-  return [ 
-    lbl for lbl in tqdm(labels, desc="Computing Shard Numbers", disable=(not progress))  \
-    if spec.compute_shard_location(lbl).shard_number == shard_no 
-  ]
-
-@queueable
-def ShardedFromUnshardedSkeletonMergeTask(
-  src:str,
-  dest:str,
-  shard_no:str,
-  cache_control:bool = False,
-  skel_dir:Optional[str] = None,
-  progress:bool = False,
-):
-  cv_src = CloudVolume(src)
-
-  if skel_dir is None and 'skeletons' in cv.info:
-    skel_dir = cv.info['skeletons']
-
-  cv_dest = CloudVolume(dest, skel_dir=skel_dir, progress=progress)
-
-  labels = labels_for_shard(cv_dest, shard_no, progress)
-  skeletons = cv_src.skeleton.get(labels)
-  del labels
-
-  if len(skeletons) == 0:
-    return
-
-  skeletons = strip_integer_attributes(skeletons)
-  skeletons = { skel.id: skel.to_precomputed() for skel in skeletons }
-  shard_files = synthesize_shard_files(cv_dest.skeleton.reader.spec, skeletons)
-
-  if len(shard_files) != 1:
-    raise ValueError(
-      "Only one shard file should be generated per task. Expected: {} Got: {} ".format(
-        str(shard_no), ", ".join(shard_files.keys())
-    ))
-
-  cf = CloudFiles(cv_dest.skeleton.meta.layerpath, progress=progress)
-  cf.puts( 
-    ( (fname, data) for fname, data in shard_files.items() ),
-    compress=False,
-    content_type='application/octet-stream',
-    cache_control='no-cache',      
-  )
-
-@queueable
-def DeleteSkeletonFilesTask(
-  cloudpath:str,
-  prefix:str,
-  skel_dir:Optional[str] = None
-):
-  cv = CloudVolume(cloudpath, skel_dir=skel_dir)
-  cf = CloudFiles(cv.skeleton.meta.layerpath)
-  cf.delete(cf.list(prefix=prefix))
-
-
-@queueable
-def TransferSkeletonFilesTask(
-  src:str,
-  dest:str,
-  prefix:str,
-  skel_dir:Optional[str] = None
-):
-  cv_src = CloudVolume(src)
-  cv_dest = CloudVolume(dest, skel_dir=skel_dir)
-
-  cf_src = CloudFiles(cv_src.skeleton.meta.layerpath)
-  cf_dest = CloudFiles(cv_dest.skeleton.meta.layerpath)
-
-  cf_src.transfer_to(cf_dest, paths=cf_src.list(prefix=prefix))

From 7844c310b9a94640cf41f7d3c544bebee838fd8f Mon Sep 17 00:00:00 2001
From: Wan-Qing Yu <wanqing.yu@alleninstitute.org>
Date: Wed, 8 Oct 2025 19:34:03 -0700
Subject: [PATCH 6/6] hide debug messages

---
 igneous/tasks/skeleton.py | 16 ++++++++--------
 1 file changed, 8 insertions(+), 8 deletions(-)

diff --git a/igneous/tasks/skeleton.py b/igneous/tasks/skeleton.py
index 434b644e..4036489c 100755
--- a/igneous/tasks/skeleton.py
+++ b/igneous/tasks/skeleton.py
@@ -905,8 +905,8 @@ def skeleton_touches_interior_surface(self, skeleton, resolution, vol, tolerance
     # Get which faces are interior (connect to other chunks)
     interior_faces = self.get_interior_faces(vol)
     
-    print(f"DEBUG SURFACE: Interior faces: {interior_faces}")
-    print(f"DEBUG SURFACE: [min_x, max_x, min_y, max_y, min_z, max_z]")
+    # print(f"DEBUG SURFACE: Interior faces: {interior_faces}")
+    # print(f"DEBUG SURFACE: [min_x, max_x, min_y, max_y, min_z, max_z]")
     
     # Check each dimension, but only interior faces
     for dim in range(3):
@@ -917,28 +917,28 @@ def skeleton_touches_interior_surface(self, skeleton, resolution, vol, tolerance
         if interior_faces[min_face_idx]:  # min face is interior
             near_min = np.any(vertices_voxels[:, dim] <= tolerance_voxels)
             if near_min:
-                print(f"DEBUG SURFACE: INTERIOR SURFACE TOUCH detected at min face of dimension {dim}")
+                # print(f"DEBUG SURFACE: INTERIOR SURFACE TOUCH detected at min face of dimension {dim}")
                 return True
                 
         if interior_faces[max_face_idx]:  # max face is interior  
             near_max = np.any(vertices_voxels[:, dim] >= chunk_shape[dim] - tolerance_voxels)
             if near_max:
-                print(f"DEBUG SURFACE: INTERIOR SURFACE TOUCH detected at max face of dimension {dim}")
+                # print(f"DEBUG SURFACE: INTERIOR SURFACE TOUCH detected at max face of dimension {dim}")
                 return True
     
-    print(f"DEBUG SURFACE: NO INTERIOR SURFACE TOUCH detected")
+    # print(f"DEBUG SURFACE: NO INTERIOR SURFACE TOUCH detected")
     return False
     
   def generate_base_id_for_chunk(self):
     """Generate starting ID for interior skeletons using global chunk indexing."""
-    print(f"DEBUG: chunk_index={self.chunk_index}, coords={self.chunk_coords}")
+    # print(f"DEBUG: chunk_index={self.chunk_index}, coords={self.chunk_coords}")
     
     if self.chunk_index is not None:
         base_id = (self.chunk_index + 1) * 1000000 + 1000
-        print(f"DEBUG: Generated base_id={base_id}")
+        # print(f"DEBUG: Generated base_id={base_id}")
         return int(base_id)
     
-    print("DEBUG: No chunk_index, using fallback")
+    # print("DEBUG: No chunk_index, using fallback")
     return 1000000
   
   def extract_subskeleton(self, skeleton, vertex_indices):