feat: sharded meshes (single res using trivial multi-res) #112

Merged: 37 commits merged into master from wms_mesh_shards on Dec 14, 2021.

Commits (37 total, all by william-silversmith):
- `9a9a505` wip: adding a shard generation routine for meshes (Nov 13, 2021)
- `47bc636` fix: iterator returned must have len (Nov 13, 2021)
- `8b53124` fix: import errors (Nov 13, 2021)
- `f85faff` feat(cli): add --shared to mesh forging (Nov 13, 2021)
- `5a57b7f` feat: add --spatial-index-db to sharded generation cli commands (Nov 13, 2021)
- `648c54d` chore: bump cloud-volume to 6.0.0 (Nov 13, 2021)
- `a9f6521` wip: write shard files with manifests and data offsets (Nov 16, 2021)
- `9b10f8e` feat(cli): adds view command to open an on-disk dataset in neuroglancer (Nov 17, 2021)
- `5700a8b` fix: mesh is already in the right binary encoding (Nov 17, 2021)
- `83ff269` feat: normalize cli paths so file:// is assumed (Nov 17, 2021)
- `3bcb909` fix: imports and missing definitions (Nov 17, 2021)
- `339c331` fix: missing imports and arguments (Nov 17, 2021)
- `c265c35` feat: allow alternative neuroglancer servers (Nov 17, 2021)
- `7399e31` fix: wrong data offset and meshes are not gzip encoded (fix spec) (Nov 17, 2021)
- `e1262ce` fix: removed data_encoding from cli (Nov 17, 2021)
- `d01e393` perf: avoid serializing the manifest binary multiple times (Nov 17, 2021)
- `927549f` fix: make sure file handles are cleaned up (Nov 17, 2021)
- `1f9e2f0` refactor: remove pickle logic from sharded meshes (Nov 17, 2021)
- `bf60910` docs: change comment to reflect meshes vs skeletons (Nov 17, 2021)
- `bfcd229` feat: automatically calculate sharding parameters for meshes (Nov 17, 2021)
- `d418d5a` fix: logic to handle small volumes of data in a shard (Nov 18, 2021)
- `2492d78` test: make sure sharding calculation is reasonable (Nov 18, 2021)
- `b0fb4c5` feat: check capacity utilization and halve shards below 55% (Nov 18, 2021)
- `79011d1` refactor: move the computation to tc.common (Nov 18, 2021)
- `1206efe` feat: make skeleton sharding as easy as mesh sharding too (Nov 18, 2021)
- `2c2bb2f` fix: remove trimesh import (Nov 18, 2021)
- `a8c8be9` chore: add constraint on cloud-files >= 4.4.0 (Nov 18, 2021)
- `bccb10e` feat(cli): add option to create spatial index db (Nov 19, 2021)
- `b335f07` fix: missed a spot for normalizing paths in mesh merge (Nov 19, 2021)
- `b3c160f` docs: describing the hash rate on an M1 (Nov 20, 2021)
- `01d1f2f` fix: use more appropriate quantization range and origin (Dec 4, 2021)
- `51d69af` chore: latest cloud-volume has enhanced multi-res processing (Dec 4, 2021)
- `54f7526` reqs: bump draco and cloud-volume (Dec 14, 2021)
- `947e60f` docs: describe sharded meshing (Dec 14, 2021)
- `666e460` Merge branch 'master' into wms_mesh_shards (Dec 14, 2021)
- `c850d85` docs: note that integer type is required (Dec 14, 2021)
- `eb422c7` refactor: use new draco interface (Dec 14, 2021)
23 changes: 20 additions & 3 deletions README.md
@@ -395,21 +395,38 @@ tasks = create_deletion_tasks(

Meshing is a two stage process. First, the dataset is divided up into a regular grid of tasks that will be meshed independently of
each other using the `MeshTask`. The resulting mesh fragments are uploaded to the destination layer's meshing directory
(named something like `mesh_mip_3_err_40`).

There are two ways to conduct meshing. The standard "unsharded" way can generate a lot of mesh fragment files. It scales to about 100M labels before it starts incurring unreasonable costs on cloud systems. To handle larger volumes, there is the somewhat more difficult to use sharded meshing process, which condenses the number of files by orders of magnitude.

#### Unsharded Meshing

Without additional processing, Neuroglancer has no way of
knowing the names of these chunks (which will be named something like `$SEGID:0:$BOUNDING_BOX` e.g. `1052:0:0-512_0-512_0-512`).
The `$BOUNDING_BOX` part of the name is arbitrary and is the convention used by igneous because it is convenient for debugging.

The manually actuated second stage runs the `MeshManifestTask`, which generates files named `$SEGID:0` containing a short JSON snippet like `{ "fragments": [ "1052:0:0-512_0-512_0-512" ] }`. This file tells Neuroglancer and CloudVolume which mesh files to download when accessing a given segment ID.

#### Sharded Meshing

Sharded meshes are not only condensed, but also draco encoded with an integer position attribute. The dataset must first be meshed, and then a set of meshes gathered into the memory of a single machine, which synthesizes the shard file. This requires more time and memory than unsharded meshing, but simplifies management of the resulting dataset by creating far fewer files. The shard files have names like `a31.shard`. A sharded dataset is indicated by the info file in the mesh directory containing `{ "@type": "neuroglancer_multilod_draco" }`. In the future, multiscale meshes will be supported, but for now only a single resolution is generated.
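
As a quick check from Python (a minimal sketch; the dataset path is hypothetical):

```python
from cloudvolume import CloudVolume

cv = CloudVolume("gs://bucket/dataset")  # hypothetical path

info = cv.mesh.meta.info
print(info.get("@type"))   # "neuroglancer_multilod_draco" for multires meshes
print("sharding" in info)  # True once a sharding spec has been committed
```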

#### CLI Meshing

The CLI supports only standard Precomputed; Graphene is not currently supported. There are many more options: check out `igneous mesh --help`, `igneous mesh forge --help`, and `igneous mesh merge --help`.

```bash
# Standard Unsharded Meshing
igneous mesh forge $PATH --mip 2 --queue $QUEUE
igneous execute $QUEUE
igneous mesh merge $PATH --magnitude 2 --queue $QUEUE
igneous execute $QUEUE

# Sharded Meshing
igneous mesh forge $PATH --mip 2 --queue $QUEUE --sharded
igneous execute $QUEUE
igneous mesh merge-sharded $PATH --queue $QUEUE
igneous execute $QUEUE
```

#### Scripting Meshing
@@ -440,7 +457,7 @@ an additional 10^magnitude. A high magnitude (3-5+) is appropriate for horizonta

In the future, a third stage might be introduced that fuses all the small fragments into a single file.

Of note: meshing is a memory intensive operation. The underlying zmesh library has an optimization for meshing volumes smaller than 1024 voxels in the X and Y dimensions, which can be worth taking advantage of. Meshing time scales with the number of labels contained in the volume.
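
One way to exploit that optimization when scripting (a sketch; the dataset path is hypothetical):

```python
import igneous.task_creation as tc

# task shapes at or below 1024 voxels in X and Y stay inside
# zmesh's optimized code path
tasks = tc.create_meshing_tasks(
  "gs://bucket/dataset", mip=2, shape=(512, 512, 512)
)
```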

### Skeletonization (SkeletonTask, SkeletonMergeTask)

64 changes: 64 additions & 0 deletions igneous/task_creation/common.py
@@ -136,3 +136,67 @@ def graphene_prefixes(
prefixes.add(num)

return prefixes

def compute_shard_params_for_hashed(
num_labels, shard_index_bytes=2**13, minishard_index_bytes=2**15
):
"""
Computes the shard parameters for objects that
have been randomly hashed (e.g. murmurhash) so
that the keys are evenly distributed. This is
applicable to skeletons and meshes.

The equations come from the following assumptions.
a. The keys are approximately uniformly randomly distributed.
b. Preshift bits aren't useful for random keys so are zero.
c. Our goal is to keep the shard index and the minishard
indices reasonably sized. The default values are set
for a 100 Mbps connection.
d. The equations below come from finding a solution to
these equations given the constraints provided.

num_shards * num_minishards_per_shard
= 2^(shard_bits) * 2^(minishard_bits)
= num_labels_in_dataset / labels_per_minishard

# from the definition of the minishard index:
# 3 uint64s (24 bytes) per label
labels_per_minishard = minishard_index_bytes / 3 / 8

# from the definition of the shard index:
# 2 uint64s (16 bytes) per minishard
minishard_bits = ceil(log2(shard_index_bytes / 2 / 8))

Returns: (shard_bits, minishard_bits, preshift_bits)
"""
if num_labels <= 0:
return (0,0,0)

num_minishards_per_shard = shard_index_bytes / 2 / 8
labels_per_minishard = minishard_index_bytes / 3 / 8
labels_per_shard = num_minishards_per_shard * labels_per_minishard

if num_labels >= labels_per_shard:
minishard_bits = np.ceil(np.log2(num_minishards_per_shard))
shard_bits = np.ceil(np.log2(
num_labels / (labels_per_minishard * (2 ** minishard_bits))
))
elif num_labels >= labels_per_minishard:
minishard_bits = np.ceil(np.log2(
num_labels / labels_per_minishard
))
shard_bits = 0
else:
minishard_bits = 0
shard_bits = 0

capacity = labels_per_shard * (2 ** shard_bits)
utilized_capacity = num_labels / capacity

# Pack shards closer to capacity: at 55% utilization or less,
# drop one shard bit, which lets shards run about 10% over
# the target index sizes.
if utilized_capacity <= 0.55:
shard_bits -= 1

minishard_bits = max(minishard_bits, 0)
shard_bits = max(shard_bits, 0)

return (int(shard_bits), int(minishard_bits), 0)
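
As a sanity check of the equations above (a usage sketch, not part of the diff; the expected output follows from the default index budgets):

```python
from igneous.task_creation.common import compute_shard_params_for_hashed

# defaults: shard_index_bytes=2**13 -> 512 minishards per shard,
# minishard_index_bytes=2**15 -> ~1365 labels per minishard,
# so one shard holds ~700k labels
params = compute_shard_params_for_hashed(num_labels=10_000_000)
print(params)  # (4, 9, 0): 16 shards x 512 minishards, ~89% utilization
```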
145 changes: 131 additions & 14 deletions igneous/task_creation/mesh.py
@@ -1,4 +1,5 @@
import copy
from collections import defaultdict
from functools import reduce, partial
from typing import (
Any, Dict, Optional,
@@ -9,20 +10,24 @@
from time import strftime

import numpy as np
from tqdm import tqdm

import cloudvolume
import cloudvolume.exceptions
from cloudvolume import CloudVolume
from cloudvolume.lib import Vec, Bbox, max2, min2, xyzrange, find_closest_divisor, yellow, jsonify
from cloudvolume.datasource.precomputed.sharding import ShardingSpecification
from cloudfiles import CloudFiles

from igneous.tasks import (
MeshTask, MeshManifestTask, GrapheneMeshTask,
MeshSpatialIndex, MultiResShardedMeshMergeTask,
MultiResUnshardedMeshMergeTask
)
from .common import (
operator_contact, FinelyDividedTaskIterator,
get_bounds, num_tasks, graphene_prefixes,
compute_shard_params_for_hashed
)

__all__ = [
@@ -32,6 +37,7 @@
"create_graphene_hybrid_mesh_manifest_tasks",
"create_spatial_index_mesh_tasks",
"create_unsharded_multires_mesh_tasks",
"create_sharded_multires_mesh_tasks",
]

# split the work up into ~1000 tasks (magnitude 3)
@@ -297,23 +303,20 @@ def on_finish(self):

return SpatialIndexMeshTaskIterator(vol.bounds, shape)

def configure_multires_info(
cloudpath:str,
vertex_quantization_bits:int,
mesh_dir:str
):
"""
Computes properties and uploads a multires
mesh info file
"""
assert vertex_quantization_bits in (10, 16)

vol = CloudVolume(cloudpath)

mesh_dir = mesh_dir or vol.info.get("mesh", None)

if not "mesh" in vol.info:
vol.info['mesh'] = mesh_dir
@@ -340,6 +343,26 @@ def create_unsharded_multires_mesh_tasks(
cache_control="no-cache"
)

def create_unsharded_multires_mesh_tasks(
cloudpath:str, num_lod:int = 1,
magnitude:int = 3, mesh_dir:str = None,
vertex_quantization_bits:int = 16
) -> Iterator:
"""
vertex_quantization_bits: 10 or 16. Adjusts the precision
of mesh vertices.
"""
# split the work up into ~1000 tasks (magnitude 3)
assert int(magnitude) == magnitude

configure_multires_info(
cloudpath,
vertex_quantization_bits,
mesh_dir
)

vol = CloudVolume(cloudpath) # mip is no longer a parameter; the mesh info determines resolution

start = 10 ** (magnitude - 1)
end = 10 ** magnitude

@@ -365,3 +388,97 @@ def __iter__(self):
)

return UnshardedMultiResTaskIterator()

def create_sharded_multires_mesh_tasks(
cloudpath:str,
shard_index_bytes=2**13,
minishard_index_bytes=2**15,
num_lod:int = 1,
draco_compression_level:int = 1,
vertex_quantization_bits:int = 16,
minishard_index_encoding="gzip",
mesh_dir:Optional[str] = None,
spatial_index_db:Optional[str] = None
) -> Iterator[MultiResShardedMeshMergeTask]:

configure_multires_info(
cloudpath,
vertex_quantization_bits,
mesh_dir
)

# rebuild b/c sharding changes the mesh source class
cv = CloudVolume(cloudpath, progress=True, spatial_index_db=spatial_index_db)
cv.mip = cv.mesh.meta.mip

# 17 sec to download for pinky100
all_labels = cv.mesh.spatial_index.query(cv.bounds * cv.resolution)

(shard_bits, minishard_bits, preshift_bits) = \
compute_shard_params_for_hashed(
num_labels=len(all_labels),
shard_index_bytes=int(shard_index_bytes),
minishard_index_bytes=int(minishard_index_bytes),
)

spec = ShardingSpecification(
type='neuroglancer_uint64_sharded_v1',
preshift_bits=preshift_bits,
hash='murmurhash3_x86_128',
minishard_bits=minishard_bits,
shard_bits=shard_bits,
minishard_index_encoding=minishard_index_encoding,
data_encoding="raw", # draco encoded meshes
)

cv.mesh.meta.info['sharding'] = spec.to_dict()
cv.mesh.meta.commit_info()

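# rebuild cv so the mesh reader picks up the just-committed sharding spec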
cv = CloudVolume(cloudpath)

# perf: ~66.5k hashes/sec on M1 ARM64
shardfn = lambda lbl: cv.mesh.reader.spec.compute_shard_location(lbl).shard_number

shard_labels = defaultdict(list)
for label in tqdm(all_labels, desc="Hashes"):
shard_labels[shardfn(label)].append(label)
del all_labels

cf = CloudFiles(cv.mesh.meta.layerpath, progress=True) # mesh, not skeleton: the labels files belong in the mesh directory
files = (
(str(shardno) + '.labels', labels)
for shardno, labels in shard_labels.items()
)
cf.put_jsons(
files, compress="gzip",
cache_control="no-cache", total=len(shard_labels)
)

cv.provenance.processing.append({
'method': {
'task': 'MultiResShardedMeshMergeTask',
'cloudpath': cloudpath,
'mip': cv.mesh.meta.mip,
'num_lod': num_lod,
'vertex_quantization_bits': vertex_quantization_bits,
'preshift_bits': preshift_bits,
'minishard_bits': minishard_bits,
'shard_bits': shard_bits,
'mesh_dir': mesh_dir,
'draco_compression_level': draco_compression_level,
},
'by': operator_contact(),
'date': strftime('%Y-%m-%d %H:%M %Z'),
})
cv.commit_provenance()

return [
partial(MultiResShardedMeshMergeTask,
cloudpath, shard_no,
num_lod=num_lod,
mesh_dir=mesh_dir,
spatial_index_db=spatial_index_db,
draco_compression_level=draco_compression_level,
)
for shard_no in shard_labels.keys()
]
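
For context, a driver for the returned tasks might look like this (a sketch: the `LocalTaskQueue` usage and dataset path are assumptions, not part of this PR):

```python
from taskqueue import LocalTaskQueue
import igneous.task_creation as tc

tasks = tc.create_sharded_multires_mesh_tasks(
  "gs://bucket/dataset",  # hypothetical path
  vertex_quantization_bits=16,
)

tq = LocalTaskQueue(parallel=8)
tq.insert(tasks)  # tasks is a list, so the queue knows its length
tq.execute()
```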
31 changes: 21 additions & 10 deletions igneous/task_creation/skeleton.py
@@ -19,7 +19,7 @@

from .common import (
operator_contact, FinelyDividedTaskIterator,
get_bounds, num_tasks, compute_shard_params_for_hashed
)

__all__ = [
@@ -267,10 +267,24 @@ def __iter__(self):

def create_sharded_skeleton_merge_tasks(
layer_path, dust_threshold, tick_threshold,
shard_index_bytes=2**13,
minishard_index_bytes=2**15,
minishard_index_encoding='gzip', data_encoding='gzip',
max_cable_length=None, spatial_index_db=None
):
cv = CloudVolume(layer_path, progress=True, spatial_index_db=spatial_index_db)
cv.mip = cv.skeleton.meta.mip

# 17 sec to download for pinky100
all_labels = cv.skeleton.spatial_index.query(cv.bounds * cv.resolution)

(shard_bits, minishard_bits, preshift_bits) = \
compute_shard_params_for_hashed(
num_labels=len(all_labels),
shard_index_bytes=int(shard_index_bytes),
minishard_index_bytes=int(minishard_index_bytes),
)

spec = ShardingSpecification(
type='neuroglancer_uint64_sharded_v1',
preshift_bits=preshift_bits,
Expand All @@ -280,16 +294,13 @@ def create_sharded_skeleton_merge_tasks(
minishard_index_encoding=minishard_index_encoding,
data_encoding=data_encoding,
)

cv.skeleton.meta.info['sharding'] = spec.to_dict()
cv.skeleton.meta.commit_info()

# rebuild b/c sharding changes the skeleton source
cv = CloudVolume(layer_path, progress=True, spatial_index_db=spatial_index_db)
cv.mip = cv.skeleton.meta.mip

# perf: ~36k hashes/sec
shardfn = lambda lbl: cv.skeleton.reader.spec.compute_shard_location(lbl).shard_number

@@ -324,14 +335,14 @@
})
cv.commit_provenance()

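# return a materialized list, not a generator: the task queue needs len()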
return [
ShardedSkeletonMergeTask(
layer_path, shard_no,
dust_threshold, tick_threshold,
max_cable_length=max_cable_length
)
for shard_no in shard_labels.keys()
]

# split the work up into ~1000 tasks (magnitude 3)
def create_unsharded_skeleton_merge_tasks(
1 change: 1 addition & 0 deletions igneous/tasks/__init__.py
@@ -6,6 +6,7 @@
MeshTask, MeshManifestTask,
GrapheneMeshTask, MeshSpatialIndex,
MultiResUnshardedMeshMergeTask,
MultiResShardedMeshMergeTask,
)
from .image import (
HyperSquareConsensusTask, #HyperSquareTask,