diff --git a/src/sample/bitonicSort/atomicToZero.wgsl b/src/sample/bitonicSort/atomicToZero.wgsl
new file mode 100644
index 00000000..23e7e4ee
--- /dev/null
+++ b/src/sample/bitonicSort/atomicToZero.wgsl
@@ -0,0 +1,7 @@
+@group(0) @binding(3) var<storage, read_write> counter: atomic<u32>;
+
+@compute @workgroup_size(1, 1, 1)
+fn atomicToZero() {
+  // Reset the counter with one atomic write rather than a separate load + subtract.
+  atomicStore(&counter, 0u);
+}
\ No newline at end of file
diff --git a/src/sample/bitonicSort/bitonicDisplay.frag.wgsl b/src/sample/bitonicSort/bitonicDisplay.frag.wgsl
index 3f4a17ea..17842eab 100644
--- a/src/sample/bitonicSort/bitonicDisplay.frag.wgsl
+++ b/src/sample/bitonicSort/bitonicDisplay.frag.wgsl
@@ -1,6 +1,13 @@
-struct Uniforms {
+struct ComputeUniforms { // layout of the uniform bound at group(0) binding(2)
   width: f32,
   height: f32,
+  algo: u32, // NOTE(review): presumably the step selector the compute shader switches on; field order must match the buffer written by the host — confirm
+  blockHeight: u32, // block size used by frag_main to split each block into two halves for highlighting
+}
+
+struct FragmentUniforms {
+  // boolean, either 0 or 1
+  highlight: u32,
 }
 
 struct VertexOutput {
@@ -8,8 +15,11 @@ struct VertexOutput {
   @location(0) fragUV: vec2<f32>
 }
 
-@group(0) @binding(0) var<uniform> uniforms: Uniforms;
-@group(1) @binding(0) var<storage, read> data: array<u32>;
+// Uniforms from compute shader
+@group(0) @binding(0) var<storage, read> data: array<u32>;
+@group(0) @binding(2) var<uniform> uniforms: ComputeUniforms;
+// Fragment shader uniforms
+@group(1) @binding(0) var<uniform> fragment_uniforms: FragmentUniforms;
 
 @fragment
 fn frag_main(input: VertexOutput) -> @location(0) vec4<f32> {
@@ -28,6 +38,16 @@ fn frag_main(input: VertexOutput) -> @location(0) vec4<f32> {
 
   var subtracter = f32(colorChanger) / (uniforms.width * uniforms.height);
 
+  if (fragment_uniforms.highlight == 1) {
+    return select(
+      // select() returns this when the condition is false: index in the second half of its block, highlight green
+      vec4<f32>(vec3<f32>(0.0, 1.0 - subtracter, 0.0).rgb, 1.0),
+      // select() returns this when the condition is true: index in the first half of its block, highlight red
+      vec4<f32>(vec3<f32>(1.0 - subtracter, 0.0, 0.0).rgb, 1.0),
+      elementIndex % uniforms.blockHeight < uniforms.blockHeight / 2
+    );
+  }
+
   var color: vec3<f32> = vec3f(
     1.0 - subtracter
   );
diff --git a/src/sample/bitonicSort/bitonicDisplay.ts b/src/sample/bitonicSort/bitonicDisplay.ts
index 210ef232..b86f2905 100644
--- a/src/sample/bitonicSort/bitonicDisplay.ts
+++ b/src/sample/bitonicSort/bitonicDisplay.ts
@@ -1,14 +1,13 @@
 import {
-  BindGroupsObjectsAndLayout,
-  createBindGroupDescriptor,
+  BindGroupCluster,
   Base2DRendererClass,
+  createBindGroupCluster,
 } from './utils';
 
 import bitonicDisplay from './bitonicDisplay.frag.wgsl';
 
 interface BitonicDisplayRenderArgs {
-  width: number;
-  height: number;
+  highlight: number;
 }
 
 export default class BitonicDisplayRenderer extends Base2DRendererClass {
@@ -19,14 +18,13 @@ export default class BitonicDisplayRenderer extends Base2DRendererClass {
 
   switchBindGroup: (name: string) => void;
   setArguments: (args: BitonicDisplayRenderArgs) => void;
-  computeBGDescript: BindGroupsObjectsAndLayout;
+  computeBGDescript: BindGroupCluster;
 
   constructor(
     device: GPUDevice,
     presentationFormat: GPUTextureFormat,
     renderPassDescriptor: GPURenderPassDescriptor,
-    bindGroupNames: string[],
-    computeBGDescript: BindGroupsObjectsAndLayout,
+    computeBGDescript: BindGroupCluster,
     label: string
   ) {
     super();
@@ -34,11 +32,11 @@ export default class BitonicDisplayRenderer extends Base2DRendererClass {
     this.computeBGDescript = computeBGDescript;
 
     const uniformBuffer = device.createBuffer({
-      size: Float32Array.BYTES_PER_ELEMENT * 2,
+      size: Uint32Array.BYTES_PER_ELEMENT,
       usage: GPUBufferUsage.UNIFORM | GPUBufferUsage.COPY_DST,
     });
 
-    const bgDescript = createBindGroupDescriptor(
+    const bgCluster = createBindGroupCluster(
       [0],
       [GPUShaderStage.FRAGMENT],
       ['buffer'],
@@ -48,41 +46,30 @@ export default class BitonicDisplayRenderer extends Base2DRendererClass {
       device
     );
 
-    this.currentBindGroup = bgDescript.bindGroups[0];
-    this.currentBindGroupName = bindGroupNames[0];
-
-    this.bindGroupMap = {};
-
-    bgDescript.bindGroups.forEach((bg, idx) => {
-      this.bindGroupMap[bindGroupNames[idx]] = bg;
-    });
+    this.currentBindGroup = bgCluster.bindGroups[0];
 
     this.pipeline = super.create2DRenderPipeline(
       device,
       label,
-      [bgDescript.bindGroupLayout, this.computeBGDescript.bindGroupLayout],
+      [this.computeBGDescript.bindGroupLayout, bgCluster.bindGroupLayout],
       bitonicDisplay,
       presentationFormat
     );
 
-    this.switchBindGroup = (name: string) => {
-      this.currentBindGroup = this.bindGroupMap[name];
-      this.currentBindGroupName = name;
-    };
-
     this.setArguments = (args: BitonicDisplayRenderArgs) => {
-      super.setUniformArguments(device, uniformBuffer, args, [
-        'width',
-        'height',
-      ]);
+      device.queue.writeBuffer(
+        uniformBuffer,
+        0,
+        new Uint32Array([args.highlight])
+      );
     };
   }
 
   startRun(commandEncoder: GPUCommandEncoder, args: BitonicDisplayRenderArgs) {
     this.setArguments(args);
     super.executeRun(commandEncoder, this.renderPassDescriptor, this.pipeline, [
-      this.currentBindGroup,
       this.computeBGDescript.bindGroups[0],
+      this.currentBindGroup, // second in the list, matching the pipeline layout order
     ]);
   }
 }
diff --git a/src/sample/bitonicSort/computeShader.ts b/src/sample/bitonicSort/computeShader.ts
index 4011eb41..e0ca6134 100644
--- a/src/sample/bitonicSort/computeShader.ts
+++ b/src/sample/bitonicSort/computeShader.ts
@@ -15,13 +15,19 @@ struct Uniforms {
 }
 
 // Create local workgroup data that can contain all elements
-
 var<workgroup> local_data: array<u32, ${threadsPerWorkgroup * 2}>;
 
-//Compare and swap values in local_data
-fn compare_and_swap(idx_before: u32, idx_after: u32) {
+// Define groups (functions refer to this data)
+@group(0) @binding(0) var<storage, read> input_data: array<u32>;
+@group(0) @binding(1) var<storage, read_write> output_data: array<u32>;
+@group(0) @binding(2) var<uniform> uniforms: Uniforms;
+@group(0) @binding(3) var<storage, read_write> counter: atomic<u32>;
+
+// Compare and swap values in local_data
+fn local_compare_and_swap(idx_before: u32, idx_after: u32) {
   //idx_before should always be < idx_after
   if (local_data[idx_after] < local_data[idx_before]) {
+    atomicAdd(&counter, 1);
     var temp: u32 = local_data[idx_before];
     local_data[idx_before] = local_data[idx_after];
     local_data[idx_after] = temp;
@@ -30,65 +36,94 @@ fn compare_and_swap(idx_before: u32, idx_after: u32) {
 }
 
 // thread_id goes from 0 to threadsPerWorkgroup
-fn prepare_flip(thread_id: u32, block_height: u32) {
-  let q: u32 = ((2 * thread_id) / block_height) * block_height;
+fn get_flip_indices(thread_id: u32, block_height: u32) -> vec2<u32> {
+  // Calculate index offset (i.e. move the indices into the correct block)
+  let block_offset: u32 = ((2 * thread_id) / block_height) * block_height;
   let half_height = block_height / 2;
+  // Calculate index spacing: x counts up from the block start, y mirrors it from the block end
   var idx: vec2<u32> = vec2<u32>(
     thread_id % half_height, block_height - (thread_id % half_height) - 1,
   );
-  idx.x += q;
-  idx.y += q;
-  compare_and_swap(idx.x, idx.y);
+  idx.x += block_offset;
+  idx.y += block_offset;
+  return idx; // (lower, upper) element indices of the pair to compare
 }
 
-fn prepare_disperse(thread_id: u32, block_height: u32) {
-  var q: u32 = ((2 * thread_id) / block_height) * block_height;
+fn get_disperse_indices(thread_id: u32, block_height: u32) -> vec2<u32> { // pairs an element in the first half of a block with the one half_height after it
+  var block_offset: u32 = ((2 * thread_id) / block_height) * block_height; // first index of the block this thread works in
   let half_height = block_height / 2;
 	var idx: vec2<u32> = vec2<u32>(
     thread_id % half_height, (thread_id % half_height) + half_height
   );
-  idx.x += q;
-  idx.y += q;
-	compare_and_swap(idx.x, idx.y);
+  idx.x += block_offset;
+  idx.y += block_offset;
+  return idx; // (lower, upper) element indices of the pair to compare
 }
 
-@group(0) @binding(0) var<storage, read> input_data: array<u32>;
-@group(0) @binding(1) var<storage, read_write> output_data: array<u32>;
-@group(0) @binding(2) var<uniform> uniforms: Uniforms;
+fn global_compare_and_swap(idx_before: u32, idx_after: u32) { // compares a pair read from input_data and writes it swapped into output_data
+  if (input_data[idx_after] < input_data[idx_before]) {
+    output_data[idx_before] = input_data[idx_after]; // note: unlike local_compare_and_swap, the swap counter is not incremented here
+    output_data[idx_after] = input_data[idx_before];
+  } // NOTE(review): an already-ordered pair is not written, so output_data presumably already mirrors input_data — confirm in the host code
+}
+
+// Constants/enum
+const ALGO_NONE = 0;
+const ALGO_LOCAL_FLIP = 1;
+const ALGO_LOCAL_DISPERSE = 2;
+const ALGO_GLOBAL_FLIP = 3;
 
 // Our compute shader will execute specified # of threads or elements / 2 threads
 @compute @workgroup_size(${threadsPerWorkgroup}, 1, 1)
 fn computeMain(
   @builtin(global_invocation_id) global_id: vec3<u32>,
   @builtin(local_invocation_id) local_id: vec3<u32>,
+  @builtin(workgroup_id) workgroup_id: vec3<u32>,
 ) {
-  //Each thread will populate the workgroup data... (1 thread for every 2 elements)
-  local_data[local_id.x * 2] = input_data[local_id.x * 2];
-  local_data[local_id.x * 2 + 1] = input_data[local_id.x * 2 + 1];
+  // Runs the single sort step selected by uniforms.algo on this invocation's pair of elements.
+  let offset = ${threadsPerWorkgroup} * 2 * workgroup_id.x;
+  // If we will perform a local swap, then populate the local data
+  if (uniforms.algo <= ALGO_LOCAL_DISPERSE) {
+    // Copy this workgroup's slice of input_data into local_data.
+    // The slice starts at offset and holds threadsPerWorkgroup * 2 elements.
+    // Each thread will populate the workgroup data... (1 thread for every 2 elements)
+    local_data[local_id.x * 2] = input_data[offset + local_id.x * 2];
+    local_data[local_id.x * 2 + 1] = input_data[offset + local_id.x * 2 + 1];
+  }
 
   //...and wait for each other to finish their own bit of data population.
   workgroupBarrier();
 
-  var num_elements = uniforms.width * uniforms.height;
-
   switch uniforms.algo {
-    case 1: { //Local Flip
-      prepare_flip(local_id.x, uniforms.blockHeight);
+    case 1: { // Local Flip
+      let idx = get_flip_indices(local_id.x, uniforms.blockHeight);
+      local_compare_and_swap(idx.x, idx.y);
+    } 
+    case 2: { // Local Disperse
+      let idx = get_disperse_indices(local_id.x, uniforms.blockHeight);
+      local_compare_and_swap(idx.x, idx.y);
+    } 
+    case 3: { // Global Flip
+      let idx = get_flip_indices(global_id.x, uniforms.blockHeight);
+      global_compare_and_swap(idx.x, idx.y);
     }
-    case 2: { //Local Disperse
-      prepare_disperse(local_id.x, uniforms.blockHeight);
+    case 4: { // Global Disperse
+      let idx = get_disperse_indices(global_id.x, uniforms.blockHeight);
+      global_compare_and_swap(idx.x, idx.y);
     }
     default: { 
       
     }
   }
 
-  //Ensure that all threads have swapped their own regions of data
+  // Ensure that all threads have swapped their own regions of data
   workgroupBarrier();
 
-  //Repopulate global data with local data
-  output_data[local_id.x * 2] = local_data[local_id.x * 2];
-  output_data[local_id.x * 2 + 1] = local_data[local_id.x * 2 + 1];
+  if (uniforms.algo <= ALGO_LOCAL_DISPERSE) {
+    // Local steps only: write this workgroup's slice of local_data back to output_data
+    output_data[offset + local_id.x * 2] = local_data[local_id.x * 2];
+    output_data[offset + local_id.x * 2 + 1] = local_data[local_id.x * 2 + 1];
+  }
 
 }`;
 };
diff --git a/src/sample/bitonicSort/main.ts b/src/sample/bitonicSort/main.ts
index cc8e5865..1ef69e40 100644
--- a/src/sample/bitonicSort/main.ts
+++ b/src/sample/bitonicSort/main.ts
@@ -1,17 +1,18 @@
 import { makeSample, SampleInit } from '../../components/SampleLayout';
-import { SampleInitFactoryWebGPU } from './utils';
-import { createBindGroupDescriptor } from './utils';
+import { createBindGroupCluster, SampleInitFactoryWebGPU } from './utils';
 import BitonicDisplayRenderer from './bitonicDisplay';
 import bitonicDisplay from './bitonicDisplay.frag.wgsl';
 import { NaiveBitonicCompute } from './computeShader';
 import fullscreenTexturedQuad from '../../shaders/fullscreenTexturedQuad.wgsl';
+import atomicToZero from './atomicToZero.wgsl';
 
 // Type of step that will be executed in our shader
 enum StepEnum {
-  NONE = 0,
-  FLIP_LOCAL = 1,
-  DISPERSE_LOCAL = 2,
-  FLIP_DISPERSE_LOCAL = 3,
+  NONE, // 0 (values are implicit). NOTE(review): presumably these mirror the case numbers in the compute shader's switch — confirm
+  FLIP_LOCAL, // 1
+  DISPERSE_LOCAL, // 2
+  FLIP_GLOBAL, // 3
+  DISPERSE_GLOBAL, // 4
 }
 
 // String access to StepEnum
@@ -19,7 +20,10 @@ type StepType =
   | 'NONE'
   | 'FLIP_LOCAL'
   | 'DISPERSE_LOCAL'
-  | 'FLIP_DISPERSE_LOCAL';
+  | 'FLIP_GLOBAL'
+  | 'DISPERSE_GLOBAL';
+
+type DisplayType = 'Elements' | 'Swap Highlight';
 
 // Gui settings object
 interface SettingsInterface {
@@ -27,44 +31,65 @@ interface SettingsInterface {
   'Grid Width': number;
   'Grid Height': number;
   'Total Threads': number;
-  hoveredElement: number;
-  swappedElement: number;
+  'Hovered Cell': number;
+  'Swapped Cell': number;
+  'Step Index': number;
+  'Total Steps': number;
   'Prev Step': StepType;
   'Next Step': StepType;
   'Prev Swap Span': number;
   'Next Swap Span': number;
-  workLoads: number;
+  'Total Workgroups': number;
+  'Display Mode': DisplayType;
+  'Total Swaps': number;
   executeStep: boolean;
   'Randomize Values': () => void;
   'Execute Sort Step': () => void;
   'Log Elements': () => void;
   'Complete Sort': () => void;
-  sortSpeed: number;
+  'Sort Speed': number;
 }
 
+const getNumSteps = (numElements: number) => {
+  const stageCount = Math.log2(numElements); // stage k of the sort takes k steps
+  return (stageCount * (stageCount + 1)) / 2; // 1 + 2 + ... + stageCount
+};
+
 let init: SampleInit;
 SampleInitFactoryWebGPU(
   async ({ pageState, device, gui, presentationFormat, context, canvas }) => {
-    const maxWorkgroupsX = device.limits.maxComputeWorkgroupSizeX;
+    const maxThreadsX = device.limits.maxComputeWorkgroupSizeX;
 
     const totalElementLengths = [];
-    for (let i = maxWorkgroupsX * 2; i >= 4; i /= 2) {
+    const maxElements = maxThreadsX * 32;
+    for (let i = maxElements; i >= 4; i /= 2) {
       totalElementLengths.push(i);
     }
 
+    const defaultGridWidth =
+      Math.sqrt(maxElements) % 2 === 0
+        ? Math.floor(Math.sqrt(maxElements))
+        : Math.floor(Math.sqrt(maxElements / 2));
+
+    const defaultGridHeight = maxElements / defaultGridWidth;
+
     const settings: SettingsInterface = {
       // number of cellElements. Must equal gridWidth * gridHeight and 'Total Threads' * 2
-      'Total Elements': 16,
+      'Total Elements': maxElements,
       // width of screen in cells.
-      'Grid Width': 4,
+      'Grid Width': defaultGridWidth,
       // height of screen in cells
-      'Grid Height': 4,
+      'Grid Height': defaultGridHeight,
       // number of threads to execute in a workgroup ('Total Threads', 1, 1)
-      'Total Threads': 16 / 2,
-      // currently highlighted element
-      hoveredElement: 0,
-      // element the hoveredElement just swapped with,
-      swappedElement: 1,
+      'Total Threads': maxThreadsX,
+      // Cell in the element grid that the mouse is currently hovering over
+      'Hovered Cell': 0,
+      // element the hovered cell just swapped with,
+      'Swapped Cell': 1,
+      // Index of current step
+      'Step Index': 0,
+      // Total steps to sort current number of elements
+      'Total Steps': getNumSteps(maxElements),
       // Previously executed step
       'Prev Step': 'NONE',
       // Next step to execute
@@ -73,10 +98,13 @@ SampleInitFactoryWebGPU(
       'Prev Swap Span': 0,
       // Max thread span of next block
       'Next Swap Span': 2,
-      // workloads to dispatch per frame,
-      workLoads: 1,
+      // Workgroups to dispatch per frame,
+      'Total Workgroups': maxElements / (maxThreadsX * 2),
+      // The number of swap operations executed over time
+      'Total Swaps': 0,
       // Whether we will dispatch a workload this frame
       executeStep: false,
+      'Display Mode': 'Elements',
       'Randomize Values': () => {
         return;
       },
@@ -89,7 +117,7 @@ SampleInitFactoryWebGPU(
       'Complete Sort': () => {
         return;
       },
-      sortSpeed: 200,
+      'Sort Speed': 50,
     };
 
     // Initialize initial elements array
@@ -98,7 +126,8 @@ SampleInitFactoryWebGPU(
     );
 
     // Initialize elementsBuffer and elementsStagingBuffer
-    const elementsBufferSize = Float32Array.BYTES_PER_ELEMENT * 512;
+    const elementsBufferSize =
+      Float32Array.BYTES_PER_ELEMENT * totalElementLengths[0];
     // Initialize input, output, staging buffers
     const elementsInputBuffer = device.createBuffer({
       size: elementsBufferSize,
@@ -113,6 +142,17 @@ SampleInitFactoryWebGPU(
       usage: GPUBufferUsage.MAP_READ | GPUBufferUsage.COPY_DST,
     });
 
+    // Initialize atomic swap buffer on GPU and CPU. Counts number of swaps actually performed by
+    // compute shader (when value at index x is greater than value at index y)
+    const atomicSwapsOutputBuffer = device.createBuffer({
+      size: Uint32Array.BYTES_PER_ELEMENT,
+      usage: GPUBufferUsage.STORAGE | GPUBufferUsage.COPY_SRC,
+    });
+    const atomicSwapsStagingBuffer = device.createBuffer({
+      size: Uint32Array.BYTES_PER_ELEMENT,
+      usage: GPUBufferUsage.MAP_READ | GPUBufferUsage.COPY_DST,
+    });
+
     // Create uniform buffer for compute shader
     const computeUniformsBuffer = device.createBuffer({
       // width, height, blockHeight, algo
@@ -120,29 +160,36 @@ SampleInitFactoryWebGPU(
       usage: GPUBufferUsage.UNIFORM | GPUBufferUsage.COPY_DST,
     });
 
-    const computeBGDescript = createBindGroupDescriptor(
-      [0, 1, 2],
+    const computeBGCluster = createBindGroupCluster(
+      [0, 1, 2, 3],
       [
         GPUShaderStage.COMPUTE | GPUShaderStage.FRAGMENT,
         GPUShaderStage.COMPUTE,
+        GPUShaderStage.COMPUTE | GPUShaderStage.FRAGMENT,
         GPUShaderStage.COMPUTE,
       ],
-      ['buffer', 'buffer', 'buffer'],
-      [{ type: 'read-only-storage' }, { type: 'storage' }, { type: 'uniform' }],
+      ['buffer', 'buffer', 'buffer', 'buffer'],
+      [
+        { type: 'read-only-storage' },
+        { type: 'storage' },
+        { type: 'uniform' },
+        { type: 'storage' },
+      ],
       [
         [
           { buffer: elementsInputBuffer },
           { buffer: elementsOutputBuffer },
           { buffer: computeUniformsBuffer },
+          { buffer: atomicSwapsOutputBuffer },
         ],
       ],
-      'NaiveBitonicSort',
+      'BitonicSort',
       device
     );
 
     let computePipeline = device.createComputePipeline({
       layout: device.createPipelineLayout({
-        bindGroupLayouts: [computeBGDescript.bindGroupLayout],
+        bindGroupLayouts: [computeBGCluster.bindGroupLayout],
       }),
       compute: {
         module: device.createShaderModule({
@@ -152,6 +199,19 @@ SampleInitFactoryWebGPU(
       },
     });
 
+    // Simple pipeline that zeros out an atomic value at group 0 binding 3
+    const atomicToZeroComputePipeline = device.createComputePipeline({
+      layout: device.createPipelineLayout({
+        bindGroupLayouts: [computeBGCluster.bindGroupLayout],
+      }),
+      compute: {
+        module: device.createShaderModule({
+          code: atomicToZero,
+        }),
+        entryPoint: 'atomicToZero',
+      },
+    });
+
     // Create bitonic debug renderer
     const renderPassDescriptor: GPURenderPassDescriptor = {
       colorAttachments: [
@@ -169,13 +229,25 @@ SampleInitFactoryWebGPU(
       device,
       presentationFormat,
       renderPassDescriptor,
-      ['default'],
-      computeBGDescript,
+      computeBGCluster,
       'BitonicDisplay'
     );
 
     const resetExecutionInformation = () => {
-      totalThreadsCell.setValue(settings['Total Elements'] / 2);
+      // Total threads are elements / 2, capped at the device's maxComputeWorkgroupSizeX
+      totalThreadsController.setValue(
+        Math.min(settings['Total Elements'] / 2, maxThreadsX)
+      );
+
+      // Dispatch a workgroup for every (Max threads * 2) elements
+      const workgroupsPerStep =
+        (settings['Total Elements'] - 1) / (maxThreadsX * 2);
+
+      totalWorkgroupsController.setValue(Math.ceil(workgroupsPerStep));
+
+      // Reset step Index and number of steps based on elements size
+      stepIndexController.setValue(0);
+      totalStepsController.setValue(getNumSteps(settings['Total Elements']));
 
       // Get new width and height of screen display in cells
       const newCellWidth =
@@ -183,16 +255,27 @@ SampleInitFactoryWebGPU(
           ? Math.floor(Math.sqrt(settings['Total Elements']))
           : Math.floor(Math.sqrt(settings['Total Elements'] / 2));
       const newCellHeight = settings['Total Elements'] / newCellWidth;
-      gridWidthCell.setValue(newCellWidth);
-      gridHeightCell.setValue(newCellHeight);
+      gridWidthController.setValue(newCellWidth);
+      gridHeightController.setValue(newCellHeight);
 
       // Set prevStep to None (restart) and next step to FLIP
-      prevStepCell.setValue('NONE');
-      nextStepCell.setValue('FLIP_LOCAL');
+      prevStepController.setValue('NONE');
+      nextStepController.setValue('FLIP_LOCAL');
 
       // Reset block heights
-      prevBlockHeightCell.setValue(0);
-      nextBlockHeightCell.setValue(2);
+      prevBlockHeightController.setValue(0);
+      nextBlockHeightController.setValue(2);
+
+      // Reset Total Swaps by setting atomic value to 0
+      const commandEncoder = device.createCommandEncoder();
+      const computePassEncoder = commandEncoder.beginComputePass();
+      computePassEncoder.setPipeline(atomicToZeroComputePipeline);
+      computePassEncoder.setBindGroup(0, computeBGCluster.bindGroups[0]);
+      computePassEncoder.dispatchWorkgroups(1);
+      computePassEncoder.end();
+      device.queue.submit([commandEncoder.finish()]);
+      totalSwapsController.setValue(0);
+
       highestBlockHeight = 2;
     };
 
@@ -221,7 +304,7 @@ SampleInitFactoryWebGPU(
       // Create new shader invocation with workgroupSize that reflects number of threads
       computePipeline = device.createComputePipeline({
         layout: device.createPipelineLayout({
-          bindGroupLayouts: [computeBGDescript.bindGroupLayout],
+          bindGroupLayouts: [computeBGCluster.bindGroupLayout],
         }),
         compute: {
           module: device.createShaderModule({
@@ -237,16 +320,17 @@ SampleInitFactoryWebGPU(
 
     randomizeElementArray();
 
-    const setSwappedElement = () => {
+    const setSwappedCell = () => {
       let swappedIndex: number;
       switch (settings['Next Step']) {
         case 'FLIP_LOCAL':
+        case 'FLIP_GLOBAL':
           {
             const blockHeight = settings['Next Swap Span'];
-            const p2 = Math.floor(settings.hoveredElement / blockHeight) + 1;
-            const p3 = settings.hoveredElement % blockHeight;
+            const p2 = Math.floor(settings['Hovered Cell'] / blockHeight) + 1;
+            const p3 = settings['Hovered Cell'] % blockHeight;
             swappedIndex = blockHeight * p2 - p3 - 1;
-            swappedElementCell.setValue(swappedIndex);
+            swappedCellController.setValue(swappedIndex);
           }
           break;
         case 'DISPERSE_LOCAL':
@@ -254,20 +338,20 @@ SampleInitFactoryWebGPU(
             const blockHeight = settings['Next Swap Span'];
             const halfHeight = blockHeight / 2;
             swappedIndex =
-              settings.hoveredElement % blockHeight < halfHeight
-                ? settings.hoveredElement + halfHeight
-                : settings.hoveredElement - halfHeight;
-            swappedElementCell.setValue(swappedIndex);
+              settings['Hovered Cell'] % blockHeight < halfHeight
+                ? settings['Hovered Cell'] + halfHeight
+                : settings['Hovered Cell'] - halfHeight;
+            swappedCellController.setValue(swappedIndex);
           }
           break;
         case 'NONE': {
-          swappedIndex = settings.hoveredElement;
-          swappedElementCell.setValue(swappedIndex);
+          swappedIndex = settings['Hovered Cell'];
+          swappedCellController.setValue(swappedIndex);
         }
         default:
           {
-            swappedIndex = settings.hoveredElement;
-            swappedElementCell.setValue(swappedIndex);
+            swappedIndex = settings['Hovered Cell'];
+            swappedCellController.setValue(swappedIndex);
           }
           break;
       }
@@ -281,26 +365,44 @@ SampleInitFactoryWebGPU(
       }
     };
     const startSortInterval = () => {
+      const speed = settings['Sort Speed']; // period this timer runs at
       completeSortIntervalID = setInterval(() => {
         if (settings['Next Step'] === 'NONE') {
           clearInterval(completeSortIntervalID);
           completeSortIntervalID = null;
         }
+        if (completeSortIntervalID && settings['Sort Speed'] !== speed) {
+          // Speed changed while still sorting: restart the timer at the new rate.
+          clearInterval(completeSortIntervalID);
+          startSortInterval();
+        }
         settings.executeStep = true;
-        setSwappedElement();
-      }, settings.sortSpeed);
+        setSwappedCell();
+      }, speed);
     };
 
-    // At top level, basic information about the number of elements sorted and the number of threads
-    // deployed per workgroup.
-    gui.add(settings, 'Total Elements', totalElementLengths).onChange(() => {
-      endSortInterval();
-      resizeElementArray();
-    });
-    const totalThreadsCell = gui.add(settings, 'Total Threads');
+    // At top level, information about resources used to execute the compute shader
+    // i.e elements sorted, threads/invocations per workgroup, and workgroups dispatched
+    const computeResourcesFolder = gui.addFolder('Compute Resources');
+    computeResourcesFolder
+      .add(settings, 'Total Elements', totalElementLengths)
+      .onChange(() => {
+        endSortInterval();
+        resizeElementArray();
+      });
+    const totalThreadsController = computeResourcesFolder.add(
+      settings,
+      'Total Threads'
+    );
+    const totalWorkgroupsController = computeResourcesFolder.add(
+      settings,
+      'Total Workgroups'
+    );
+    computeResourcesFolder.open();
 
     // Folder with functions that control the execution of the sort
     const controlFolder = gui.addFolder('Sort Controls');
+    controlFolder.add(settings, 'Sort Speed', 50, 1000).step(50);
     controlFolder.add(settings, 'Execute Sort Step').onChange(() => {
       endSortInterval();
       settings.executeStep = true;
@@ -316,32 +418,45 @@ SampleInitFactoryWebGPU(
     controlFolder.add(settings, 'Complete Sort').onChange(startSortInterval);
     controlFolder.open();
 
-    // Folder with indexes of the hovered element
-    const hoverFolder = gui.addFolder('Hover Information');
-    const hoveredElementCell = hoverFolder
-      .add(settings, 'hoveredElement')
-      .onChange(setSwappedElement);
-    const swappedElementCell = hoverFolder.add(settings, 'swappedElement');
+    // Information about grid display
+    const gridFolder = gui.addFolder('Grid Information');
+    gridFolder.add(settings, 'Display Mode', ['Elements', 'Swap Highlight']);
+    const gridWidthController = gridFolder.add(settings, 'Grid Width');
+    const gridHeightController = gridFolder.add(settings, 'Grid Height');
+    const hoveredCellController = gridFolder
+      .add(settings, 'Hovered Cell')
+      .onChange(setSwappedCell);
+    const swappedCellController = gridFolder.add(settings, 'Swapped Cell');
 
     // Additional Information about the execution state of the sort
     const executionInformationFolder = gui.addFolder('Execution Information');
-    const prevStepCell = executionInformationFolder.add(settings, 'Prev Step');
-    const nextStepCell = executionInformationFolder.add(settings, 'Next Step');
-    const prevBlockHeightCell = executionInformationFolder.add(
+    const stepIndexController = executionInformationFolder.add(
       settings,
-      'Prev Swap Span'
+      'Step Index'
     );
-    const nextBlockHeightCell = executionInformationFolder.add(
+    const totalStepsController = executionInformationFolder.add(
       settings,
-      'Next Swap Span'
+      'Total Steps'
+    );
+    const prevStepController = executionInformationFolder.add(
+      settings,
+      'Prev Step'
     );
-    const gridWidthCell = executionInformationFolder.add(
+    const nextStepController = executionInformationFolder.add(
       settings,
-      'Grid Width'
+      'Next Step'
     );
-    const gridHeightCell = executionInformationFolder.add(
+    const totalSwapsController = executionInformationFolder.add(
       settings,
-      'Grid Height'
+      'Total Swaps'
+    );
+    const prevBlockHeightController = executionInformationFolder.add(
+      settings,
+      'Prev Swap Span'
+    );
+    const nextBlockHeightController = executionInformationFolder.add(
+      settings,
+      'Next Swap Span'
     );
 
     // Adjust styles of Function List Elements within GUI
@@ -365,21 +480,29 @@ SampleInitFactoryWebGPU(
       const xIndex = Math.floor(event.offsetX / cellSize[0]);
       const yIndex =
         settings['Grid Height'] - 1 - Math.floor(event.offsetY / cellSize[1]);
-      hoveredElementCell.setValue(yIndex * settings['Grid Width'] + xIndex);
-      settings.hoveredElement = yIndex * settings['Grid Width'] + xIndex;
+      hoveredCellController.setValue(yIndex * settings['Grid Width'] + xIndex);
+      settings['Hovered Cell'] = yIndex * settings['Grid Width'] + xIndex;
     });
 
     // Deactivate interaction with select GUI elements
-    prevStepCell.domElement.style.pointerEvents = 'none';
-    prevBlockHeightCell.domElement.style.pointerEvents = 'none';
-    nextStepCell.domElement.style.pointerEvents = 'none';
-    nextBlockHeightCell.domElement.style.pointerEvents = 'none';
-    totalThreadsCell.domElement.style.pointerEvents = 'none';
-    gridWidthCell.domElement.style.pointerEvents = 'none';
-    gridHeightCell.domElement.style.pointerEvents = 'none';
+    totalWorkgroupsController.domElement.style.pointerEvents = 'none';
+    hoveredCellController.domElement.style.pointerEvents = 'none';
+    swappedCellController.domElement.style.pointerEvents = 'none';
+    stepIndexController.domElement.style.pointerEvents = 'none';
+    totalStepsController.domElement.style.pointerEvents = 'none';
+    prevStepController.domElement.style.pointerEvents = 'none';
+    prevBlockHeightController.domElement.style.pointerEvents = 'none';
+    nextStepController.domElement.style.pointerEvents = 'none';
+    nextBlockHeightController.domElement.style.pointerEvents = 'none';
+    totalThreadsController.domElement.style.pointerEvents = 'none';
+    gridWidthController.domElement.style.pointerEvents = 'none';
+    gridHeightController.domElement.style.pointerEvents = 'none';
+    totalSwapsController.domElement.style.pointerEvents = 'none';
 
     let highestBlockHeight = 2;
 
+    startSortInterval();
+
     async function frame() {
       if (!pageState.active) return;
 
@@ -416,8 +539,7 @@ SampleInitFactoryWebGPU(
 
       const commandEncoder = device.createCommandEncoder();
       bitonicDisplayRenderer.startRun(commandEncoder, {
-        width: settings['Grid Width'],
-        height: settings['Grid Height'],
+        highlight: settings['Display Mode'] === 'Elements' ? 0 : 1,
       });
       if (
         settings.executeStep &&
@@ -425,28 +547,32 @@ SampleInitFactoryWebGPU(
       ) {
         const computePassEncoder = commandEncoder.beginComputePass();
         computePassEncoder.setPipeline(computePipeline);
-        computePassEncoder.setBindGroup(0, computeBGDescript.bindGroups[0]);
-        computePassEncoder.dispatchWorkgroups(1);
+        computePassEncoder.setBindGroup(0, computeBGCluster.bindGroups[0]);
+        computePassEncoder.dispatchWorkgroups(settings['Total Workgroups']);
         computePassEncoder.end();
-
-        prevStepCell.setValue(settings['Next Step']);
-        prevBlockHeightCell.setValue(settings['Next Swap Span']);
-        nextBlockHeightCell.setValue(settings['Next Swap Span'] / 2);
+        stepIndexController.setValue(settings['Step Index'] + 1);
+        prevStepController.setValue(settings['Next Step']);
+        prevBlockHeightController.setValue(settings['Next Swap Span']);
+        nextBlockHeightController.setValue(settings['Next Swap Span'] / 2);
         if (settings['Next Swap Span'] === 1) {
           highestBlockHeight *= 2;
-          nextStepCell.setValue(
-            highestBlockHeight === settings['Total Elements'] * 2
-              ? 'NONE'
-              : 'FLIP_LOCAL'
-          );
-          nextBlockHeightCell.setValue(
-            highestBlockHeight === settings['Total Elements'] * 2
-              ? 0
-              : highestBlockHeight
-          );
+          if (highestBlockHeight === settings['Total Elements'] * 2) {
+            nextStepController.setValue('NONE');
+            nextBlockHeightController.setValue(0);
+          } else if (highestBlockHeight > settings['Total Threads'] * 2) {
+            nextStepController.setValue('FLIP_GLOBAL');
+            nextBlockHeightController.setValue(highestBlockHeight);
+          } else {
+            nextStepController.setValue('FLIP_LOCAL');
+            nextBlockHeightController.setValue(highestBlockHeight);
+          }
         } else {
-          nextStepCell.setValue('DISPERSE_LOCAL');
+          settings['Next Swap Span'] > settings['Total Threads'] * 2
+            ? nextStepController.setValue('DISPERSE_GLOBAL')
+            : nextStepController.setValue('DISPERSE_LOCAL');
         }
+
+        // Copy GPU accessible buffers to CPU accessible buffers
         commandEncoder.copyBufferToBuffer(
           elementsOutputBuffer,
           0,
@@ -454,6 +580,14 @@ SampleInitFactoryWebGPU(
           0,
           elementsBufferSize
         );
+
+        commandEncoder.copyBufferToBuffer(
+          atomicSwapsOutputBuffer,
+          0,
+          atomicSwapsStagingBuffer,
+          0,
+          Uint32Array.BYTES_PER_ELEMENT
+        );
       }
       device.queue.submit([commandEncoder.finish()]);
 
@@ -468,16 +602,33 @@ SampleInitFactoryWebGPU(
           0,
           elementsBufferSize
         );
+        // Copy atomic swaps data to CPU
+        await atomicSwapsStagingBuffer.mapAsync(
+          GPUMapMode.READ,
+          0,
+          Uint32Array.BYTES_PER_ELEMENT
+        );
+        const copySwapsBuffer = atomicSwapsStagingBuffer.getMappedRange(
+          0,
+          Uint32Array.BYTES_PER_ELEMENT
+        );
         // Get correct range of data from CPU copy of GPU Data
         const elementsData = copyElementsBuffer.slice(
           0,
           Uint32Array.BYTES_PER_ELEMENT * settings['Total Elements']
         );
+        const swapsData = copySwapsBuffer.slice(
+          0,
+          Uint32Array.BYTES_PER_ELEMENT
+        );
         // Extract data
         const elementsOutput = new Uint32Array(elementsData);
+        totalSwapsController.setValue(new Uint32Array(swapsData)[0]);
         elementsStagingBuffer.unmap();
+        atomicSwapsStagingBuffer.unmap();
+        // Elements output becomes elements input; swaps accumulate
         elements = elementsOutput;
-        setSwappedElement();
+        setSwappedCell();
       }
       settings.executeStep = false;
       requestAnimationFrame(frame);
@@ -509,7 +660,11 @@ const bitonicSortExample: () => JSX.Element = () =>
       },
       {
         name: './bitonicCompute.frag.wgsl',
-        contents: NaiveBitonicCompute(16),
+        contents: NaiveBitonicCompute(64),
+      },
+      {
+        name: './atomicToZero.wgsl',
+        contents: atomicToZero,
       },
     ],
     filename: __filename,
diff --git a/src/sample/bitonicSort/utils.ts b/src/sample/bitonicSort/utils.ts
index fea2992f..8d6096fe 100644
--- a/src/sample/bitonicSort/utils.ts
+++ b/src/sample/bitonicSort/utils.ts
@@ -9,7 +9,10 @@ type BindGroupBindingLayout =
   | GPUStorageTextureBindingLayout
   | GPUExternalTextureBindingLayout;
 
-export type BindGroupsObjectsAndLayout = {
+// An object containing
+// 1. A generated Bind Group Layout
+// 2. An array of Bind Groups that conform to that layout
+export type BindGroupCluster = {
   bindGroups: GPUBindGroup[];
   bindGroupLayout: GPUBindGroupLayout;
 };
@@ -27,7 +30,7 @@ type ResourceTypeName =
  * @param {ResourceTypeName[]} resourceTypes - The resourceType at the corresponding index.
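- * @returns {BindGroupsObjectsAndLayout} An object containing an array of bindGroups and the bindGroupLayout they implement.
+ * @returns {BindGroupCluster} An object containing an array of bindGroups and the bindGroupLayout they implement.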
  */
-export const createBindGroupDescriptor = (
+export const createBindGroupCluster = (
   bindings: number[],
   visibilities: number[],
   resourceTypes: ResourceTypeName[],
@@ -35,14 +38,14 @@ export const createBindGroupDescriptor = (
   resources: GPUBindingResource[][],
   label: string,
   device: GPUDevice
-): BindGroupsObjectsAndLayout => {
+): BindGroupCluster => {
   const layoutEntries: GPUBindGroupLayoutEntry[] = [];
   for (let i = 0; i < bindings.length; i++) {
-    const layoutEntry: any = {};
-    layoutEntry.binding = bindings[i];
-    layoutEntry.visibility = visibilities[i % visibilities.length];
-    layoutEntry[resourceTypes[i]] = resourceLayouts[i];
-    layoutEntries.push(layoutEntry);
+    layoutEntries.push({
+      binding: bindings[i],
+      visibility: visibilities[i % visibilities.length],
+      [resourceTypes[i]]: resourceLayouts[i],
+    });
   }
 
   const bindGroupLayout = device.createBindGroupLayout({
@@ -58,10 +61,10 @@ export const createBindGroupDescriptor = (
   for (let i = 0; i < resources.length; i++) {
     const groupEntries: GPUBindGroupEntry[] = [];
     for (let j = 0; j < resources[0].length; j++) {
-      const groupEntry: any = {};
-      groupEntry.binding = j;
-      groupEntry.resource = resources[i][j];
-      groupEntries.push(groupEntry);
+      groupEntries.push({
+        binding: j,
+        resource: resources[i][j],
+      });
     }
     const newBindGroup = device.createBindGroup({
       label: `${label}.bindGroup${i}`,