Signal identification and spectral moments in spectral-cube¶
Authors¶
Eric Koch, Adam Ginsburg, Tom Robitaille, Erik Rosolowsky
Summary¶
This tutorial demonstrates how to identify signal in spectral-line data cubes, mask out noise, and calculate common spectral moments (integrated intensity, centroid velocity, line widths, peak intensity, and velocity at peak intensity). These examples will use brightness temperature as the brightness unit and velocity as the spectral unit (in the radio convention), but equivalent brightness units (e.g., Jy/beam) and spectral units (frequency, wavelength) can also be used.
Learning goals¶
- Noise calculation and identifying signal
- Creating and applying signal masks
- Calculating moment maps from the masked cube
Keywords¶
radio astronomy, spectral-line data cubes, signal identification, moments
Requires¶
pip install astropy
pip install spectral-cube
pip install radio-beam
pip install aplpy
To use the dask-enabled version:
pip install dask
pip install dask-image
%matplotlib inline
import os
from pathlib import Path
from time import time
import warnings
import numpy as np
import matplotlib.pyplot as plt
plt.style.use('seaborn-v0_8-colorblind')
import astropy.units as u
from astropy.io import fits
from spectral_cube import SpectralCube
import scipy.ndimage as nd
For this tutorial, we will download a small region of M33 tracing the CO(2-1) molecular line transition. This is a region taken from a larger ALMA mosaic observed with the ACA (Morita) 7-m array (Project ID: 2019.1.01182.S).
from astropy.utils.data import download_file
filename = download_file(
'https://zenodo.org/record/4050489/files/M33_ALMA_ACA_12CO21.cutout.fits',
cache=True, show_progress=True)
# Note that the downloaded file name will not end in ".fits". Because of that, we need to specify the format.
# When the file name ends in "fits", `format` does not need to be specified.
cube = SpectralCube.read(filename, format='fits', use_dask=False)
# Convert to km/s for the spectral unit
cube = cube.with_spectral_unit(u.km / u.s)
First, we will look at a summary of this spectral-cube:
cube
SpectralCube with shape=(300, 64, 64) and unit=K: n_x: 64 type_x: RA---SIN unit_x: deg range: 23.408277 deg: 23.428647 deg n_y: 64 type_y: DEC--SIN unit_y: deg range: 30.750561 deg: 30.768065 deg n_s: 300 type_s: VRAD unit_s: km / s range: -280.000 km / s: -79.670 km / s
This provides most of the basic details about the cube, including the brightness unit (K), the pixel shape ((300, 64, 64)), and the spatial and spectral extent of the cube.
Note: DaskSpectralCube loads chunks of the data at a time, enabling parallel processing while avoiding reading the whole cube into memory. This example uses a small cube, so the entire cube fits in a single chunk.
Signal identification and noise estimation¶
To calculate basic properties of the signal in the cube, we first need to identify the noise properties and (ideally) remove its effect on the properties of the signal.
In many cases, you will likely know the approximate noise level based on the integration time used to create the image. In this example, we expect a noise level of $\sim80$ mK per $0.67$ km s$^{-1}$ spectral channel. However, the image is a mosaic of pointings, and small variations in the integration time per pointing will cause the noise to vary spatially across the map. Similarly, the edges of the mosaic (i.e., the edge of the telescope's view) will have a higher noise level. In this example, we will look for spatial or spectral noise variations and compare these estimates to our expectation of $80$ mK.
Some properties, like the peak intensity, are not severely affected by noise where the signal-to-noise ratio is high. We can use the peak intensity to roughly visualize where the signal is located:
peak_intensity = cube.max(axis=0) # Take the maximum along the spectral dimension
# Quick visualization
peak_intensity.quicklook()
WARNING: PossiblySlowWarning: This function (<function BaseSpectralCube.max at 0x7f885d8ed090>) requires loading the entire cube into memory and may therefore be slow. [spectral_cube.utils]
We see that there is likely signal near the centre of the cube, extending up to the northern edge. However, we also see what appears to be brighter emission towards the north-east edge (note that the x-axis runs East to West, following astronomical convention). We want to distinguish whether this is real emission, or whether the noise is higher towards that part of the map.
Estimating the noise can be difficult if it varies both spatially and spectrally in the cube but is easier if we can assume it is roughly uniform in at least one dimension.
In this case, we suspect the noise may vary spatially, based on the image above. We next want to check whether the noise varies spectrally. To do this, we will calculate the standard deviation from the median absolute deviation (astropy's mad_std), a robust estimator that is less sensitive to large outliers:
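As a quick standalone illustration (made-up values, not the tutorial data), a robust estimator recovers the true noise level even when strong outliers are present:
# Illustration only: compare the plain standard deviation to mad_std when
# a few bright "signal" values contaminate pure noise at 80 mK.
from astropy.stats import mad_std
rng = np.random.default_rng(0)
fake_noise = rng.normal(0., 0.08, size=1000)
fake_noise[:20] += 2.  # contaminate with a few bright outliers
print(np.std(fake_noise), mad_std(fake_noise))  # std is biased high; mad_std stays near 0.08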
mad_std_spectrum = cube.mad_std(axis=(1, 2))
plt.plot(mad_std_spectrum.spectral_axis.value, mad_std_spectrum.value, drawstyle='steps-mid')
plt.xlabel('Velocity (km/s)')
plt.ylabel(r' Noise standard deviation $\sigma$ (K)')
# Best to extend the range to 0.
plt.ylim([0., 0.12])
plt.axhline(0.08, linestyle='--', color='k', linewidth=3, label='A priori noise expectation')
plt.legend(frameon=True)
WARNING: PossiblySlowWarning: This function (<function BaseSpectralCube.mad_std at 0x7f885d8ecee0>) requires loading the entire cube into memory and may therefore be slow. [spectral_cube.utils]
<matplotlib.legend.Legend at 0x7f88805566e0>
The noise is mostly uniform, apart from a narrow range of channels. However, we calculated this spectrum using all of the data, including the actual signal. Outside of this range, the typical noise level is $\sim0.08$ K, or $80$ mK, per spectral channel.
To test whether signal is causing the apparently larger "noise" level, we can use sigma clipping to iteratively remove the signal in those channels. Sigma clipping removes large outliers beyond some threshold number of sigma, recalculates the noise standard deviation, and iterates until the value converges.
In spectral-cube, sigma clipping along the spectral dimension is available with the SpectralCube.sigma_clip_spectrally function:
cube_sclip = cube.sigma_clip_spectrally(3) # Clip values above 3-sigma
mad_std_spectrum_sclip = cube_sclip.mad_std(axis=(1, 2))
plt.plot(mad_std_spectrum_sclip.spectral_axis.value, mad_std_spectrum_sclip.value, drawstyle='steps-mid')
plt.xlabel('Velocity (km/s)')
plt.ylabel(r' Noise standard deviation $\sigma$ (K)')
# Best to extend the range to 0.
plt.ylim([0., 0.12])
plt.axhline(0.08, linestyle='--', color='k', linewidth=3, label='A priori noise expectation')
plt.legend(frameon=True)
WARNING: PossiblySlowWarning: This function (<function BaseSpectralCube.mad_std at 0x7f885d8ecee0>) requires loading the entire cube into memory and may therefore be slow. [spectral_cube.utils]
<matplotlib.legend.Legend at 0x7f885ca88100>
After sigma-clipping, the apparent spike has largely gone away, indicating that it was due to actual signal, not an increase in the noise level.
Exercise: An important note with sigma clipping is that choosing too low a threshold will cause erroneously low noise estimates. To demonstrate this, run the above cell after lowering the threshold to $<3\sigma$. What happens to the noise standard deviation in all spectral channels?
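One possible setup for this exercise (a sketch; choose your own threshold):
# Sketch of the exercise: an aggressive 1-sigma clip will also remove noise,
# biasing the estimated standard deviation low in every channel.
cube_sclip_low = cube.sigma_clip_spectrally(1)
mad_std_spectrum_low = cube_sclip_low.mad_std(axis=(1, 2))
plt.plot(mad_std_spectrum_low.spectral_axis.value, mad_std_spectrum_low.value, drawstyle='steps-mid')
plt.axhline(0.08, linestyle='--', color='k', label='A priori noise expectation')
plt.xlabel('Velocity (km/s)')
plt.ylabel(r'Noise standard deviation $\sigma$ (K)')
plt.legend(frameon=True)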
The above shows that we can treat the noise level as approximately constant in the spectral dimension. Because of this, we can estimate the noise level for each spatial pixel from its spectrum. Instead of the noise standard deviation spectrum, we will now calculate a spatial noise map using the sigma-clipped cube from above.
Note: If you lowered the $\sigma$ threshold above, be sure to restore it to $\sim3\sigma$ before continuing.
mad_std_map_sclip = cube_sclip.mad_std(axis=0) # Calculate sigma along the spectral dimension
mad_std_map_sclip.quicklook()
WARNING: PossiblySlowWarning: This function (<function BaseSpectralCube.mad_std at 0x7f885d8ecee0>) requires loading the entire cube into memory and may therefore be slow. [spectral_cube.utils]
This spatial map gives us a lot of information on where signal is located versus where the noise level is higher. Compared to the peak intensity map we started with, we see that the apparent bright emission in the north-east corner has $\sim5\times$ the noise level of the centre.
What if the noise in my cube varies spatially and spectrally?
This is a much harder case to deal with, for two reasons: (1) it is more computationally expensive, because we cannot reduce the problem to a single noise spectrum or map as we did above; (2) we have less data with which to compute the noise level for each pixel. To best estimate the noise, we would need to calculate an entire noise cube, and we would need to make some simplifying assumptions. For example, to have enough data to estimate the noise at each pixel, we would need to use a neighbourhood around that pixel spanning a few resolution elements, which assumes that the noise varies smoothly across the cube.
This case is beyond the current tutorial. An example of this calculation, however, is available in the PHANGS imaging pipeline (see Leroy+2021).
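To sketch the idea only (this is not from the tutorial, is slow, and assumes the noise varies smoothly over a few beams):
# Hypothetical sketch: build a noise cube by estimating a robust sigma in a
# 9x9 pixel neighbourhood around every pixel, channel by channel.
from astropy.stats import mad_std
def local_noise_map(channel, size=9):
    # Apply mad_std over a size x size window centred on each pixel;
    # ignore_nan skips values removed by the sigma clipping.
    return nd.generic_filter(channel, lambda v: mad_std(v, ignore_nan=True),
                             size=size, mode='nearest')
# Uncomment to compute the full noise cube (slow for large cubes):
# noise_cube = np.array([local_noise_map(chan) for chan in cube_sclip.filled_data[:].value])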
The above spatial map is our noise model for the cube. Now, we will use it to separate signal from noise in the cube.
In this example, we will use one of the most common signal identification techniques outlined in Rosolowsky & Leroy (2006) (amongst others).
This technique defines two initial masks:
- A low signal mask that includes more signal but is affected by spurious noise. Here we use $>3\sigma$.
- A high signal mask that includes less signal but is less affected by noise. Here we use $>6\sigma$.
The goal is to keep connected regions in the low signal mask that overlap the high signal mask, and to remove regions that appear only in the low signal mask, since these are likely just noise.
# Make a low and high mask
low_snr_mask = (cube > 3 * mad_std_map_sclip).include()
high_snr_mask = (cube > 6 * mad_std_map_sclip).include()
Here we have defined "inclusion" masks, meaning that pixels set to True are those we are interested in operating on. With spectral-cube's masks, the inclusion mask is returned as a boolean array using .include().
Next, we will label connected regions in low_snr_mask. Both low_snr_mask and high_snr_mask are boolean numpy arrays (the cube was read with use_dask=False). We define connectivity as 26-connected, meaning all edge and corner connections are included in 3D. The equivalent in 2D is 8-connected, with a structure element like:
[1, 1, 1]
[1, 1, 1]
[1, 1, 1]
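Equivalently, scipy can generate these structure elements directly (a brief aside; connectivity=3 in 3D includes all 26 neighbours):
# Full 26-connectivity in 3D is an all-True (3, 3, 3) element:
structure_26 = nd.generate_binary_structure(rank=3, connectivity=3)
print(np.all(structure_26 == np.ones((3, 3, 3), dtype=bool)))  # True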
In this example, we will use scipy.ndimage, which provides these morphological operations for numpy arrays. The dask-image package provides equivalent operations for dask arrays and is better suited to huge cubes that will not fit into memory; the dask version of this workflow is shown at the end of the tutorial. For small data cubes, the standard scipy routines may be faster.
*** Dask arrays -- what is compute? ***
In the dask_image version of this masking code (shown at the end of the tutorial), you will see places with an extra compute() call. Operations on dask arrays are delayed, meaning dask only builds a graph of the computation when a function is called. The operation is only actually computed when we call compute. A simple example is shown in the dask documentation. In that code, we need to call compute to find the number of labels, as this requires dask to complete the operation.
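As a minimal standalone illustration of delayed evaluation (assuming dask is installed):
# Nothing is computed when the graph is built; .compute() triggers the work.
import dask.array as da
x = da.ones((1000, 1000), chunks=(100, 100))
total = x.sum()         # a lazy dask result, not a number
print(total.compute())  # -> 1000000.0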
import scipy.ndimage as nd
structure = np.ones((3, 3, 3), dtype=bool)
low_snr_mask_labels, num_labels = nd.label(low_snr_mask,
structure=structure)
print(f"Initial number of regions found: {num_labels}")
Initial number of regions found: 336
Mask labels and indexing
In low_snr_mask_labels, regions outside the mask have a value of 0. This means that the first label is 1, continuing up to the number of labeled regions (num_labels printed above). However, python indexing starts at 0. When looping through the regions, we need to account for this +1 difference, and so in the code below you will see ranges and loops with a +1 offset applied (e.g., range(1, num_labels + 1)).
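A tiny demonstration of this numbering (illustration only):
# Background pixels are labeled 0; the two regions are labeled 1 and 2.
demo = np.array([[0, 1, 0, 1],
                 [0, 1, 0, 1]], dtype=bool)
demo_labels, n_demo = nd.label(demo)
print(demo_labels)  # [[0 1 0 2]
                    #  [0 1 0 2]]
print(n_demo)       # 2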
Many regions are initially included in the mask, but we only expect a few real regions of signal based on the peak intensity map from above.
Most of the regions are small, spurious regions due to noise. To remove these, we will apply two criteria:
- All regions in low_snr_mask must contain $\geq5$ pixels above $6\sigma$ (i.e., in the high_snr_mask). To check this, we calculate the sum of high_snr_mask within each region in low_snr_mask_labels.
- All regions in low_snr_mask must contain $\geq40$ pixels. Similarly, we calculate the sum of low_snr_mask within each region in low_snr_mask_labels.
Regions that do not satisfy these criteria are removed from the mask.
The exact pixel thresholds for each criterion are approximate and were determined by checking different values. A good rule-of-thumb is for regions in low_snr_mask to contain more pixels than the beam. $40$ pixels is approximately the number of pixels within the FWHM of the beam for these data, and so is the minimum number we expect for real signal within one spectral channel.
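As a rough consistency check on this rule-of-thumb (a sketch; it assumes the cube records a single beam):
# Approximate number of pixels per beam area from the beam and pixel scale.
from astropy.wcs.utils import proj_plane_pixel_area
pix_area = (proj_plane_pixel_area(cube.wcs.celestial) * u.deg**2).to(u.sr)
pixels_per_beam = (cube.beam.sr / pix_area).decompose().value
print(f"Pixels per beam: {pixels_per_beam:.0f}")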
# From the labels, count the number of pixels within each label.
num_pixels_in_low_snr_mask = nd.sum(low_snr_mask,
labels=low_snr_mask_labels,
index=range(1, num_labels + 1)) # +1 offset for mask labels
# Repeat for the high signal mask.
# NOTE: the high_snr_mask pixels are counted within the regions defined by
# low_snr_mask_labels, hence the repeated use of low_snr_mask_labels here.
num_pixels_in_high_snr_mask = nd.sum(high_snr_mask,
labels=low_snr_mask_labels,
index=range(1, num_labels + 1)) # +1 offset for mask labels
# Create a new empty mask to add the valid regions to
signal_mask = np.zeros_like(low_snr_mask)
low_min_pixels = 40
high_min_pixels = 5
for num, (high_pix_num, low_pix_num) in enumerate(zip(num_pixels_in_high_snr_mask, num_pixels_in_low_snr_mask)):
if high_pix_num >= high_min_pixels and low_pix_num >= low_min_pixels:
# Add regions that pass the criteria.
# NOTE: enumerate will start with 0, but the mask labels start at 1
# We apply a +1 offset to `num` to account for this.
signal_mask[low_snr_mask_labels == num + 1] = True
To find the final number of regions containing real signal, we will label the final signal_mask.
signal_mask_labels, num_labels = nd.label(signal_mask,
structure=structure)
print(f"Final number of regions found: {num_labels}")
Final number of regions found: 3
Nearly every region we initially found was likely spurious, and only 3 regions remain.
Before examining this new signal mask, we can apply an additional step to improve the recovery of faint emission near bright signal. Because we have imposed a $>3\sigma$ criterion in the low signal mask, some faint emission adjacent to the signal will be excluded, and we will underestimate properties like the integrated intensity.
One simple way to correct for this is to extend the signal mask immediately around our remaining regions. We can extend the mask by one pixel in each dimension using binary dilation, which superimposes a structure element around every pixel included in the mask. With scipy, we can use nd.binary_dilation (the dask-image equivalent is ndmorph.binary_dilation, used in the dask version below).
# Use a structure that will increase the mask size by 1 pixel in each direction.
# Because we are applying it to the 3D cube, we need its size to be (3, 3, 3):
# In the spatial dimension, expand by 1 pixel in each direction.
# The structure looks like:
# [1, 1, 1]
# [1, 1, 1]
# [1, 1, 1]
structure = np.ones((3, 3), dtype=bool)
# In the spectral dimension, only expand the original pixel along the spectral dimension.
# The structure looks like:
# [0, 0, 0]
# [0, 1, 0]
# [0, 0, 0]
structure_spec = np.zeros((3, 3), dtype=bool)
structure_spec[1, 1] = True
# Add 1 spectral element on each side of the spatial structure.
# The spectral axis is axis 0 of the cube, so stack along axis 0:
structure = np.stack([structure_spec, structure, structure_spec], axis=0)
signal_mask = nd.binary_dilation(signal_mask, structure=structure, iterations=1)
Masks can be applied to a SpectralCube using with_mask:
masked_cube = cube.with_mask(signal_mask)
This returns a new SpectralCube object with signal_mask applied. Note that the new SpectralCube object inherits from the original, so the data are not copied.
With our signal mask now applied, we will re-examine the peak intensity map that we started with:
peak_intensity_sigmask = masked_cube.max(axis=0)
peak_intensity_sigmask.quicklook()
WARNING: PossiblySlowWarning: This function (<function BaseSpectralCube.max at 0x7f885d8ed090>) requires loading the entire cube into memory and may therefore be slow. [spectral_cube.utils] /opt/hostedtoolcache/Python/3.10.14/x64/lib/python3.10/site-packages/spectral_cube/spectral_cube.py:439: RuntimeWarning: All-NaN slice encountered out = function(self._get_filled_data(fill=fill,
Here we see the 3 separate regions that we found to most likely be real signal in our data. Note especially that the regions with high noise towards the north-east were removed.
We can also examine the effect of the signal masking on individual spectra. The spectrum data with the mask applied can be accessed with spectrum.filled_data[:], which will return an astropy.Quantity with appropriate brightness units (in this case, K).
As an example, we can compare the centre pixel at (32, 32) with and without the signal mask applied:
centre_spectrum = cube[:, 32, 32]
centre_spectrum_sigmask = masked_cube[:, 32, 32]
plt.plot(centre_spectrum.spectral_axis.value,
centre_spectrum.filled_data[:].value,
drawstyle='steps-mid', label='Original')
plt.plot(centre_spectrum_sigmask.spectral_axis.value,
centre_spectrum_sigmask.filled_data[:].value, drawstyle='steps-mid',
linewidth=3, label='Masked', color='orange')
plt.legend(frameon=True)
plt.xlabel("Velocity (km/s)")
plt.ylabel('Brightness Temp. (K)')
Text(0, 0.5, 'Brightness Temp. (K)')
The signal mask appears to have successfully included most of the emission in the spectrum!
Calculating moment maps¶
Now that we have identified signal in the cube, we will calculate common properties and highlight places where the signal masking has an enormous effect.
Moment maps can roughly be thought of as describing a single Gaussian-shaped spectrum. For example, the spectrum above is roughly a Gaussian, with some noise added. A model describing the signal in the spectrum is: $$ S(v) = A \exp\left[-\frac{(v-v_0)^2}{2\sigma_v^2}\right], $$ which includes the amplitude $A$, centroid velocity $v_0$, and line width $\sigma_v$. And what we observe has some noise added, drawn from approximately a Gaussian distribution: $$ T(v) = S(v) + \mathcal{N}(0, \sigma_{\textrm{noise}}) $$
The first 3 moment orders are the most commonly used. We will describe these in depth below.
Integrated Intensity -- Moment 0¶
The most common product is the integrated intensity, or the zeroth moment. This is defined as the integral of $S(v)$, or equivalently the sum over the signal in the observed spectrum: $$ M_0 = \int_{\mathrm{line}} T(v)\,dv \approx \sum_{i\in\{\mathrm{line}\}} T(v_i)\,\delta v, $$ where $\delta v$ is the channel width in the cube (in this case $0.67$ km/s).
The integrated intensity unit in this case is K km/s.
masked_moment0 = masked_cube.moment0()
ax = plt.subplot(projection=masked_moment0.wcs)
im = ax.imshow(masked_moment0.value, origin='lower', cmap='inferno')
cbar = plt.colorbar(im)
cbar.set_label(f'Integrated Intensity ({masked_moment0.unit})')
ax.set_ylabel('Declination')
ax.set_xlabel('Right Ascension')
The emission is dominated by the central region. While it is a single connected region, we see two distinct sources: each is a giant molecular cloud (GMC).
Masking has less of an effect on the integrated intensity than on higher moments because the noise has a mean of zero. However, masking reduces the uncertainty on the integrated intensity.
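For reference (a standard estimate, not computed in this tutorial), with $N$ channels included in the mask and uniform noise $\sigma_{\textrm{noise}}$ per channel, the moment 0 uncertainty is approximately $\sigma_{M_0} \approx \sigma_{\textrm{noise}} \, \delta v \, \sqrt{N}$, so masking out noise-only channels directly lowers the uncertainty. A per-pixel sketch:
# Sketch: moment 0 uncertainty map from the noise map and the number of
# unmasked channels per pixel (assumes roughly uniform noise per spectrum).
dv = np.abs(np.diff(cube.spectral_axis))[0]      # channel width
nchan = masked_cube.mask.include().sum(axis=0)   # channels kept per pixel
moment0_err = mad_std_map_sclip * dv * np.sqrt(nchan)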
Centroid Velocity -- Moment 1¶
The first moment is the intensity-weighted average along the spectrum, or the centroid velocity:
$$ M_1 = \frac{\int_{\mathrm{line}} v T(v)\,dv}{\int_{\mathrm{line}} T(v)\,dv} \approx \frac{\sum_{i\in\{\mathrm{line}\}} v_i T(v_i)\,\delta v}{M_0}. $$
If the signal is a single Gaussian, this will be equivalent to $v_0$ in the absence of noise.
masked_moment1 = masked_cube.moment1()
ax = plt.subplot(projection=masked_moment1.wcs)
im = ax.imshow(masked_moment1.value, origin='lower', cmap='coolwarm')
cbar = plt.colorbar(im)
cbar.set_label(f'Centroid ({masked_moment1.unit})')
ax.set_ylabel('Declination')
ax.set_xlabel('Right Ascension')
/opt/hostedtoolcache/Python/3.10.14/x64/lib/python3.10/site-packages/spectral_cube/_moments.py:168: RuntimeWarning: invalid value encountered in divide return (np.nansum(data * pix_cen, axis=axis) /
We see that the two regions towards the bottom of the image are more blue-shifted than the region in the centre. The two GMCs in the central region (see above) both appear to have mild velocity gradients.
With increasing order of moments, masking becomes more important as noise has a larger effect. Below is the centroid map without the signal mask applied:
unmasked_moment1 = cube.moment1()
ax = plt.subplot(projection=unmasked_moment1.wcs)
im = ax.imshow(unmasked_moment1.value, origin='lower', cmap='coolwarm')
cbar = plt.colorbar(im)
cbar.set_label('Centroid (km/s)')
ax.set_ylabel('Declination')
ax.set_xlabel('Right Ascension')
Spectra dominated by noise lead to extremely large outliers!
Line width -- (Square root) Moment 2¶
The second moment measures the variance of the spectrum around the centroid, weighted by the intensity: $$ M_2 = \frac{\int_{\mathrm{line}} (v-v_0)^2 T(v)\,dv}{\int_{\mathrm{line}} T(v)\,dv} \approx \frac{\sum_{i\in\{\mathrm{line}\}} (v_i-M_1)^2 T(v_i)\,\delta v}{M_0}. $$
For a Gaussian spectrum, $M_2\approx\sigma_v^2$, and would be exact without noise.
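As a quick numerical check (a sketch with made-up parameters, not the tutorial data), the discrete sums recover the Gaussian parameters:
# Synthetic single-Gaussian spectrum with noise; all parameters hypothetical.
rng = np.random.default_rng(1)
dv = 0.67                        # channel width (km/s), as in this cube
v = np.arange(-30., 30., dv)     # velocity axis (km/s)
A, v0, sigma_v = 1.0, 2.0, 3.0   # amplitude (K), centroid, line width
T = A * np.exp(-(v - v0)**2 / (2 * sigma_v**2)) + rng.normal(0., 0.05, v.size)
M0 = np.sum(T * dv)                       # ~ A * sqrt(2 pi) * sigma_v
M1 = np.sum(v * T * dv) / M0              # ~ v0
M2 = np.sum((v - M1)**2 * T * dv) / M0    # ~ sigma_v**2
print(M0, M1, np.sqrt(M2))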
While moment 2 is often referred to as the line width, the line width is formally the square root of the second moment: $$ \sigma_v \approx \sqrt{M_2}. $$
In spectral-cube, these two quantities are labeled separately to avoid confusion. The second moment can be calculated with:
masked_moment2 = masked_cube.moment2()
WARNING: VarianceWarning: Note that the second moment returned will be a variance map. To get a linewidth map, use the SpectralCube.linewidth_fwhm() or SpectralCube.linewidth_sigma() methods instead. [spectral_cube.spectral_cube] /opt/hostedtoolcache/Python/3.10.14/x64/lib/python3.10/site-packages/spectral_cube/_moments.py:168: RuntimeWarning: invalid value encountered in divide return (np.nansum(data * pix_cen, axis=axis) / /opt/hostedtoolcache/Python/3.10.14/x64/lib/python3.10/site-packages/spectral_cube/_moments.py:178: RuntimeWarning: invalid value encountered in divide return (np.nansum(data * (pix_cen - mom1) ** order, axis=axis) /
As the warning message explains, the line width can be calculated with:
masked_linewidth = masked_cube.linewidth_sigma()
ax = plt.subplot(projection=masked_linewidth.wcs)
im = ax.imshow(masked_linewidth.value, origin='lower', cmap='coolwarm')
cbar = plt.colorbar(im)
cbar.set_label(f'Line Width ({masked_linewidth.unit})')
ax.set_ylabel('Declination')
ax.set_xlabel('Right Ascension')
We see that the brightest regions in the integrated intensity map correspond to the largest line widths. However, the edges of the mask likely contain fewer spectral channels, which can artificially narrow the line widths. Caution should be used when interpreting the line width where $\sim4$ or fewer channels are included in the mask.
Another common convention is to define the full-width-half-max line width: $$ \textrm{FWHM}=\sigma_v \, \sqrt{8 \, {\rm ln} (2)} \ \approx 2.35 \sigma_v $$
In spectral-cube, this can be calculated with:
masked_fwhm = masked_cube.linewidth_fwhm()
As with the centroid, the line width derived from the second moment is very susceptible to noise. For example, without including the signal mask, the line width map would be:
unmasked_linewidth = cube.linewidth_sigma()
ax = plt.subplot(projection=unmasked_linewidth.wcs)
im = ax.imshow(unmasked_linewidth.value, origin='lower', cmap='coolwarm')
cbar = plt.colorbar(im)
cbar.set_label(f'Line Width ({unmasked_linewidth.unit})')
ax.set_ylabel('Declination')
ax.set_xlabel('Right Ascension')
This is massively different from the masked version we have above. There are two key differences:
- As with the centroid, there are many more outliers due to the noise.
- Because $M_0$ is in the denominator, when it is negative due to noise, the "variance" becomes negative. When we take the square root to calculate the line width, the square root of a negative number becomes a NaN, hence the empty regions we see here.
Line widths are very susceptible to the noise. Estimates from the second moment are best used with a well-defined signal mask and high signal-to-noise ratios in the data.
Higher-order moments¶
Occasionally, higher-order moments are used; however, they typically require very high signal-to-noise spectra because each successively higher moment order is more susceptible to noise.
The general form for the Nth moment is: $$ M_n = \frac{\int_{\mathrm{line}} (v-v_0)^n T(v)\,dv}{\int_{\mathrm{line}} T(v)\,dv} \approx \frac{\sum_{i\in\{\mathrm{line}\}} (v_i-M_1)^n T(v_i)\,\delta v}{M_0} $$
$M_3$ is related to the skewness, which measures the asymmetry of the spectrum about $v_0$. $M_4$ is related to the kurtosis, which measures whether the tails of the spectrum are stronger or weaker than a Gaussian.
The Nth order moment can be computed with spectral-cube as:
n = 3
nth_moment = masked_cube.moment(order=n)
ax = plt.subplot(projection=nth_moment.wcs)
im = ax.imshow(nth_moment.value, origin='lower', cmap='coolwarm')
cbar = plt.colorbar(im)
cbar.set_label(f'Order {n} Moment (km/s)^{n}')
ax.set_ylabel('Declination')
ax.set_xlabel('Right Ascension')
/opt/hostedtoolcache/Python/3.10.14/x64/lib/python3.10/site-packages/spectral_cube/_moments.py:168: RuntimeWarning: invalid value encountered in divide return (np.nansum(data * pix_cen, axis=axis) / /opt/hostedtoolcache/Python/3.10.14/x64/lib/python3.10/site-packages/spectral_cube/_moments.py:178: RuntimeWarning: invalid value encountered in divide return (np.nansum(data * (pix_cen - mom1) ** order, axis=axis) /
This example data set is not well suited to exploring higher-order moments; the above is only a demonstration of how to compute them.
Spectra that are not single Gaussians¶
Moment calculations are often used because they are simple and quick to compute. However, when spectra are not well-modelled by a single Gaussian, the relation between the Gaussian parameters and what is measured from the spectrum breaks down, though moments can often remain useful as averaged properties of the spectrum. If the analysis requires a more precise estimate of these properties, a Gaussian or multi-Gaussian model fit may be appropriate instead. See the spectral-cube fitting tutorial for examples.
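As a pointer only, here is a minimal sketch (using astropy.modeling rather than the spectral-cube fitting interface) of fitting a single Gaussian to the masked centre spectrum from earlier:
# Sketch: single-Gaussian fit to the masked centre spectrum at (32, 32).
from astropy.modeling import models, fitting
vel = centre_spectrum_sigmask.spectral_axis.to(u.km / u.s).value
data = centre_spectrum_sigmask.filled_data[:].value
good = np.isfinite(data)  # drop masked (NaN) channels
g_init = models.Gaussian1D(amplitude=np.nanmax(data),
                           mean=vel[good][np.argmax(data[good])],
                           stddev=2.)
g_fit = fitting.LevMarLSQFitter()(g_init, vel[good], data[good])
print(g_fit.amplitude.value, g_fit.mean.value, g_fit.stddev.value)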
Other common and useful properties¶
Two other properties are often computed and used. We have already used one---the peak intensity---above. For completeness, the peak intensity is defined as: $$ T_{\mathrm{max}} = \mathrm{max}_{i\in\{\mathrm{line}\}} T(v_i). $$
This is simply the maximum over the spectral dimension.
masked_tpeak = masked_cube.max(axis=0)
ax = plt.subplot(projection=masked_tpeak.wcs)
im = ax.imshow(masked_tpeak.value, origin='lower', cmap='coolwarm')
cbar = plt.colorbar(im)
cbar.set_label(f'Peak Temperature ({masked_tpeak.unit})')
ax.set_ylabel('Declination')
ax.set_xlabel('Right Ascension')
WARNING: PossiblySlowWarning: This function (<function BaseSpectralCube.max at 0x7f885d8ed090>) requires loading the entire cube into memory and may therefore be slow. [spectral_cube.utils] /opt/hostedtoolcache/Python/3.10.14/x64/lib/python3.10/site-packages/spectral_cube/spectral_cube.py:439: RuntimeWarning: All-NaN slice encountered out = function(self._get_filled_data(fill=fill,
For absorption lines, min may be more useful instead.
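For example (a one-line sketch):
# For absorption spectra, take the minimum along the spectral axis instead:
min_intensity = cube.min(axis=0)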
Lastly, the velocity at peak intensity is another commonly used property. This is defined simply as: $$ v_{\mathrm{max}} = v_{i^{*}}, \quad i^{*} = \mathrm{argmax}_{i\in\{\mathrm{line}\}} T(v_i). $$ Again, in the case of a Gaussian spectrum, $v_{\mathrm{max}}=v_0$ in the absence of noise.
In spectral-cube, this can be calculated with:
masked_peakvelocity = masked_cube.argmax_world(axis=0)
ax = plt.subplot(projection=masked_peakvelocity.wcs)
im = ax.imshow(masked_peakvelocity.value, origin='lower', cmap='coolwarm')
cbar = plt.colorbar(im)
cbar.set_label(f'Velocity at peak temperature ({masked_peakvelocity.unit})')
ax.set_ylabel('Declination')
ax.set_xlabel('Right Ascension')
WARNING: PossiblySlowWarning: This function (<function BaseSpectralCube.argmax_world at 0x7f885d8ed7e0>) requires loading the entire cube into memory and may therefore be slow. [spectral_cube.utils] WARNING: PossiblySlowWarning: This function (<function BaseSpectralCube.argmax at 0x7f885d8ed3f0>) requires loading the entire cube into memory and may therefore be slow. [spectral_cube.utils]
This is similar to the centroid map $M_1$, but appears "blockier" because of the discrete steps between spectral channels. The range of velocities is quite similar, however.
Using dask¶
dask and dask-image enable operations on massive data cubes. Note that some routines will be slower than the in-memory scipy operations for smaller cubes, so we suggest using the dask-enabled routines only for larger-than-memory cubes.
To reproduce the above with dask routines, use the following:
from dask_image import ndmeasure
from dask_image import ndmorph
from dask import array as da
import warnings
# Uncomment to create a progress bar for all dask operations.
# Disabled here as it increases the run time significantly for this small cube.
# from dask.diagnostics import ProgressBar
# pbar = ProgressBar()
# pbar.register()
with warnings.catch_warnings():
warnings.simplefilter('ignore')
# Load cube
cube = SpectralCube.read(filename, format='fits', use_dask=True)
# Convert to km/s for the spectral unit
cube = cube.with_spectral_unit(u.km / u.s)
# Apply sigma clipping to estimate spatial noise variation
cube_sclip = cube.sigma_clip_spectrally(3)
mad_std_map_sclip = cube_sclip.mad_std(axis=0) # Calculate sigma along the spectral dimension
# Make a low and high SNR mask
low_snr_mask = (cube > 3 * mad_std_map_sclip).include()
high_snr_mask = (cube > 6 * mad_std_map_sclip).include()
# Find connected structures
structure = np.ones((3, 3, 3), dtype=bool)
low_snr_mask_labels, num_labels = ndmeasure.label(low_snr_mask,
structure=structure)
# Ask dask to execute the operation
num_labels = num_labels.compute()
print(f"Initial number of regions found: {num_labels}")
# From the labels, count the number of pixels within each label.
# Count how many >6 sigma pixels (high_snr_mask) are within regions defined in low_snr_mask_labels
num_pixels_in_high_snr_mask = ndmeasure.sum_labels(high_snr_mask,
label_image=low_snr_mask_labels,
index=range(1, num_labels + 1)) # +1 offset for mask labels
# Count how many >3 sigma pixels (low_snr_mask) are within regions defined in low_snr_mask_labels.
num_pixels_in_low_snr_mask = ndmeasure.sum_labels(low_snr_mask,
label_image=low_snr_mask_labels,
index=range(1, num_labels + 1)) # +1 offset for mask labels
# To preserve low_snr_mask, work on a copy as the signal mask and remove
# regions that do not pass the criteria.
signal_mask = low_snr_mask.copy()
# NOTE: this is memory efficient but may be slower than defining a new empty array and adding the
# (often fewer) number of regions that pass the minimum pixel criteria. See the scipy example
# above on using this alternative approach.
low_min_pixels = 40
high_min_pixels = 5
for num, (high_pix_num, low_pix_num) in enumerate(zip(num_pixels_in_high_snr_mask, num_pixels_in_low_snr_mask)):
if high_pix_num >= high_min_pixels and low_pix_num >= low_min_pixels:
# This region passes the criteria. Keep it in the mask.
continue
# Remove regions that do not pass the criteria.
# NOTE: enumerate will start with 0, but the mask labels start at 1
# We apply a +1 offset to `num` to account for this.
signal_mask[low_snr_mask_labels == num + 1] = False
# Label the final set of regions.
signal_mask_labels, num_labels = ndmeasure.label(signal_mask,
                                                 structure=structure)
num_labels = num_labels.compute()
print(f"Final number of regions found: {num_labels}")
# Dilate the signal mask.
# Use a structure that will increase the mask size by 1 pixel in each direction.
# Because we are applying it to the 3D cube, we need its size to be (3, 3, 3):
# In the spatial dimension, expand by 1 pixel in each direction.
# The structure looks like:
# [1, 1, 1]
# [1, 1, 1]
# [1, 1, 1]
structure = np.ones((3, 3), dtype=bool)
# In the spectral dimension, only expand the original pixel along the spectral dimension.
# The structure looks like:
# [0, 0, 0]
# [0, 1, 0]
# [0, 0, 0]
structure_spec = np.zeros((3, 3), dtype=bool)
structure_spec[1, 1] = True
# Add 1 spectral element on each side of the spatial structure.
# The spectral axis is axis 0 of the cube, so stack along axis 0:
structure = np.stack([structure_spec, structure, structure_spec], axis=0)
# Convert to a dask array
structure = da.from_array(structure)
signal_mask = ndmorph.binary_dilation(signal_mask, structure=structure, iterations=1)
# Now have dask compute all the mask operations.
signal_mask = signal_mask.compute()
masked_cube = cube.with_mask(signal_mask)
Initial number of regions found: 360
Final number of regions found: 3
The moment maps can now be computed using the same code as in the examples above.
masked_moment0_dask = masked_cube.moment0()
ax = plt.subplot(projection=masked_moment0_dask.wcs)
im = ax.imshow(masked_moment0_dask.value, origin='lower', cmap='inferno')
cbar = plt.colorbar(im)
cbar.set_label(f'Integrated Intensity ({masked_moment0_dask.unit})')
ax.set_ylabel('Declination')
ax.set_xlabel('Right Ascension')