ngEHT conversion guide

[1]:
import importlib
import os
import subprocess
import sys
from importlib.metadata import version

# Make sure XRADIO is importable, installing it on first use.
try:
    import xradio

    print("XRADIO version", version("xradio"), "already installed.")
except ImportError as e:
    print(e)
    print("Installing XRADIO")

    # Invoke pip through the interpreter running this kernel so the package
    # lands in the same environment the notebook imports from; a bare `pip`
    # on PATH may belong to a different Python. check_call raises
    # CalledProcessError if the install fails instead of silently continuing.
    subprocess.check_call([sys.executable, "-m", "pip", "install", "xradio"])

    # Make the import system re-scan for the newly installed package.
    importlib.invalidate_caches()

    import xradio

    print("XRADIO version", version("xradio"), "installed.")
XRADIO version 1.1.3 already installed.

Download dataset

The original FITS-IDI file is available from https://almascience.eso.org/almadata/ec/eht/2016.1.01114.V/group.uid___A001_X87c_X245.ec_jlgomez.e17a10-7-hi-oj287-3C279-fits.tgz

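The FITS-IDI file was imported into a Measurement Set, and two spectral-window channel ranges were selected and regridded to the LSRK frame, with the following CASA tasks:

importfitsidi('E17A10.0.bin0000.source0000.FITS',vis='E17A10.0.bin0000.source0000.ms')
mstransform(vis='E17A10.0.bin0000.source0000.ms',outputvis='ngEHT_E17A10.0.bin0000.source0000_split_lsrk.ms',spw='8:55~61,29:20~27', regridms=True,outframe='lsrk',datacolumn='all')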
[2]:
import toolviper

# Download the example Measurement Set used in the rest of this guide.
# Per the log output below, the download is skipped when the file already
# exists locally.
toolviper.utils.data.download(file="ngEHT_E17A10.0.bin0000.source0000_split.ms")
[2026-04-20 15:19:36,129]     INFO   toolviper:  Initializing download...
[2026-04-20 15:19:36,130]     INFO   toolviper:  File already exists: /Users/vdesouza/work/xradio/docs/source/measurement_set/guides/ngEHT_E17A10.0.bin0000.source0000_split.ms

Convert to Processing Set

[3]:
from xradio.measurement_set import convert_msv2_to_processing_set

# Input MSv2 and the Zarr store that the Processing Set is written to.
ms_file = "ngEHT_E17A10.0.bin0000.source0000_split.ms"
outfile = "ngEHT_E17A10.0.bin0000.source0000_split_lsrk.ps.zarr"

# Chunk sizes are given for the frequency and time dimensions only; the
# baseline and polarization dimensions are not listed and end up as a single
# chunk each (see the chunksize values in the DataTree output further down).
main_chunksize = dict(frequency=1, time=20)

# NOTE(review): parallel_mode="none" presumably runs the conversion serially
# and persistence_mode="w" presumably overwrites an existing store -- confirm
# against the xradio documentation.
convert_msv2_to_processing_set(
    in_file=ms_file,
    out_file=outfile,
    main_chunksize=main_chunksize,
    parallel_mode="none",
    persistence_mode="w",
)
[2026-04-20 15:19:36,642]     INFO   toolviper:  Updated partition scheme used: ['DATA_DESC_ID', 'OBSERVATION_ID']
[2026-04-20 15:19:36,643]     INFO   toolviper:  Number of partitions: 2
[2026-04-20 15:19:36,643]     INFO   toolviper:  OBSERVATION_ID [0], DDI [0], STATE [None], FIELD [0], SCAN [0], EPHEMERIS [None]
[2026-04-20 15:19:36,717]  WARNING   toolviper:  Source_id is -1. No source information will be included in the field_and_source_xds.
[2026-04-20 15:19:37,145]     INFO   toolviper:  OBSERVATION_ID [0], DDI [1], STATE [None], FIELD [0], SCAN [0], EPHEMERIS [None]
[2026-04-20 15:19:37,217]  WARNING   toolviper:  Source_id is -1. No source information will be included in the field_and_source_xds.

Processing Set

[4]:
from xradio.measurement_set import open_processing_set

# Open the store written by the conversion step and show a summary table
# with one row per Measurement Set in the Processing Set.
ps_xdt = open_processing_set(ps_store=outfile)
ps_xdt.xr_ps.summary()
[4]:
name scan_intents shape execution_block_UID polarization scan_name spw_name spw_intents field_name source_name line_name field_coords session_reference_UID scheduling_block_UID project_UID start_frequency end_frequency
0 ngEHT_E17A10.0.bin0000.source0000_split_0 [None] (2250, 20, 7, 4) --- [RR, RL, LR, LL] [0] spw_0 [UNSPECIFIED] [3C279_0] [Unknown] [] [fk5, 12h56m11.17s, -5d47m21.52s] --- --- E17A10 2.286593e+11 2.286623e+11
1 ngEHT_E17A10.0.bin0000.source0000_split_1 [None] (2250, 20, 8, 4) --- [RR, RL, LR, LL] [0] spw_1 [UNSPECIFIED] [3C279_0] [Unknown] [] [fk5, 12h56m11.17s, -5d47m21.52s] --- --- E17A10 2.298723e+11 2.298758e+11
[5]:
# Pick the first Measurement Set (spw_0 in the summary table) by its name and
# display its DataTree, including the antenna and field/source child groups.
ms_xdt = ps_xdt["ngEHT_E17A10.0.bin0000.source0000_split_0"]
ms_xdt
[5]:
<xarray.DataTree 'ngEHT_E17A10.0.bin0000.source0000_split_0'>
Group: /ngEHT_E17A10.0.bin0000.source0000_split_0
│   Dimensions:                     (time: 2250, baseline_id: 20, frequency: 7,
│                                    polarization: 4, uvw_label: 3)
│   Coordinates:
│     * time                        (time) float64 18kB 1.492e+09 ... 1.492e+09
│       field_name                  (time) <U27 243kB dask.array<chunksize=(2250,), meta=np.ndarray>
│       scan_name                   (time) <U21 189kB dask.array<chunksize=(2250,), meta=np.ndarray>
│     * baseline_id                 (baseline_id) int64 160B 0 1 2 3 ... 16 17 18 19
│       baseline_antenna1_name      (baseline_id) <U2 160B dask.array<chunksize=(20,), meta=np.ndarray>
│       baseline_antenna2_name      (baseline_id) <U2 160B dask.array<chunksize=(20,), meta=np.ndarray>
│     * frequency                   (frequency) float64 56B 2.287e+11 ... 2.287e+11
│     * polarization                (polarization) <U2 32B 'RR' 'RL' 'LR' 'LL'
│     * uvw_label                   (uvw_label) <U1 12B 'u' 'v' 'w'
│   Data variables:
│       EFFECTIVE_INTEGRATION_TIME  (time, baseline_id) float64 360kB dask.array<chunksize=(20, 20), meta=np.ndarray>
│       FLAG                        (time, baseline_id, frequency, polarization) bool 1MB dask.array<chunksize=(20, 20, 1, 4), meta=np.ndarray>
│       TIME_CENTROID               (time, baseline_id) float64 360kB dask.array<chunksize=(20, 20), meta=np.ndarray>
│       UVW                         (time, baseline_id, uvw_label) float64 1MB dask.array<chunksize=(20, 20, 3), meta=np.ndarray>
│       VISIBILITY                  (time, baseline_id, frequency, polarization) complex64 10MB dask.array<chunksize=(20, 20, 1, 4), meta=np.ndarray>
│       WEIGHT                      (time, baseline_id, frequency, polarization) float32 5MB dask.array<chunksize=(20, 20, 1, 4), meta=np.ndarray>
│   Attributes:
│       creation_date:     2026-04-20T21:19:36.659187+00:00
│       creator:           {'software_name': 'xradio', 'version': '1.1.3'}
│       data_groups:       {'base': {'correlated_data': 'VISIBILITY', 'date': '20...
│       observation_info:  {'observer': ['PLUTO'], 'observing_log': '[]', 'projec...
│       processor_info:    {'sub_type': '', 'type': ''}
│       schema_version:    4.0.0
│       type:              visibility
├── Group: /ngEHT_E17A10.0.bin0000.source0000_split_0/antenna_xds
│       Dimensions:                 (antenna_name: 6, cartesian_pos_label: 3,
│                                    receptor_label: 2)
│       Coordinates:
│         * antenna_name            (antenna_name) <U2 48B 'AA' 'AP' 'AZ' 'LM' 'PV' 'SP'
│           mount                   (antenna_name) <U16 384B dask.array<chunksize=(6,), meta=np.ndarray>
│           station_name            (antenna_name) <U2 48B dask.array<chunksize=(6,), meta=np.ndarray>
│           telescope_name          (antenna_name) <U4 96B dask.array<chunksize=(6,), meta=np.ndarray>
│         * cartesian_pos_label     (cartesian_pos_label) <U1 12B 'x' 'y' 'z'
│         * receptor_label          (receptor_label) <U5 40B 'pol_0' 'pol_1'
│           polarization_type       (antenna_name, receptor_label) <U1 48B dask.array<chunksize=(6, 2), meta=np.ndarray>
│       Data variables:
│           ANTENNA_DISH_DIAMETER   (antenna_name) float64 48B dask.array<chunksize=(6,), meta=np.ndarray>
│           ANTENNA_POSITION        (antenna_name, cartesian_pos_label) float64 144B dask.array<chunksize=(6, 3), meta=np.ndarray>
│           ANTENNA_RECEPTOR_ANGLE  (antenna_name, receptor_label) float64 96B dask.array<chunksize=(6, 2), meta=np.ndarray>
│       Attributes:
│           overall_telescope_name:  VLBA
│           relocatable_antennas:    False
│           type:                    antenna
└── Group: /ngEHT_E17A10.0.bin0000.source0000_split_0/field_and_source_base_xds
        Dimensions:                       (field_name: 1, sky_dir_label: 2)
        Coordinates:
          * field_name                    (field_name) <U27 108B '3C279_0'
            source_name                   (field_name) <U7 28B dask.array<chunksize=(1,), meta=np.ndarray>
          * sky_dir_label                 (sky_dir_label) <U3 24B 'ra' 'dec'
        Data variables:
            FIELD_PHASE_CENTER_DIRECTION  (field_name, sky_dir_label) float64 16B dask.array<chunksize=(1, 2), meta=np.ndarray>
        Attributes:
            type:     field_and_source
[6]:
# Load the dask-backed antenna arrays into memory so that the repr shows actual
# values (mount, station names, dish diameters, ...) instead of dask placeholders.
ms_xdt.antenna_xds.compute()
[6]:
<xarray.DataTree 'antenna_xds'>
Group: /
    Dimensions:                 (time: 2250, baseline_id: 20, frequency: 7,
                                 polarization: 4, uvw_label: 3, antenna_name: 6,
                                 cartesian_pos_label: 3, receptor_label: 2)
    Coordinates:
      * time                    (time) float64 18kB 1.492e+09 ... 1.492e+09
      * baseline_id             (baseline_id) int64 160B 0 1 2 3 4 ... 16 17 18 19
      * frequency               (frequency) float64 56B 2.287e+11 ... 2.287e+11
      * polarization            (polarization) <U2 32B 'RR' 'RL' 'LR' 'LL'
      * uvw_label               (uvw_label) <U1 12B 'u' 'v' 'w'
      * antenna_name            (antenna_name) <U2 48B 'AA' 'AP' 'AZ' 'LM' 'PV' 'SP'
        mount                   (antenna_name) <U16 384B 'ALT-AZ' ... 'ALT-AZ'
        station_name            (antenna_name) <U2 48B 'AA' 'AP' 'AZ' 'LM' 'PV' 'SP'
        telescope_name          (antenna_name) <U4 96B 'VLBA' 'VLBA' ... 'VLBA'
      * cartesian_pos_label     (cartesian_pos_label) <U1 12B 'x' 'y' 'z'
      * receptor_label          (receptor_label) <U5 40B 'pol_0' 'pol_1'
        polarization_type       (antenna_name, receptor_label) <U1 48B 'R' ... 'L'
    Data variables:
        ANTENNA_DISH_DIAMETER   (antenna_name) float64 48B 12.0 12.0 ... 30.0 10.0
        ANTENNA_POSITION        (antenna_name, cartesian_pos_label) float64 144B ...
        ANTENNA_RECEPTOR_ANGLE  (antenna_name, receptor_label) float64 96B 0.0 .....
    Attributes:
        overall_telescope_name:  VLBA
        relocatable_antennas:    False
        type:                    antenna
[7]:
# Fetch the field-and-source dataset of this Measurement Set through the
# xr_ms accessor; it holds the phase-center direction of the observed field.
ms_xdt.xr_ms.get_field_and_source_xds()
[7]:
<xarray.DatasetView> Size: 18kB
Dimensions:                       (field_name: 1, sky_dir_label: 2,
                                   baseline_id: 20, frequency: 7,
                                   polarization: 4, time: 2250, uvw_label: 3)
Coordinates:
  * field_name                    (field_name) <U27 108B '3C279_0'
    source_name                   (field_name) <U7 28B dask.array<chunksize=(1,), meta=np.ndarray>
  * sky_dir_label                 (sky_dir_label) <U3 24B 'ra' 'dec'
  * baseline_id                   (baseline_id) int64 160B 0 1 2 3 ... 17 18 19
  * frequency                     (frequency) float64 56B 2.287e+11 ... 2.287...
  * polarization                  (polarization) <U2 32B 'RR' 'RL' 'LR' 'LL'
  * time                          (time) float64 18kB 1.492e+09 ... 1.492e+09
  * uvw_label                     (uvw_label) <U1 12B 'u' 'v' 'w'
Data variables:
    FIELD_PHASE_CENTER_DIRECTION  (field_name, sky_dir_label) float64 16B dask.array<chunksize=(1, 2), meta=np.ndarray>
Attributes:
    type:     field_and_source
[8]:
# Plot the antenna positions of the Processing Set in 2D.
ps_xdt.xr_ps.plot_antenna_positions_2d()
../../_images/measurement_set_guides_ngEHT_12_0.png
[9]:
# Plot the field phase centers of the Processing Set.
ps_xdt.xr_ps.plot_phase_centers()
../../_images/measurement_set_guides_ngEHT_13_0.png