-
Notifications
You must be signed in to change notification settings - Fork 1
/
aartfaac_RT_calib_v1.tex~
1870 lines (1665 loc) · 115 KB
/
aartfaac_RT_calib_v1.tex~
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
% \documentclass[referee]{aa}
\documentclass{aa}
\usepackage[varg]{txfonts}
\usepackage{color}
\usepackage{graphicx}
%% \usepackage{subfig} %% For generating a grid of figures.
\usepackage{caption}
\usepackage{subcaption}
%% \usepackage{float}
%% \usepackage{epstopdf}
%% \newsavebox\mybox %% For generating figure captions which wrap at figure edges.
%% \newlength\myboxlen
%% \newcommand{\figcap}[2]
%% {%
%% \sbox\mybox{#1}
%% \settowidth{\myboxlen}{\usebox{\mybox}}
%% \centering
%% \usebox\mybox
%% \hskip \textwidth
%% \parbox{\myboxlen}{#2}
%% }
\usepackage{bm}
\bibpunct{(}{)}{;}{a}{}{,} % to follow the A&A style
%% From Wijnholds, for better figure placement
\renewcommand\floatpagefraction{1.0}
\renewcommand\topfraction{1.0}
\renewcommand\bottomfraction{1.0}
\renewcommand\textfraction{0.0}
\begin{document}
\title{Real-time calibration of the AARTFAAC array for transient detection}
\author{P. Prasad \inst{1,2}
\and S. J. Wijnholds \inst{3}
\and F. Huizinga \inst{4}
\and R.A.M.J Wijers \inst{5}}
\institute
{Anton Pannekoek Institute, University of Amsterdam,
Postbus 94249, 1090 GE Amsterdam, The Netherlands\email{[email protected]}
\and
ASTRON, The Netherlands Foundation for Radio Astronomy,
PO Box 2, 7990 AA Dwingeloo, The Netherlands\email{[email protected]}
\and
ASTRON, The Netherlands Foundation for Radio Astronomy,
PO Box 2, 7990 AA Dwingeloo, The Netherlands\email{[email protected]}
\and
Anton Pannekoek Institute, University of Amsterdam,
Postbus 94249, 1090 GE Amsterdam, The Netherlands \email{[email protected]}
\and
Anton Pannekoek Institute, University of Amsterdam,
Postbus 94249, 1090 GE Amsterdam, The Netherlands \email{[email protected]}
}
%\author{P. Prasad \inst{1,2} \email{[email protected]}
% \and S.J. Wijnholds \inst{2}
% \and F. Huizinga \inst{1}
% \and R.A.M.J Wijers \inst{1}}
% \institute
% {Anton Pannekoek Institute, University of Amsterdam,
% Postbus 94249, 1090 GE Amsterdam, The Netherlands \label{1}
%\and
% ASTRON, The Netherlands Foundation for Radio Astronomy,
% PO Box 2, 7990 AA Dwingeloo, The Netherlands \label{2}
%}
\date{Received <date> / Accepted <date>}
\abstract{ The search for transient phenomena at low radio frequencies is now
coming of age with the development of radio sky monitors with a large field of view, which are
made feasible by new developments in calibration algorithms and computing.
However, accurate calibration of such arrays is challenging, especially within
the latency requirements of near real-time transient monitors, and is the main
cause of limiting their sensitivities. This paper describes a strategy for
real-time, wide-field direction dependent calibration of the Amsterdam-ASTRON
Radio Transients Facility and Analysis Center (AARTFAAC) array, which is a
sensitive, continuously available all-sky monitor based on the Low Frequency
Array (LOFAR). The monitor operates in a zenith pointing, snapshot imaging
mode for image plane detection of bright radio transients. We show that a
tracking calibration approach with solution propagation satisfies our latency,
computing, and calibration accuracy constraints. We characterize the
instrument and verify the calibration strategy under a variety of observing
conditions. This brings out several phenomena which can bias the calibration.
The real-time nature of the application further imposes strict latency and
computational constraints. We find that although ionosphere induced phase
errors present a major impediment to accurate calibration, these can be
corrected in the direction of the brightest few sources to significantly
improve image quality. Our real-time calibration pipeline implementation
processes a single spectral channel of a snapshot observation in $\sim$ 0.2
seconds on test hardware, which is well within its latency budget. Autonomously
calibrating and imaging one second snapshots, our approach leads to a typical
image noise of $\sim$ 10 Jy for a $\sim$ 90 kHz channel, reaching dynamic
ranges of $\sim$ 2000:1. We also show that difference imaging allows thermal
noise limited transient detection, despite the instrument being confusion
noise limited.}
\keywords{Instrumentation:Interferometers - telescopes - atmospheric effects - methods: observational}
\maketitle
\section{\label{sec:Introduction}Introduction}
The detection and characterization of low frequency radio transients is a Key
Science Project \citep{fender2006lofar} for the Low Frequency Array (LOFAR)
\textbf{\citep{vanhaarlem2013lofar}} radio telescope. In this context, the
Amsterdam-ASTRON Radio Transients Facility and Analysis Center
(AARTFAAC) \footnote{see www.aartfaac.org } has initiated building an All-Sky
Monitor (ASM) to survey most of the locally visible sky for transients and
variable sources. The ASM will be an image plane transient detector at low
radio frequencies with images generated via aperture synthesis. It will carry
out continuous, autonomous and near real-time sky monitoring for detecting the
brightest ($\sim$tens of Jy) transients occurring at a variety of cadences
(seconds to minutes). Its main aim is the rapid detection of low frequency (LF)
transients and the production of their rough position estimates for immediate
follow up at high sensitivity and resolution with the full LOFAR telescope. With
its very wide field of view, low guaranteed latency of calibration and imaging,
it will enable true, real-time all-sky monitoring of the low-frequency radio
sky. The AARTFAAC would be the most sensitive of the coming breed of LF Radio
Sky Monitors. Table \ref{tab:AARTFAAC_specs} compares various wide-field
instruments with transient searches as an explicit goal.\\
The discoveries of transients are currently biased toward objects emitting at
higher energies in the X-ray or $\gamma$-ray regime, primarily due to the
success of various satellite based ASMs operating at those energy levels. At
radio frequencies, searches for transients have usually been limited to mining
archives \citep{bower2007submillijansky, bower2011search}, follow-up studies of
discovered transients \citep{chandra2012radio}, and a few dedicated observing
programs \citep{bannister2012limits, katz2003survey}. However, the dynamic
nature of the sky at low radio frequencies has not been studied in detail yet,
mostly due to the restricted fields of view, and the low availability of
existing instruments for carrying out dedicated searches for transients. This
is set to change with the advent of a number of sensitive, wide field of view
instruments at the lowest frequencies most notably the LOFAR, the Murchison
Widefield Array (MWA) \citep{lonsdale2009murchison} and the Long Wavelength
Array (LWA) \citep{ellingson2009long}.
These instruments should be sensitive to a variety of phenomena, including
Pulsar giant pulses, bright radio flares from brown dwarfs and active stars,
emission from OH masers, Jovian bursts, and, most importantly, an unknown
population of bright bursters. Recent serendipitous discoveries of short bursts
of bright radio emission with unknown origin, and at relatively low radio
frequencies \citep{lorimer2007bright, thornton2013population} have shown the
potential variety of sources that might fill the unnaturally empty discovery
phase space of LF radio transients. Thus, the development of wide field
monitors, like AARTFAAC, is timely and crucial for detecting and characterizing
such sources. The science case for the AARTFAAC is detailed in
\mbox{\citep{wijers2014aartfaac}}.
\begin{table*}[tbhp]
\caption{Specifications of contemporary radio transient detection machines.}
\label{tab:AARTFAAC_specs}
\center{%
\begin{tabular}{c c c c c}
\hline \hline
Parameter & AARTFAAC LBA & MWA & LWA1 & Comment\\
\hline
Array elements & 288 inverted V antennas & 128 tiles & 256 wiregrid bowtie & Dual polarized elements\\
Frequency range (MHz) & 30-80 & 80-300 & 10-88 & \\
Field of view (sr) & $\pi$ & 0.06$\pi$ & $\pi$ & FWHM of beam\\
%% Effective area ($m^{2})$ & 10 & 21 & 2.5 & per element\\
Total Effective area ($m^{2})$ & 2617\tablefootmark{a} & 2752\tablefootmark{b} & 1393\tablefootmark{c} & \\
%% $T_{sys}$($\nu^{-2.55}$K) & $\sim2000$ & $\sim350$ & $\sim1500$ & \\
$T_{sys}$($\nu^{-2.55}$K) & ~3600 & ~350 & ~2100 & \\
Angular resolution (arcmin) & ~60 & ~3 & ~120 & \\
Spectral resolution (kHz) & 16 & 40 & 75 & \\
Processed Bandwidth (MHz) & 13 & 30.72 & 0.075 & LWA: Narrow band Imaging \\
Temporal resolution (sec) & 1 & 8 & 5 & \\
%% Transient detection FoM $(m^2sr K^{-1})$ & 2.3 & 1.3 & 0.830 & Per unit BW and unit time \\ \hline
Transient detection FoM\tablefootmark{d} $(m^2sr K^{-1})$ & 2.28 & 1.48 & 2.08 & Per unit BW and unit time \\ \hline
\end{tabular}}
\tablefoot{The parameters are estimated at the highest sensitivity of each
instrument, viz. 60 MHz for AARTFAAC, 150 MHz for the MWA, and 74 MHz for the
LWA, which observes continuously only in its 'Narrow band' mode. The zenith
pointing $A_{eff}$ is quoted. The $T_{sys}$ ( assumed to be sky noise dominated)
is also evaluated at the same frequencies from \citep{bregman2000concept}.
\tablefoottext{a}{From \citep{wijnholds2011situ}.}
\tablefoottext{b}{From \citep{ellingsonLWA1}.}
\tablefoottext{c}{From \citep{tingay2013murchison}.}
\tablefoottext{d}{See Sec. \ref{sec:The-AARTFAAC-All} for FoM definition}.}
\end{table*}
\textbf{Transient detection approaches:} A variety of approaches exist for the
detection of transient phenomena, depending on factors like the luminosity
distribution, spatial distribution, and location of sources (primarily affecting
dispersion smearing and scatter broadening), their timescales of variation,
emission mechanism, and the spatial and temporal behavior of background
noise. These include beam formed observations, deep imaging (staring), rapid
shallow imaging (tiling) etc.
Traditionally, image domain transient detection has been considered suitable
only for incoherent sources of emission, whose timescales of transience are
slow and whose brightness temperatures are expected to be <$10^{12}$K.
Coherent sources of emission have usually been detected using timeseries
analysis of beamformed data, although imaging can provide a higher spatial
resolution and better discrimination due to the coherent collection of power
into a single pixel (compared to incoherent beamforming) and a wider
field of view (compared to coherent beamforming). This dichotomy is mostly due
to the timescales of coherent emission, which are expected to be short from
light travel time arguments and the fact that beamforming can provide high
temporal resolutions and sensitivities, although over a reduced field of view.
Another promising alternative for detecting short term transients is the
bispectrum method of \citet{law2012all}. This uses interferometric closure
quantities from triplets of time differenced visibilities, which makes it
independent of instrumental phase errors. However, for an array with a large
number of elements and low SNR per baseline, the methods' absolute sensitivity
is lower than that of an imaging array. It is also sensitive to residual flux
after the subtraction of constant emission from visibilities. This can arise
due to changes in the visibility fringe over the subtraction period and imposes
an upper limit on the duration of candidate transients.
The usually sparse UV coverage in snapshot observations from imaging arrays
result in low instantaneous sensitivities and image dynamic ranges, mandating
long integration. This makes them unsuitable for short duration transient
detection. Another contributor to the lack of imaging detectors at short
timescales has been the time consuming step of calibration and imaging. Recent
arrays are being constructed using a large number of small, low sensitivity
elements. These provide a perfect base for all-sky monitors due to their very
good instantaneous UV coverage, high collective sensitivity and wide fields of
view. The challenge of real-time calibration and imaging from these instruments
is becoming feasible due to developments in high-speed calibration algorithms and
advances in computing resources. Thus, image plane detection of short
duration bright transients is now feasible. Further, for transients with an
isotropic spatial distribution, unknown duration, and luminosity distributions, a
tiling strategy of shallow but rapid observations would result in a larger
number of discovered transients \citep {nemiroff2003tile}. Imaging all-sky
monitors are hence matched for this application.
\textbf{Brief overview of main results:} A multisource, model sky based
self-calibration scheme has been found adequate for calibration of the full
field of view of the AARTFAAC array. Due to the received source power being
dominated by a few, very bright sources and the coarse array resolution,
a low-complexity point source sky model is adequate for calibration.
Observational constraints, especially due to the ionosphere, require the
calibration to be carried out in close to real-time for achieving the necessary
high imaging dynamic range. We have developed a calibration scheme capable of
handling rapid, direction dependent variations of system parameters, which
results in achieving close to thermal noise limited imaging. This is
demonstrated using test data taken under a variety of observational conditions.
The scheme has been incorporated into a calibration and imaging pipeline, and an
optimized implementation of the algorithm allows the instrument to carry out
near real-time calibration and imaging with high dynamic ranges of ~2000:1. To
verify that the proposed calibration scheme allows thermal noise limited
transient detection, we have analyzed the difference between consecutive
snapshot images for which the systematic confusion noise is expected to cancel
out. This analysis shows the expected reduction in noise being consistent with a
thermal noise limited observation. The achieved noise limit of difference images
is found to be ~2-3 Jy over tens of seconds.
This paper is organized as follows. We begin by describing the AARTFAAC array
and its suitability as a transient search machine in Section
\ref{sec:The-AARTFAAC-All}. We lay out the problem of wide-field calibration in
the context of transient detection in Section \ref{sec:Array-calibration-for}
while describing the approaches taken by similar instruments. We then give a
detailed description of our approach to calibration in Section
\ref{sec:An-Optimal,-tracking}, especially in the context of autonomous
operation. Section \ref{sec:Performance-of-tracking} presents the observed
performance of the calibration approach on commissioning data, while Section
\ref{sec:Computational-performance} elaborates on the computational performance
of our strategy. Section \ref{sec:Challenges-to-tracking} elaborates on some of
the challenges faced by the AARTFAAC ASM under real observing conditions after
which we present our conclusions. \textbf {The results presented in this paper
have been obtained on test observations carried out by using existing LOFAR
system infrastructure, while the AARTFAAC
Uniboard \footnote{http://www.radionet-eu.org/uniboard} based piggyback
recording system was being built.}
\section{\label{sec:The-AARTFAAC-All}The AARTFAAC All Sky Monitor System
overview}
\begin{figure*}[htbp]
\centering
\includegraphics[width=1\textwidth]{Figs/AFAAC_blkdia_latest.png}
\caption{AARTFAAC calibration and imaging pipeline within the full all-sky
monitor flow and leading onto the transient detection pipeline (TraP).}
\label{fig:The-AARTFAAC-calibration}
\end{figure*}
The AARTFAAC all-sky monitor is an aperture array of 288 sky-noise limited dual
polarized antennas (the Low Band Antenna or LBA), which are shared with the
LOFAR telescope. These operate between 30 and 80 MHz. They are organized as
six stations spread over $\sim$$300$ m, with each being a random array of 48
antennas which, can be spatially organized in one of a limited number of
configurations. The array shares its analog elements with the LOFAR telescope,
which thus controls the station subarray configuration. The received analog
signal after basic analog conditioning is baseband sampled at 200 MHz with a
12-bit quantization. All dipoles are sampled with a single clock, eliminating
differential delay errors between antennas due to such errors as clock
misalignment or drift. A hardware digital polyphase filter bank splits the
$\sim$$100$ MHz sampled band into $\sim$$192$kHz subbands. An 8-bit complex
representation of the subband timeseries has been found to be adequate to
maintain linearity in the presence of local RFI. A coupled data path routes a
configurable subset of subbands to the
Uniboard \footnote{http://www.radionet-eu.org/uniboard} based hardware FX
correlator. This makes the AARTFAAC a continuously available instrument,
independent of ongoing LOFAR observations. No delay compensation (apart from
the fixed cable delays) is carried out between antennas, resulting in a zenith
pointing PSF. The estimation of the resulting $\sim$$1.6e5$ instantaneous
visibilities makes this correlator the largest in the world in terms of
processed input streams. The I/O restrictions put an input limit of $\sim$$66$
subbands ($\sim$$13$ MHz) to the correlator, which produces visibilities at $16$
kHz and one second resolution. Note that the LOFAR also has a High Band Antenna
(HBA) component operating between 110 and 240 MHz with each element being a 4x4
tile equipped with an analog beamformer. This implies that data is available to
the AARTFAAC during HBA observations, which are mutually exclusive to LBA
observations. However, due to the limited field of view of $\sim$$20$ sq. deg,
and the arbitrary pointing of the analog beam of this system, its use is not
discussed further in this paper.
Table \ref{tab:AARTFAAC_specs} lists the current specifications of the
instrument and compares it with other low frequency wide field instruments with
transient detection as an explicit goal. Figure
\ref{fig:The-AARTFAAC-calibration} shows the functional components of the
AARTFAAC monitor with details of the near real-time transient detection
pipeline. The calibration component of the pipeline is the subject of this
paper.
\subsection{\label{sub:AARTFAAC-for-Transient}AARTFAAC for transient searches}
Temporally pulsed emission from a transient source interacts with an ionized
intervening medium and is distorted due to dispersion and scattering. These
effects can be parameterized by the medium's dispersion measure, the integrated
electron density along the line of sight (DM,$pc/cm^{-3}$). The DM is also used
as a proxy for distance. Dispersion causes an arrival time delay of the pulse at
different frequencies and leads to pulse broadening if the signal is not
dedispersed before spectral integration. However, this broadening can be
completely corrected if the DM of the source is known. Scattering is caused by
electron density fluctuations along the line of sight and leads to pulse
broadening due to arrival of delayed pulses via multiple paths. This effect,
however, cannot be corrected. Both effects are enhanced at large DMs and low
frequencies and can limit the detection of pulses, instead of the limitation
coming from the inherent luminosity and distance of the sources.
Since pulse attenuation is proportional to broadening, transient detectors
routinely increase the pulse detection sensitivity by carrying out trial DM
searches. However, the AARTFAAC does not carry out de-dispersion before
imaging. Thus, given a sensitivity threshold and a temporal resolution of
$\sim$0.1 to 1 second of the AARTFAAC, the transient sensitivity achieved via
dispersed spectral collapse limits the DM range of a detectable source, while
scatter broadening limits the DM range irrespective of spectral collapse.
An empirical relationship between the scatter broadening time due to the
interstellar medium and the DM has been derived by
\citet{bhat2004multifrequency}. This implies a DM upper limit of $\sim$100 at 60
MHz when lines of sight are within the Galaxy and when scatter broadening is
restricted to 1 second.
The temporal pulse broadening in microseconds over a bandwidth $\Delta\nu$ MHz
at $\nu$ GHz for a dispersion of DM units is given by Eq. \ref{eq:dm_broad}.
\begin{equation}
\Delta t_{DM}=8.3\,DM\,\Delta\nu_{MHz}\,\nu_{GHz}^{-3}\, \mu sec\label{eq:dm_broad}
\end{equation}
Imaging at the highest available spectral resolution of 16 kHz and restricting
dispersion broadening to within 1 second at the same time allows detection of a
source with a DM of up to $\sim$1600. This allows probing along any galactic
line of sight \citep{cordes2002ne2001}, although at a sensitivity a factor that
is $\sim$28 poorer than that with the full 13 MHz band.
%% Assuming all subbands are chosen to be contiguous around the peak instrumental
%% sensitivity while the dispersion broadening is limited to 1 second, the 13 MHz
%% continuum sensitivity of the AARTFAAC would limit detection of transients with
%% DMs of only a few. However, restricting dispersion smearing to \mbox{<1} second
%% under the upper limit of DM 100 imposed by scattering would allow a higher
%% spectral integration, before the sum of the two broadening processes exceed the
%% imaging cadence.
\textbf{The AARTFAAC imager does not carry out DM measure searches via
de-dispersion on trial DMs. Thus, attempts to increase the transient
detection sensitivity of AARTFAAC by spectral integration over its full 13 MHz
band would lead to a lowered detected SNR for any pulses with DMs greater
than a few. This is because dispersion broadening would spread the pulse
beyond the 1 second imaging cadence, restricting the transient search spatial
radius. However, as stated above, scattering along Galactic lines of sight
broadens pulses with DM ~100 to beyond 1 second. Thus, some level of spectral
integration can be afforded by this limit before scattering, and dispersion
broadens the pulse beyond the AARTFAAC cadence.} Finally, as shown by
\citet{hassall2013detecting}, de-dispersion is not beneficial for highly
scattered sources. The scatter broadening of the pulse increases more rapidly
with DM than the dispersive delay. At high DMs, this makes the inherent pulse
width (due to scatter broadening)larger than the dispersion broadening. This
would allow the AARTFAAC to probe the high DM domain with full spectral
sensitivity.
The ability to spread subbands over the full analog bandwidth allows us to
search for ultra steep spectrum sources and can aid in distinguishing between
terrestrial and celestial transient sources. The large spectral baseline also
help in carrying out image-based dedispersion in the future for enhancing the
transient detection sensitivity of AARTFAAC.
A figure of merit for transient detection \citep{cordes2004dynamic} from a
telescope is $A\Omega\left(\frac{T}{\Delta t}\right)$ and can be used for
comparison between instruments. Here, A is the total collecting area; $\Omega$
is the solid angle coverage; T is the total duration of observation; and $\Delta
t$ is the time resolution. Due to the limited duration of fast transients, it is
relevant to add an instantaneous sensitivity parameter to the figure of merit,
as represented by the system temperature $T_{sys}$. Large bandwidths increase
transient sensitivity only if de-dispersion with the correct DM value is carried
out. Since this requires a computationally expensive DM space search, we
consider a narrow band figure of merit. Assuming continuous availability and the
simultaneous imaging of the entire field of view, a per second figure of merit
is $A\Omega/T_{sys}$. Among currently planned ASMs, the AARTFAAC's FoM is
comparable to the LWA, which has similar field of view (see Table
\ref{tab:AARTFAAC_specs}). However, the AARTFAAC's higher spectral and temporal
resolution, as well as its larger processed bandwidth would give it a higher
sensitivity toward scatter broadened transients, as elaborated in Section
\ref{sub:AARTFAAC-for-Transient}.
\citet{backer1999pers} has shown that the signal-to-noise ratio achieved in a
continuous wide-field search scales with the array filling factor $f$ as
$\sqrt{f}$. Thus, the highly sampled aperture of the AARTFAAC dense array would
be an advantage for our application. The resulting zenith pointing PSF is stable
and repeatable in time. At its peak sensitivity at $\sim$$58$ MHz, the PSF has
high roll-off, low side lobes $\sim$$15$ dB below peak with a resolution of
$\sim$$0.8$ sq. deg. \textbf{Assuming the confusion limit to be reached with
the presence of one source per ten PSFs and the source counts from
\citet{bregman2012system}, results in a classical confusion noise of
$\sim$$10$ Jy.} The large number of antennas also make the AARTFAAC a very
sensitive instrument with a combined $A_{eff}/T_{sys}$ of $\sim$0.7 $m^{2}/K$
\citep{wijnholds2011situ} and an instantaneous thermal noise of $\sim$8 Jy for
the standard imaging mode of 1sec/16 kHz. This implies that the sensitivity of
typical snapshot images are limited by confusion noise and not thermal noise.
The array is 2-D to high accuracy ($\sim$1.4 cm rms in the z-axis); thus,
imaging the zenith region can be done via a simple \mbox{2-D} Fourier
transformation of the calibrated visibilities. Lines of sight away from the
phase center (the zenith) have a neglected phase term due to the w-component of
the observed visibilities. However, the co-planarity of the array results in
the spatial coherence sampling function that is confined to a plane passing
through the origin, keeping the 2-D relationship between the visibility and
imaging domains \citep{cornwell1992radio}. Thus, wide-field imaging is
simplified as no 3-D transforms or their approximations like W-projection
\textbf{\citep{cornwell2008noncoplanar}} are required. Simple faceting recovers
off-axis lines of sight with high fidelity, making latency bound imaging
feasible. The requirement of snapshot imaging implies that the sky observed by
every baseline remains constant within a visibility set, thus making the
calibration parameters amenable to estimation by self calibration. Since all
dipoles are physically aligned parallel to each other, the instrumental
polarization can be determined via a bi-scalar polarization calibration, and
corrections can be applied in the image domain.
Dedicated hardware is used to achieve low latencies of transient detection.
These include a hardware correlator based on the Uniboards for estimating the
visibilities in real-time, and a software solution running on general purpose
hardware for the calibration, imaging, and transient detection pipelines. Thus,
the AARTFAAC array is well suited for its role as an all-sky monitor.
\section{\label{sec:Array-calibration-for}All-Sky calibration}
Calibrating a radio array telescope entails estimating the instrumental and
(possibly environmental) contribution to observed visibilities. These can be
parameterized partially by per antenna complex gains and noise. Observations of
sources with accurate models allow the estimation of these parameters and can
enhance the sensitivity of the instrument substantially
\citep{taylor1999synthesis}. An advantage of all-sky instruments is the
availability of enough bright sources within the beam for in-beam calibration,
making dedicated observations of calibrator sources unnecessary.
Calibration of the full field of view (i.e. beyond the half power beam width)
is usually necessary for accurate estimation of the flux contributed by bright
sources to any pointing of the synthesized beam via its far sidelobes, aiding in
their accurate deconvolution. A wide-field image plane transient detector
typically searches image timeseries for transients by extracting and analyzing
light curves of existing sources, or by detecting new sources referenced to a
database of lightcurves. The Transient Detection pipeline (TraP)
\citep{swinbank2014trap} component of the AARTFAAC ASM carries out source
extraction from individual time slices via thresholding and fitting \mbox{2D}
Gaussian models to regions of emission. Hence, high point-source sensitivity
and accurate flux recovery across the full field of view is a fundamental
requirement of calibration for transient searches, while a slight error in
source positions can be tolerated by the pipeline via spatial source
association. The flux estimation of any source via imaging directly depends on
the flux calibration of the instantaneous visibilities, which in turn depends on
a proper division of the uncalibrated flux on a visibility between element gain,
system noise, and source flux. Due to the dominance of emission from our own
Galaxy on system temperatures, the system noise can vary by almost $40\%$,
depending on the pointing of the array. Thus, system gain and temperature need
to be continuously estimated via calibration.
An important requirement for real-time transient detection is a hard deadline on
calibration time and a limited computational budget in view of the large number
of parameters to be estimated. These dictate quick and timebound convergence of
the calibration parameter estimators. Further, the streaming nature of the
application and the large number of visibilities makes their buffering or
multiple passes of processing unfeasible.
Finally, the calibration should be robust against sources of terrestrial
transients due to, for example, Radio Frequency Interference (RFI), which can
cause the algorithm to converge to a sub-optimal solution. However, the most
dominant of these effects is due to the ionosphere, which is discussed next.
\begin{figure*}[tbh]
\centering
\includegraphics[width=0.7\textwidth]{Figs/Fig2_blkdiag.png}
\caption{Block diagram depicting the snapshot
iterative calibration control flow in the AARTFAAC optimal calibration
scheme. }
\label{fig:Block-diagram-depicting}
\end{figure*}
\subsection{\label{sub:All-Sky-cal-iono}Ionospheric effects}
The antenna complex gain has contributions primarily from the gains of the
electronics, receiver characteristics, and telescope geometry. These usually vary
slowly ($\sim$hours), are direction independent effects (DIEs), and are estimated
via observation of calibration sources or using self-calibration. At low
frequencies, the disturbed ionosphere can act as a phase screen with temporally
and spatially varying refractive and diffractive effects. Ionization of the
ionosphere during the day by the Solar wind and photoionization is balanced by
recombination during the night. These can cause bulk variations
$\left(\sim10x\right)$ in large scale Total Electron Content (TEC) with slow
temporal variations, as well as fluctuations on relatively small temporal and
spatial scales ($\sim0.1\%$ variations over a few kilometers and over tens of
secs). If the rapid TEC fluctuation sets up an instantaneous spatial phase
gradient across the array in the direction of a source, an apparent position
shift of the source is seen. However, if the phase structure function varies
from a gradient, a deformation of the source structure may result due to
defocusing, resulting in a reduction of the recovered source peak flux.
Since the arrival time delay per antenna depends on the TEC along the line of
sight to the source, these are termed direction dependent effects (DDEs). A
phase correction varying over the field of view then needs to be applied, and a
single phase correction per antenna (as obtained by traditional self
calibration) is insufficient. Uncalibrated phase errors cause scattering of
source power into sidelobes, affecting the reliability of the extracted
lightcurves. Further, a change in the apparent source shape leads to an increase
in residual sidelobes after deconvolution, as the mean source model deviates
from the apparent instantaneous sky, and the source subtraction is
incomplete. These residual sidelobes increase the background noise level and
can introduce spurious structure into the image.
During DDE parameter estimation, we make the simplification that the effects are
identical for all antennas. This is a reasonable assumption for a compact
array, whose size projected to ionospheric heights are expected to be smaller
than the typical isoplanatic patch. Thus, identical lines of sight from
individual antennas are expected to traverse an ionospheric patch with the same
refractive properties. The estimation of a complex gain in the direction of each
source is required, but this can be assumed to be identical for all
antennas. Thus, a multisource, model-based calibration approach is appropriate
for the calibration of wide-field, compact arrays
\citep{wijnholds2010calibration}.
Although instrumental parameters are expected to vary on longer timescales
(hours to days for LOFAR), their precise calibration also mandates temporal
oversampling. If uncorrected, these effects can raise the image noise floor and
contribute to variations in the recovered flux of sources, leading to false
positives. Thus, real-time calibration of both DIEs and DDEs is necessary for
maximizing transient detection sensitivity of autonomously operating, near
real-time instruments.
\subsection{Current approaches to all-sky calibration}
Typical calibration schemes, such as those implemented in the CASA package,
address a different problem than what is applicable to the AARTFAAC due to the
restricted field of view, much longer baselines, and an order of magnitude fewer
stations in typical arrays. \textbf{Their algorithms are further complicated by
the need to compensate for higher order effects like the temporal variation of
the primary beam during long synthesis due to changing array geometry, or the
beam rotation of altaz mounts, etc., which are moot in our application.}
Snapshot, zenith pointing imaging from a co-planar array simplifies the
calibration and imaging from the ASM to a certain extent.
A successful approach to wide-field calibration is the Peeling algorithm
\citep{noordam2004peel,vdTol2007selfcallofar}, in which self-calibration toward
sources within the field of view is carried out in decreasing order of their
brightnes, with removal of the brightest remaining source's calibrated
contribution to all visibilities. This source is selected via rephasing the
array to its direction, and the contribution of other sources is attenuated by
averaging over their unphased visibility contribution (fringe washing). Thus, a
single source calibration approach is adequate, and a least squares estimation
of the antenna gains in the direction of the source can be carried out using one
of several methods \citep{boonstra2003gain}. The solution yields a set of
time-variable, antenna-based phase corrections per source, and a source model.
However, the algorithm requires the storage of the estimated visibilities with
multiple calibration and imaging passes through the data before the iterative
peeling can be concluded and calibrated images produced. This, along with the
increased computational load, makes it unsuitable for real-time operation. Other
contemporary instruments with similar specifications and goals like ours use
mostly Peeling based approaches.
The MWA \citep{lonsdale2009murchison}, located in Western Australia, has
developed an algorithm for carrying out real-time, full polarization direction-
dependent calibration of snapshots of $\sim$8 seconds via a Peeling mechanism
\citep{mitchell2008real}. They use the sequential deconvolution of several
bright sources in decreasing order of apparent flux to iteratively fit
apparent angular offsets induced by ionospheric phase shifts and antenna gains
toward these sources. This is suitable for the much reduced field of view of
the MWA as compared to the AARTFAAC, allowing them to fit a ``rubber sheet''
model of the ionosphere over their field of view. The main departure of our
approach to theirs is in the estimation of image wander and the deconvolution
of sources affected by the ionosphere. The sequential nature of peeling ensures
that the sidelobe contamination of the brighter source does not affect the flux
measurement of the weaker source and hence, its deconvolution. In our case, the
apparent fluxes of the brightest sources are simultaneously estimated, and their
effects subtracted together. This is efficient computationally and is
aided by the filled nature of the AARTFAAC UV plane, which results in low
sidelobe contamination. Further, the ionospheric effect is estimated by fitting
a phase ramp across the available bandwidth in the MWA, which requires
synchronization between the spectrally separated calibration threads. Our
estimation uses a Direction of Arrival (DoA) algorithm independently for each
spectral channel, and does not require large bandwidths for fitting phase ramps.
This allows a loosely coupled parallel architecture for our implementation. The
AARTFAAC calibration has a stricter latency bound, and its lowered sensitivity
and better PSF reduce the benefits of an iterative deconvolution.
The LWA \citep{ellingsonLWA1} is co-located with the VLA in New Mexico
(USA). Along with forming beams in real-time (its primary mode of operation), it
can also operate in an 'All-sky' mode for a single tuning of 70 kHz. The
calibration of antenna phases utilizes the method of fringe rate filtering using
narrow band data to localize one of multiple point source calibrators within the
field of view. Here, the time-varying phases of visibilities due to contribution
by discrete sources is converted into a fringe rate spectrum by taking a Fourier
transform of the correlation, where the sources are apparent as localized
components. The fringe of the brightest source is filtered, and antenna delays
extracted by fitting a model of the presumed delay response to the measured
phase response. Such an approach provides a phase calibration solution in the
unique direction of the brightest source. However, fitting a fringe requires an
extended period of time to generate the fit baseline, which is not suitable for
our streaming, real-time application. Further, given the calibration approach,
the presence of a disturbed ionosphere would add a random noise on the parameter
estimates, while any bias due to ionospheric systematics would probably be
averaged out over the time period over which the fringe is fitted. This could
lead to a bias in the snapshot calibrated visibilities.
Field-based calibration \citep{cottona2004beyond} is another technique for
direction dependent ionospheric phase calibration, and was developed for the VLA
74 MHz observations. Over a time interval of 1-2 minutes, it measures and
converts the apparent position shifts of 5-10 detectable bright sources within
the field of view into ionospheric phase gradients over the array. Subsequently,
an independent phase screen (based on a 5-term basis of Zernike polynomials) is
fitted onto the observations, and is used to predict phase gradients in
arbitrary viewing directions to image the full field of view. Such a technique
is applicable to a limited field of view of a high sensitivity system, which
implies the presence of bright sources close enough to interpolate the phases
attributed to the ionosphere. The AARTFAAC wide field of view and lower
sensitivity preclude the interpolation between the widely spaced phase
calibrator sources. This implies that sources in locations intermediate to
model sources may be affected by ionospheric amplitude and position variations,
which result in the presence of structured variations in a lightcurve for such
sources. % , as can be seen in Figure \ref{fig:Light-curves-of}.
\section{\label{sec:An-Optimal,-tracking}An Optimal tracking calibration
scheme for transient detection}
Here, we present our approach for latency bound, precise calibration of the
AARTFAAC with a low computational footprint. We use a model-sky based,
multi-source self calibration approach \citep{wijnholds2009multisource}.
Calibration of an array of identical, wide-field antennas entails deriving the
direction dependent response of every antenna, each of which is excited by
multiple, simultaneously present calibration sources. The system noise
contribution is also estimated, and subtracted while calibrating the
visibilities.\\ \textbf{Algorithmic Summary:} As seen in Figure
\ref{fig:Block-diagram-depicting}, the calibration of the system for each
incoming time and frequency slice is carried out iteratively in two parts: a
Major cycle which carries out calibration of direction dependent effects, and a
Minor cycle which carries out calibration of direction independent effects.
\begin {enumerate}
\item {The input to the algorithm is a running timeseries of measured spatial
correlations between all antennas (visibilities organized into an Array
Covariance Matrix (ACM)) for a given time and frequency slice, and the
corresponding instantaneous sky-model.}
\item {The Minor cycle within each Major cycle iteratively estimates the complex
gains of all antennas using the StEFCal
\citep{salvini2014stef,salvini2014stefursi} algorithm. This is done by
iteratively fitting a parameterized model to the observed visibilities, with
the model itself being generated by the encompassing Major cycle.}
\item {The Major cycle then estimates the direction dependent effects (modeled
via the apparent flux and positions of model sources) and system noise using
the latest antenna gains, and updates the model with these higher accuracy
parameters.}
\item {The time axis is used to feed forward parameter estimates as an initial
guess for the next timeslice, leading to faster convergence.}
\item {The frequency axis is compensated for the known spectral response of the
dipoles during bandpass calibration, allowing spectral averaging of the
calibrated visibilities. Finally, an appropriate flux scale is provided by
scaling the recovered flux of a few model sources to their actual, known
fluxes.}
\end{enumerate}
In the following, we first describe the calibration of an ACM
corresponding to a single timeslice, termed 'Instantaneous calibration'. The
latency and computational constraints for real-time calibration suggest
utilizing the available time axis for rapid convergence. This is implemented in
the tracking component of our algorithm, which implements a temporal
feed-forward of filtered solutions as initial estimates. It may be noted that
our calibration algorithm is limited to operating in the visibility domain, and
does not use the image domain to determine source structure, e.g., via CLEAN
components. This is beneficial for a streaming calibration approach.
Note that since the telescope gains are frequency dependent, the received band
is divided into multiple channels, and the parameter estimation is carried out
separately per channel. A fundamental assumption is that the bandwidth over
which the ACM is formed is narrow enough for phase rotations to compensate for
temporal delays between the reception of the signal at different antennas
\citep{zatman1998narrow}. This is appropriate as the maximum time of flight on
the longest baseline of 300 m (\textasciitilde{}1 $\mu s$) is much less than
the inverse of the typical calibration channel bandwidth of $16$ kHz.
\subsection{Instantaneous calibration}
Array calibration can be formulated as a non-linear parameter estimation
problem, which can be solved using statistically efficient estimators generated
via a Non-linear Least Squares approach. Our approach to calibrating a single
incoming timeslice closely follows that of \citet{wijnholds2009multisource},
which establishes asymptotically efficient estimators for the model parameters
via a Maximum-Likelihood (ML) formulation. Given a set of $p$ antennas whose
locations are known precisely and $q$ calibration sources with nominally known
positions and fluxes within the field of view, the data model developed for the
instantaneous ACM $\mathbf{R}$ in their scheme is given by:
\begin{equation}
\mathbf{R=GAG_{0}\Sigma_{s}G_{0}^{H}A^{H}G^{H}+\Sigma_{n}}\label{eq:datamodel}
\end{equation}
where \textbf{$\mathbf{G=}diag(\left[g_{1},\ldots,g_{p}\right])$ }is the
diagonal matrix of DIE gain of each antenna, $\mathbf{A}$ is the matrix of array
steering vectors, generated using the known positions of the array antennas,
$\mathbf{G_{0}=}diag(\left[g_{01},\ldots,g_{0q}\right])$ is the diagonal matrix
of DDE gain in the direction of each of the $q$ sources,
$\mathbf{\Sigma_{s}}=diag\left(\left[\sigma_{s1}^{2},\ldots,\sigma_{sq}^{2}\right]\right)$
is the known flux of the sources in the sky model, and $\mathbf{\Sigma_{n}}$ is
the diagonal noise covariance matrix assuming an uncorrelated, but non-identical
system noise contribution from each antenna.
The model parameters to solve for are of the form:
\begin{equation}
\bm{\theta}=[\gamma_{1},\ldots\gamma_{p},\phi_{2}...,\phi_{p,}\sigma_{s1}^{2},...\sigma_{sq}^{2},\mathbf{l_{1}}^{T},...\mathbf{l_{q}}^{T},\sigma_{n1},...,\sigma_{np}],\label{eq:estparam}
\end{equation}
where $\mathbf{\gamma_{i}}$ is the direction independent gain of each antenna
and $\phi_{i}$ is the associated phase. $\sigma_{si}$ and $\mathbf{l_i}^{T}$
are the estimated fluxes and positions of the model sources, while
$\sigma_{ni}$ is the system noise, assumed to be independent for each antenna.
Since all signals are assumed to be independent, identically distributed
Gaussian random variables, the Normal Equations for this estimation problem are
generated by minimizing the negative log-likelihood function:
\begin{equation}
\bm{\hat{\theta}}=argmin\left(ln|\bm{R(\theta)}|+tr(\mathbf{R}^{-1}(\bm{\theta})\mathbf{\widehat{R}})\right)\label{eq:normeq}
\end{equation}
where $\bm{R(\theta)}$ is the model covariance matrix as a
function of the parameters $\bm{\theta}$, and $\mathbf{\widehat{R}}$ is
the sample covariance matrix.
Due to the difficulty in solving this minimization problem in closed form, a
numerical optimization based on a weighted least squares covariance matching
estimation technique (COMET) is utilized \citep{ottersten1998covariance}. This
is known to lead to estimates that are equivalent to ML estimates for a large
number of samples, thus being asymptotically efficient and reaching the
theoretical limit of the error on the estimator, the Cramer-Rao lower bound
(CRLB).
The estimation of the instantaneous calibration parameters is carried out by
partitioning the parameters into subsets, which are then estimated using a Least
Squares approach. This approach of alternating between parameter subsets using
the best current estimate of a subset in an iteration to estimate the other
subsets of parameters is called Weighted Alternating Least Squares (WALS).
\subsubsection{\label{sub:Model-generation}Model generation}
\begin{table*}[tbh]
\caption{Details of model sources (the A-team) used for All-sky self-calibration}
\label{tab:Details-of-model}
\center{%
\begin{tabular}{c c c c c}
\hline \hline
Src & $S_{60}(Jy)$ & 74 MHz Size & \% Flux contribution & Comment \\
\hline
3C461 (CasA) & 19605.31 & 7' & $\sim$50 & Spectra from (1), Decay from (2)\\
3C405 (CygA) & 19201.65 & 4.5' & $\sim$42 & Spectra from (1)\\
3C144 (TauA) & 2417.31 & 8' & $\sim$11 & Spectra from (1)\\
3C274 (VirA) & 1656.46 & 14' & $\sim$8& Spectra from (2)\\
\hline
\end{tabular}}
\tablebib{
(1)\citet{baars1977absolute}; (2)\citet{helmboldt2008radio}
}
\tablefoot{ $S_{60}$ has been generated using the spectral indices of
\citet{helmboldt2008radio}, while a secular decrease in the flux of CasA of
0.8\% has been assumed. The fractional flux contribution of each model source
to the flux in the observed snapshot visibilities assumes the flux of
unmodeled sources adds incoherently due to a random sky distribution, along
with a source density of $\sim66 sr^{-1}$ at 178 MHz.}
\end{table*}
Forming the normal equations of Eq. \ref{eq:normeq} for minimization requires
modeling the observed visibilities using the data model in
Eq. \ref{eq:datamodel} and the current estimates of the parameters. Due to the
limited resolution of the array, most of the brightest objects (apart from the
Galactic plane) are unresolved by the AARTFAAC. Thus, the sky can be modeled by
a collection of points at the nominal locations of the bright sources. We use a
sky model composed of the brightest sources in the \textbf{Northern} sky, viz.,
CasA, CygA, VirA, TauA and the Sun, whose nominal positions are determined from
the revised third Cambridge (revised) catalog (3CR). The model parameters used
are summarized in Table \ref{tab:Details-of-model}. The efficacy of this model
for parameter estimation is elaborated upon using real data in Section
\ref{sec:calib-accuracy}. Of these model sources, CasA is visible throughout
the year from the location of the AARTFAAC.
Galactic emission, having a steep spectrum, is extremely bright at LOFAR
frequencies and also difficult to model due to the detailed structure resolvable
at the AARTFAAC's resolution and sensitivity. Hence, we filter out the low
spatial frequencies to suppress this emission during calibration. The model can
then account for a large fraction of the received flux on the filtered
visibilities, and is constrained by the fluxes and positions of the model
sources, as well as the noise model.
The model building requires an estimate of the actual instantaneous flux
$\left(\mathbf{\Sigma_{s}}\right)$ of the model sources, along with the current
estimate of the direction independent gain solutions and the noise. Typically,
an accurate sky model provides the model fluxes as well. However, significant
flux variation of the model sources can be introduced by the ionosphere over the
AARTFAAC array as well as by the direction dependent gain. Hence, estimating
the model source fluxes via an efficient estimator results in the generation of
a consistent sky model. Section \ref{sub:Direction-dependent-gain} summarizes
this approach. Note that a relative flux stability is more relevant for a
transient detection instrument, and can be achieved to a higher accuracy, than an
absolute flux extraction.
A COMET based estimator for the noise covariance has been shown to be well
suited if a linearly parameterized model of the noise covariance matrix is used
for this problem \citep{ottersten1998covariance}. However, antennas in a crowded
array like the AARTFAAC can mutually couple with each other, resulting in
coloring of the noise. Our noise model also includes such effects, and is
discussed in more detail in Section \ref{sub:System-noise-estimation}.
\begin{comment}
Values of A-team and galactic plane contribution is based on actual
contribution to visibilities in night time data (for CasA/CygA and Galaxy), and
day time data for VirA,TauA and the Sun. The total power of calibrated
visibilities = sum(abs(acccalgal(:)).^2), where acccalgal = (gainsol' *
gainsol) .* acc; The Galactic contribution = sum (abs(sigman(:)).^2), but also
includes the autocorrs, which is a sum of Tsys and Tsky, and which cannot be
separated without external measurements of Tsys. This explains the high value
of galactic contribution, against an expected 40% contribution. The RAteam
contribution is estimated by generating model visibilities from fluxes
estimated by LSimaging, ie, the apparent flux, and so is elevation dependent.
NOTE that we dont have observations in which all Ateam sources are at high
elevations, in which case we multiply their visibility contribution by the
approximate beam attenuation. SNR was removed from the table, as it does not
provide very much extra information as compared to the total flux contribution
from a source.
\end{comment}
\subsubsection{\label{sub:Direction-independent-gain}Direction independent gain
estimation (Minor Cycle)}
Once an appropriate model for the observed visibilities has been created,
direction independent gains can be estimated using an appropriate estimator. The
AARTFAAC calibration is latency bound, hence we implement the StEFCal
\citep{salvini2014stef,salvini2014stefursi} algorithm for gain estimation. This
algorithm has a smaller memory footprint, and its computing scales as
$\mathcal{O}(N^{2})$ for N parameters, as against the $\mathcal{O}(N^{3})$
scaling of traditional solvers. This significantly reduces the computing during
AARTFAAC calibration due to the large number of parameters ($\sim$$590$) being
estimated. The StEFCal implementation led to a measured increase in calibration
throughput of a factor $\sim$30 \citep{salvini2014stef}, compared to a
traditional estimator, and makes real-time calibration of every time and
frequency slice feasible. This speed gain is primarily due to linearizing the
cost function, allowing the solution to be computed analytically and hence
avoiding the need for matrix inversions. These, although computationally
costly, are essential to other solvers like the Levenberg-Marquardt minimizer.
StEFCal algorithm has been shown to be unbiased with rapid convergence.
\textbf{Gain Constraints:} Since we simultaneously solve for apparent source
fluxes as well as antenna gain amplitudes, a constraint on either the source
fluxes or the gain amplitudes are needed. However, the variability of model
source fluxes due to ionospheric scintillation prevents their use to constrain
the self-calibration. Doing so couples the estimated gain solutions to
variability in the model fluxes, thus transferring the scintillation to
calibrated visibilities, and hence over the entire field of view. To break this
coupling, we instead use a constraint on the average gain amplitude over all
antennas, setting it to unity. This reflects the behaviour of antenna gain
amplitudes, which were observed to be stable to a few percent across all
antennas and over long times during commissioning. The phases are referenced to
the first antenna in the array as an additional constraint. These constraints
guide the traversal of the $\chi^{2}$ error surface towards an identifiable
global minimum, whose convergence is identified by a slow enough rate of change
of the estimated parameters.
\subsubsection{\label{sub:Direction-dependent-gain}Direction dependent gain estimation (Major Cycle)}
The major cycle creates an updated model sky using the higher accuracy parameter
estimates from the minor cycle. It uses this for estimating direction dependent
effects, parameterized in the apparent fluxes and positions of the model
sources. \textbf{The cycle begins with a one-time estimation of the model source
positions via the WSF algorithm.}
\textbf{Pre-calibration model source position estimation:}The tracking
calibration approach also incorporates a Direction of Arrival (DoA) algorithm
using a vector subspace technique called Weighted Subspace Fitting (WSF)
\citep{viberg1991detection}. This allows us to estimate the instantaneous
position of a model source, thus compensating for the image wander of the
sources due to ionospheric refraction. The WSF is an algorithm for determining
the directions of multiple narrow-band, far-field emitters whose uncorrelated
signals are received by an arbitrary (but known) array geometry. It is a high
resolution algorithm, with a resolution better than $\lambda/D$ (D being the
array size) possible for sources with a high SNR. It operates by partitioning
the received ACM into a signal and a noise subspace based on its
eigen-structure. It then confines the signal subspace corresponding to the true
signal parameters to the subspace spanned by the array manifold vectors, which
represent the functional dependence of the array response vector to a source
over the region of interest in parameter space. Then, the signal parameters are
estimated by finding the best least-squares fit of the two subspaces. A crucial
assumption is that the array manifold is known, implying that the array is
calibrated. To satisfy this requirement, our approach generates initial
calibration solutions based on the catalog positions of the model sources,
calibrates the array and then carries out a WSF estimation.
%% An example of estimation with the WSF on test
%% observations, and its spatial resolution is presented in Figure
%% \ref{fig:Estimated-flux-of}.
\begin{table*}[tbh]
\caption{Flux ratios of bright sources within snapshot from Obs. 3.}
\label{tab:Flux-ratios-of-1}
\center{%
\begin{tabular}{c c c c c c c c}
\hline \hline
Source & $S_{60}$ & $\sigma_{S_{60}}$ & Calibrated & $\sigma$ & Ratio & Comment\\
& (Jy) &(Jy) & flux (Jy) & (Jy) & & \\ %\tabularnewline
\hline
3C10 & 367.9 & 18.81 & 397.02 & 67 & 1.08 & VLSS $N_g$=4, $\alpha$=-0.7\\
3C452 & 152.2 & 10.99 & 184.52 & 28 & 1.21 & VLSS $N_g$=2, $\alpha$=-0.7\\
3C390.3 & 99 & 6.00 & 121.89 & 35 & 1.23 & VLSS $N_g$=3, $\alpha$=-0.7\\
3C380 & 156.2 & 2.99 & 156.2 & 38 & 1 & \citep{scaife2012broad}\\
3C295 & 134.5 & 8.31 & 95.23 & 37 & 0.71 & \citep{scaife2012broad}\\
%% 3C405 & 19202 & & 26927 & 78 & 1.402 & Kassim et. al.\tabularnewline
%% \hline
%% 3C461 & 16145 & & 31758 & 89 & 1.967 & Kassim et. al.\tabularnewline
\hline
\end{tabular}}
\tablefoot{The $S_{60}$ flux has been derived from the best available modeled
spectra, or -0.7 otherwise. $N_g$ is the number of Gaussian components in the
source. The calibrated flux ratio is derived after imaging the calibrated
visibilities and generating light-curves of peak flux from sources in the
snapshots.}
\end{table*}
\textbf{Bias of the WSF estimator:} The requirement for the majority of flux in
the ACM to be contributed by the model sources implies that the algorithm can
produce biased solutions in the presence of unmodeled flux. Tests of WSF show
that spatial filtering of diffuse emission is adequate to prevent this biasing.
Thus, WSF along with LS imaging allows us to accommodate the effect of the
ionosphere into the model visibilities, leading to lower modeling errors, and
hence better estimates of the calibration parameters. Calibrating the data then
requires applying the DIE solutions to the incoming data, while the DDEs are
corrected in the image plane via a beam model which incorporates the effects.
\textbf{Model source flux estimation:} As explained in Section
\ref{sub:Model-generation}, instantaneous estimates of the apparent
(deconvolved) model source flux are required for model generation. This can be
framed as a parameter estimation problem, for which a closed form estimator
based on the COMET approach has been developed in
\citep{wijnholds2008fundamental} in an approach called Least Squares Imaging.
Here, the array configuration is assumed known to a high accuracy, while the
number of sources requiring flux estimation is assumed to be smaller than the
number of resolution elements in the field of view. This approach allows the
deconvolved flux of a model source to be estimated, due to the incorporation of
a deconvolution operator as part of the estimator.
%% Figure \ref{fig:Estimated-flux-of} shows the extracted flux of the brightest
%% visible model sources, and clearly shows the effect of the element beam and
%% ionospheric scintillation.
The model source flux estimator uses a sparse weighting matrix
due to the modeling of mutual coupling via a non-diagonal noise matrix (Section
\ref{sub:System-noise-estimation}), which prevents a bias in estimation.
\subsubsection{\label{sub:System-noise-estimation}System noise estimation in the
presence of Galactic emission and antenna mutual coupling}
Both Galactic emission and coupling between closely spaced antennas can cause
correlated noise on the visibility formed from a pair of antennas. Mutual
coupling due to the antennas being placed closer than half a wavelength at the
lower frequencies can result in fluctuation of the PSF gain and sidelobe levels
as a function of pointing direction \citep{agrawal1972mutual}. This implies
that antenna pattern multiplication (assuming that a single element of an array
behaves similarly to it being isolated) may not apply. Mutual coupling is a
short baseline effect, and can be ignored between the antennas of the different
stations making up the AARTFAAC. The impact of mutual coupling to the antenna
primary beam in the typical LBA\_OUTER mode of observation is expected to be
$<-17dB$ from simulations \citep{wijnholds2011situ}.
The very bright synchrotron background of the Galactic plane at low frequencies
also poses problems. Firstly, the total system noise temperature being dominated
by Galactic emission also leads to correlated noise between antennas. This, in
turn, again leads to poorer sensitivity of the PSF formed by including these
baselines as a function of pointing direction and away from the zenith compared
to the sensitivity expected after pattern multiplication, as found by
\citet{ellingson2011sensitivity}. They also found that the effect of the
Galactic correlated noise dominates that due to mutual coupling, and is a