diff --git a/doc/papers/2011/europar/coherent-dedispersion.jgr b/doc/papers/2011/europar/coherent-dedispersion.jgr index 0910dbb41567d92c7615a96026c30860452f3f22..926f5383799adc26a475fa7748a8ab966c9a276e 100644 --- a/doc/papers/2011/europar/coherent-dedispersion.jgr +++ b/doc/papers/2011/europar/coherent-dedispersion.jgr @@ -1,4 +1,5 @@ newgraph + clip xaxis min 0 max 2 @@ -21,11 +22,11 @@ newgraph hash_label at 2 : 3.76 yaxis - min 0 max 2 nodraw + size 1.2 legend - x 0.5 y 1.2 + x 0.5 y 1.1 newline label : No channel-level dedispersion @@ -34,15 +35,16 @@ newline color 0 0 1 pts shell : N=0;for i in \ - 0.02011669 0.00507009 -0.00771127 0.02275786 -0.13795437 0.01486767\ - 0.04283439 0.18166798 0.20039363 0.43340311 0.61501703 0.80407534\ - 0.83333333 0.75695429 0.69960432 0.66769064 0.65099889 0.45159893\ - 0.43001391 0.30665736 0.12644565 0.01286941 0.084529\ - 0.02011669 0.00507009 -0.00771127 0.02275786 -0.13795437 0.01486767\ - 0.04283439 0.18166798 0.20039363 0.43340311 0.61501703 0.80407534\ - 0.83333333 0.75695429 0.69960432 0.66769064 0.65099889 0.45159893\ - 0.43001391 0.30665736 0.12644565 0.01286941 0.084529 0.02011669;\ - do echo $N / 23 | bc -l; echo "($i + 0.13795437)/(0.83333333 + 0.13795437)" | bc -l; N=$(($N+1)); done + 0.08720009 0.00767691 0.05785112 -0.01541911 0.00221603 -0.00673315\ + 0.01460056 -0.09792603 0.00907605 0.02865762 0.12586534 0.13897656\ + 0.30212383 0.42928525 0.56165903 0.58214473 0.52866608 0.4885111\ + 0.46616596 0.45447882 0.31486408 0.2997508 0.21337971\ + 0.08720009 0.00767691 0.05785112 -0.01541911 0.00221603 -0.00673315\ + 0.01460056 -0.09792603 0.00907605 0.02865762 0.12586534 0.13897656\ + 0.30212383 0.42928525 0.56165903 0.58214473 0.52866608 0.4885111\ + 0.46616596 0.45447882 0.31486408 0.2997508 0.21337971\ + 0.08720009;\ + do echo $N / 23 | bc -l; echo "$i" | bc -l; N=$(($N+1)); done newline label : Channel-level dedispersion @@ -52,13 +54,13 @@ newline pts pts shell : N=0;for i in \ - 0.01427185 -0.05419144 0.0065101 0.06195318 -0.07190334 -0.00771236\ - -0.05202656 -0.04786229 0.01148896 0.39690428 0.71437241 0.83333333\ - 0.62925924 0.49068521 0.41371978 0.49633274 0.53869321 0.46915986\ - 0.23657243 0.14340703 0.06047267 0.01298272 -0.06736764\ - 0.01427185 -0.05419144 0.0065101 0.06195318 -0.07190334 -0.00771236\ - -0.05202656 -0.04786229 0.01148896 0.39690428 0.71437241 0.83333333\ - 0.62925924 0.49068521 0.41371978 0.49633274 0.53869321 0.46915986\ - 0.23657243 0.14340703 0.06047267 0.01298272 -0.06736764 0.01427185;\ - do echo $N / 23 | bc -l; echo "($i + 0.07190334)/(0.83333333 + 0.07190334)" | bc -l; N=$(($N+1)); done - + 0.0774172 0.03210746 -0.0445541 0.00610412 -0.0319828 0.02593199\ + 0.07882975 -0.04888158 0.01236247 -0.02991732 -0.02594422 0.03068228\ + 0.39840362 0.70129715 0.81479671 0.62009142 0.48787918 0.41444714\ + 0.49326743 0.53368318 0.46734203 0.24543242 0.15654414\ + 0.0774172 0.03210746 -0.0445541 0.00610412 -0.0319828 0.02593199\ + 0.07882975 -0.04888158 0.01236247 -0.02991732 -0.02594422 0.03068228\ + 0.39840362 0.70129715 0.81479671 0.62009142 0.48787918 0.41444714\ + 0.49326743 0.53368318 0.46734203 0.24543242 0.15654414\ + 0.0774172;\ + do echo $N / 23 | bc -l; echo "$i" | bc -l; N=$(($N+1)); done diff --git a/doc/papers/2011/europar/lofar.pdf b/doc/papers/2011/europar/lofar.pdf index 5fbe7f74773c85286300e84f1be6ee92e3fb79d1..f18f8ff6e0a00f87bd7537526a1a683f8379f801 100644 Binary files a/doc/papers/2011/europar/lofar.pdf and b/doc/papers/2011/europar/lofar.pdf differ diff --git a/doc/papers/2011/europar/lofar.tex b/doc/papers/2011/europar/lofar.tex index 0a35f84d62dd645c8b5e559c00f3aa57b63b2d53..7cb899fa0922840211f7ad1968ea0826ce481913 100644 --- a/doc/papers/2011/europar/lofar.tex +++ b/doc/papers/2011/europar/lofar.tex @@ -74,8 +74,6 @@ LOFAR imaging pipeline \cite{Romein:10a} \section{LOFAR} \label{Sec:LOFAR} -The LOFAR telescope consists of many thousands of simple dipole antennas (see Figure \ref{fig:lbafield}), grouped in \emph{stations}. The stations are strategically placed, with 20 stations acting as its center (the \emph{core}) and 24 stations at increasing distances from that core (see Figure \ref{fig:map}). A core station can act as two individual stations in some observational modes. Every station collects and combines the signals from its antennas, and sends the resulting data stream to our IBM BlueGene/P (BG/P) supercomputer at our central processing facility. The BG/P combines the data streams from one or more stations and reduces the resulting stream in size sufficiently to be able to store it on disks in our storage cluster. Both the stations and the BG/P perform hard-real-time signal processing. Once the data has been stored on disk, off-line processing takes over. The off-line processing transforms and further reduces the data produced by the BG/P into data products such as images or time series, and are made available to the astronomer(s) that requested the observation. - \begin{figure}[ht] \subfigure[A field with low-band antennas (dipoles).]{ \makebox[35mm][c]{ @@ -100,6 +98,8 @@ The LOFAR telescope consists of many thousands of simple dipole antennas (see Fi \caption{LOFAR antennas} \end{figure} +The LOFAR telescope consists of many thousands of simple dipole antennas (see Figure \ref{fig:lbafield}), grouped in \emph{stations}. The stations are strategically placed, with 20 stations acting as its center (the \emph{core}) and 24 stations at increasing distances from that core (see Figure \ref{fig:map}). A core station can act as two individual stations in some observational modes. Every station collects and combines the signals from its antennas, and sends the resulting data stream to our IBM BlueGene/P (BG/P) supercomputer at our central processing facility. The BG/P combines the data streams from one or more stations and reduces the resulting stream in size sufficiently to be able to store it on disks in our storage cluster. Both the stations and the BG/P perform hard-real-time signal processing. Once the data has been stored on disk, off-line processing takes over. The off-line processing transforms and further reduces the data produced by the BG/P into data products such as images or time series, and are made available to the astronomer(s) that requested the observation. + The antennas are omnidirectional and have no moving parts. Instead, all telescope functions are performed electronically through signal processing done at the stations and on the BG/P. The telescope can be aimed because the speed of light is finite: the light emitted by a source will arrive at different antennas at different times (see Figure \ref{fig:delay}). By adding appropriate delays to the signals from individual antennas before accumulating them, the signals from the source will be amplified with respect to signals from other directions. Once the samples from all antennas are combined, the data are transmitted to the BG/P, which uses the same technique to combine the data from the individual stations. The latter will be explained further in Section \ref{Sec:Beamforming}. A LOFAR station is able to produce 248 frequency subbands of 195~kHz out of the sensitivity range of 80~MHz to 250~MHz. Each sample consists of two complex 16-bit integers, representing the amplitude and phase of the X and Y polarizations of the antennas. The resulting data stream from a station is a 3.1~Gb/s UDP stream. @@ -136,7 +136,7 @@ The BG/P contains several networks. A fast \emph{3-dimensional torus\/} connects \label{fig:ion-processing} \end{minipage} \hfill -\begin{minipage}[t]{0.3\textwidth} +\begin{minipage}[t]{0.4\textwidth} \center \includegraphics[width=0.8\textwidth]{pencilbeams.pdf} \caption{Tied-array beams (hexagons) formed within a station beam (ellipse).} @@ -213,14 +213,14 @@ The beamformer transforms chunks representing station data into chunks represent Another major component in the pulsar-observation pipeline is real-time dedispersion. Since light of a high frequency travels faster through the interstellar medium than light of a lower frequency, the arrival time of a pulse differs for different wave lengths. To combine data from multiple frequency channels, the channels must be aligned (shifted in time). Otherwise, the pulse will be smeared or even overlap with the next pulse, causing many details to be lost. This process, called \emph{dedispersion}, is done by post-processing software that runs after the observation has finished. However, to observe at the lowest frequencies, or to observe fast-rotating millisecond pulsars, dedispersion must also be performed \emph{within\/} a channel, since our channels (typically 12~KHz) are too wide to ignore dispersion. -Dedispersion is performed in the frequency domain, effectively by doing a 4K~Fourier transform (FFT) that splits a 12~KHz channel into 3~Hz subchannels. The phases of the observed samples are corrected by applying a Chirp function~\cite{...}, i.e., by multiplication with precomputed, subchannel-dependent, complex weights. These multiplications are programmed in assembly, to reduce the computational costs. A backward FFT is done to revert to 12~KHz channels. - \begin{figure}[ht] \includegraphics[width=0.5\textwidth]{coherent-dedispersion.pdf} \label{fig:dedispersion-result} -\caption{Pulse profiles of pulsar J0034-0534, with and without dedispersion applied at channel level.} +\caption{Pulse profiles of pulsar J0034-0534, with and without channel-level dedispersion.} \end{figure} +Dedispersion is performed in the frequency domain, effectively by doing a 4K~Fourier transform (FFT) that splits a 12~KHz channel into 3~Hz subchannels. The phases of the observed samples are corrected by applying a Chirp function~\cite{...}, i.e., by multiplication with precomputed, subchannel-dependent, complex weights. These multiplications are programmed in assembly, to reduce the computational costs. A backward FFT is done to revert to 12~KHz channels. + Figure~\ref{fig:dedispersion-result} shows the effectiveness of channel-level dedispersion, where we observed pulsar J0034-0534 with a pulse period of 1.88~ms. By applying dedispersion, the effective time resolution is improved from 0.51~ms to 0.082~ms, revealing a narrower, more detailed pulse and a better signal-to-noise ratio. Dedispersion thus contributes significantly to the data quality, but it also comes at a significant computational cost due to the two FFTs it requires. It demonstrates the power of using a \emph{software\/} telescope: the pipeline component was implemented, verified, and optimized in only one month time. \subsection{Second All-to-all Exchange}