Dual-domain joint learning reconstruction method (JLRM) combined with physical process for spectral computed tomography

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 51,779 characters · extracted from preprint-html · click to expand
Dual-domain joint learning reconstruction method (JLRM) combined with physical process for spectral computed tomography | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Dual-domain joint learning reconstruction method (JLRM) combined with physical process for spectral computed tomography Genwei Ma , Xing Zhao doi: https://doi.org/10.1101/2024.01.22.24301600 Genwei Ma 1 Academy for multidisciplinary studies, Captial Normal University , West third ring road, Beijing, 100048, Beijing, China 3 Beijing Higher Institution Engineering Research Center of Testing and Imaging ,West third ring road, Beijing, 100048, Beijing, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site Xing Zhao 2 School of Mathematical Sciences, Captial Normal University , West third ring road, Beijing, 100048, Beijing, China 3 Beijing Higher Institution Engineering Research Center of Testing and Imaging ,West third ring road, Beijing, 100048, Beijing, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: zhaoxing_1999{at}126.com Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract Spectral computed tomography (SCT) is an powerful imaging modality with broad applications and advantages such as contrast enhancement, artifact reduction, and material differentiation. The positive process or data collected process of SCT is a nonlinear physical process existing scatter and noise, which make it is an extremely ill-posed inverse problem in mathematics. In this paper, we propose a dual-domain iterative network combining a joint learning reconstruction method (JLRM) with a physical process. Specifically, a physical module network is constructed according to the SCT physical process to accurately describe this forward process, which makes the nonlinear use of the traditional mathematical iterative algorithm effective and stable. Additionally, we build a residualto-residual strategy with an attention mechanism to overcome the slow speed of the traditional mathematical iterative algorithm. We have verified the feasibility of the method through our winning submission to the AAPM DL-spectral CT challenge, and demonstrated that high-accuracy also basis material decomposition results can be achieved with noisy data. 1 Introduction Spectral computed tomography (SCT) is popular and promising in clinical and industrial nondestructive testing. Traditional CT aims to accurately recover a detailed internal image of an object by scanning it from different angles. However, it does not consider the polychromaticity of x-rays. SCT, as shown in Fig. 1 , considers the beam spectrum is broad and the polychromatic nature of the x-ray beam makes quantitative imaging. Considering the x-ray spectral information, this leads to more complex reconstruction problems. Hence, in SCT, an object is scanned with different x-ray spectra or spectral separations from the broad spectrum to supplement the information. Spectral x-ray data collection methods include kVp-switching [ 1 ], dual-source scanning [ 2 ], dual-layer detection, simplistic two-pass scanning, and photon counting detectors [ 3 , 4 ]. Generally, the collected data of SCT, also known as polychromatic projection data, are utilized to perform energyand material-selective reconstructions [5– 8]. In other words, SCT not only can distinguish materials better but allows quantification of the mass density of two or more materials in a tissue or a mixture with known elemental composition [ 9 ]. Download figure Open in new tab Fig. 1. Spectral computed tomography imaging process. In mathematics, the SCT reconstruction problem can be seen as solving for µ ( x, E ) from K sets of polychromatic projection data under different spectra or spectral separation, where is the linear attenuation coefficient of the scanned object at point with energy E and S k ( E ), k = 1, 2.is normalized effective spectrum, ∫ S k ( E ) dE = 1 and ϵ k represent scatter or noise of the k th projection. In SCT, the linear attenuation coefficient is generally decomposed as a linear combination of some predefined basis functions, where θ i ( E ) are energy-dependent functions, and are functions of spatial position. There are two physical explanations for this equation. The first one is the decomposition method based on the physical effect, where M = 2 in this case and the functions based on the photoelectric effect and Compton scattering.The second explanation is basis material decomposition. θ i ( E ), represent the mass attenuation coefficients of the selected basis materials. The reconstructed , represent the densities of the basis materials of the scanned object. Substituting (2) into (1), we can obtain the discrete form of SCT as follow: where R i,k , k = 1, 2, K , represents the k th Radon transform. Compared with traditional CT, the reconstruction problem of SCT is nonlinear and ill-posed. Moreover, real projection data may be inconsistent. Algorithms to solve this problem can be classified in two ways. According to the domain where the data are processed, the methods can be divided into image domain methods [ 8 – 14 ] and projection domain methods [ 15 , 16 ]. They can also be categorized into direct mapping methods [ 5 , 10 – 15 , 17 – 19 ], iterative algorithms [ 16 , 20 – 31 ], and deep-learning methods [ 32 – 40 ]. Several researchers combine these classifications. Image domain methods, also known as post-processing methods, directly process images that have been reconstructed from collected raw data. The reconstructed image is generally solved using a linear algorithm, such as the algebra reconstruction technique (ART) or filter back-projection (FBP). This is actually a first-order approximation of the original nonlinear data, although image domain methods use different basis functions [ 10 , 11 , 15 , 18 ] to approximate it. Hence, the reconstructed images still suffer from artifacts such as beam-hardening. Projection domain methods process either raw or log-transformed data before image reconstruction. Theoretically, projection domain methods can obtain better images than image domain methods, because they can compensate for nonlinear effects on material decomposition and suppress artifacts in the decomposition process. However, polychromatic projections require geometric consistency, and it is notoriously difficult to practical SCT system. Direct mapping constructs a basis function and establishes a mapping between the SCT data and basis material. While direct mapping methods are quick and simple and do not consider the spectrum information and attenuation coefficient of materials, they are highly dependent on the calibration phantom, which limits the accuracy of the reconstructed images. Iteration reconstruction algorithms are the most effective way to solve ill-posed nonlinear inverse problems. Unfortunately, they are time-consuming when the geometric parameters of different spectral scans are inconsistent. Many researchers combine the statistical assumptions of raw data and prior information on images, but this involves hyperparameters that can only be adjusted empirically and do not offer consistent image quality improvement [ 41 ]. sourcedual-detector CT systems [ 42 , 43 ]. In recent years, deep learning methods have obtained high-quality reconstructed images with complete training samples. However, much training data are required to train the network-trainable parameters, and it is difficult to obtain in many cases. Sidky et al . lead to the AAPM challenge named DL-spectral CT. This challenge provides an opportunity for investigators in SCT image reconstruction, using data-driven or iterative techniques, to compete with their colleagues on the accuracy of their methodology for solving the inverse problem associated with spectral CT acquisition from incomplete, noiseless measurements. a This study aims to demonstrate whether deep neural networks can realize high-precision decomposition images of basis materials and establish a foundation for SCT reconstruction algorithms based on big data and deep learning [ 41 ]. We propose an iterative network method that fuses SCT physical processes and traditional mathematical algorithms. Although the AAMP challenge provides accurate physical processes (including spectrum and attenuation coefficient information), our method describes the physical process and relevant physical quantities as learnable network parameters, which is more flexible. As with DL-sparse-view CT, high reconstruction accuracy is only possible if the forward model is explicitly incorporated into the solution map, e.g., by an iterative promotion of data-consistency [ 44 ]. Here, we also build physical process into precise physical module, which can realize the accurate expression of the positive process in iterative steps, so as to realize the residual transmission correctly. For the noisy case, we add regularization terms, which is more practical. The main contributions of our work are as follows: The proposed method is based on the complementary advantages of physical processing, traditional mathematical iteration algorithms (TMIAs), and deep learning. Physical processing realizes the accurate expression of physical phenomena, TMIAs robustly achieve domain transformation, and deep learning can accurately materials decomposition. A network joint physical model governs SCT projection data generation. Hence, the network can more accurately express the SCT physical process. Only when the physical process can be accurately and adequately described by one model can the iterative process continuously improve reconstruction accuracy. The physical model of SCT is defined as a module of the network whose x-ray spectra S k ( E ) and attenuation coefficient θ ( E ) correspond to the learnable parameters. In the iteration process, the input/label data of networks use residual-toresidual to train the network model, rather than image-to-image or imageto-residual. Because places with large errors are observable in the residual image, it is difficult to distinguish them in the image. Moreover, residual-toresidual builds into the residual attention mechanism. Attention operations in residual images make network training easier. The network structure is combined with practical problems. The SCT projection data and reconstructed image are domain-related, but even in inconsistent projections, the associated region is relatively small. Therefore, CNN can apply SCT, but the receptive field should not be generous, so as to avoid phenomena such as overfitting and poor robustness. 2 Method 2.1 JLRM architecture We formulate SCT reconstruction as a nonlinear optimization problem to solve basis material images from acquired polychromatic projections : where corresponds to the nonlinear SCT physical process, and ℛ 1 and ℛ 2 are network regularization terms in the projection and image domains, respectively, which are used for the case of existing noise or scattering. In this way, ℛ 1 can more accurately describe the physical model for the noise or scattering case. ℛ 2 can effectively suppress noise or scattering and obtain better reconstructed images. In our experiments, the traditional mathematical iteration algorithm (TMIA) uses the SART algorithm during iteration process and the other TMIA also support. The third step is worth noting. We first calculate the projection residuals for reconstruction, and the results are input to the CNN to obtain the residuals of the base material images. That is, we use the residual-to-residual strategy for network training, which can more effectively improve the image quality. Generally, the initial value also has a pronounced influence on the convergence speed of the iterative algorithm. Therefore, we incorporate a pre-decomposition module before the iterative process. Our SCI network includes a pre-decomposition module and an iteration process, as shown in Fig. 2 . The pre-decomposition module includes TMIA and CNN steps. For TMIA, we use the E-ART method, which is not sensitive to spectral information, and the quality of reconstructed images is higher than with other analytic algorithms. For the iterative process, the three steps of the incremental method are consistent. As mentioned above, we use a residualto-residual strategy for effective network training. An attention mechanism is incorporated before the residual image input CNN, for easy network training and quick convergence. Below we show pseudocode for the training stage (Algorithm 1) and test stage (Algorithm 2). Download figure Open in new tab Fig. 2. Architecture of proposed method, including pre-decomposition module and iteration process. Algorithm 1 Training stage Download figure Open in new tab The proposed method is based on the complementary advantages of physical processing, TMIAs, and deep learning. Physical processing realizes the accurate expression of physical phenomena, while TMIAs achieve domain transformation, and deep learning can accurately materials decomposition. The three parts are interdependent and complementary. Algorithm 2 test stage Download figure Open in new tab 2.2.1 Physical module for nonlinear physical process Only when the physical process can be accurately described by the model can the iterative reconstruction process continuously improve reconstruction accuracy. Here, to accurately describe the nonlinear physical process of SCT, its positive process is equivalently mapped into a network module. As shown in Fig. 3 , Firstly, do a Radon transform for three basis material. This can be achieved by a projection layer [ 45 , 46 ]. Here, we have overridden the interface which projection and back-projection operators are provide by official. Next, the module can be constructed according to the discrete polychromatic projection formula, where the spectral information and attenuation coefficient can be set as corresponding learning parameters. In fact, both sets of learnable parameters can be achieved by a convolution operator. For the attenuation coefficient, this layer can set K convolution kernels, of size N k × M × 1 × 1 ( out channels × in channels × height × width ). For spectral information, the size of K convolution kernels is 1 × N k × 1 × 1. For the noise case, a regularization term network should be added in the physical module to more accurately express the physical process. Download figure Open in new tab Fig. 3. Physical process equivalent mapping physical module. 2.1.2 CNN network structure design The network structure is also critical to the reconstruction result, because our network is trained block-to-block. Once overfitting occurs, the results of subsequent iterations are disastrous. The CNNs of pre-decomposition and iterative processes are basically similar, with structures as displayed in Fig. 4 . The biggest difference between them is the channel setting of input data, in which the channel of CNN 1 is set to 2, while that of CNN 2 is 6. The CNN contains eight blocks, each with three convolution layers, and the kernel sizes are 3×3, 1×1, and 3×3. It is worth noting that network operations such as downsampling, upsampling, and transpose convolution, which make the receptive field large, cannot be used. Although the projection is inconsistent and the pixels of basis material images are domain-related, the regional correlation caused by the inconsistency is very small, and increasing the receptive field will aggravate overfitting, which is fatal for later iterations to obtain more accurate decomposition results. Download figure Open in new tab Fig. 4. CNN network structure with eight blocks, each with three convolution layers. 2.1.3 Residual-to-residual strategy The residual-to-residual strategy proposed based on experiments observations which can effectively improve the accuracy of reconstruction. As shown in Fig. 5 , regions with large errors can be directly located in the residual image, where it is difficult to find in reconstructed images. Hence, the image-to-residual strategy may bring new errors, with many uncertainties to improve the quality of reconstructed images. In other words, image-to-residual is unstable for improving image quality. Download figure Open in new tab Fig. 5. Residual-to-residual vs. image-to-residual strategy. Residual-to-residual strategy makes it easier to locate where there are large errors. The ReLU activation function is often used in the network, which makes the images obtained by the network nonnegative. The residual image does not possess this property. To use the nonlinear ReLU activation function, we decompose the residual image dx into the form where dx + and dx − are, respectively, the positive and negative parts of the residual image. Thus, the network output becomes an image with two nonnegative channels. 2.1.4 Residual attention mechanism Generally speaking, in reconstructed residual images, even if the decomposition is correct, there are still some errors, and this phenomenon occurs at the edges of basis material images. This can be overcome by incorporating an attention mechanism 47–49] to emphasize the edges, which can make the network training more simple and efficient. Attention includes both channel and spatial attention. In our case, we need to emphasize edges that are spatial features, so spatial attention is employed. Given a tensor of intermediate feature map η ∈ R c×h×w , spatial attention generates a spatial attention map A ∈ R 1 ×h×w by utilizing the inter-spatial relationships of features. Then the output of the attention mechanism, , can be expressed as where ⊙ denotes element-wise multiplication and c is the channels of input data. During multiplication, the attention values are broadcast (copied) to all feature maps along the channel dimension. The spatial attention focusing on “where” is the most informative part. Considering that there are three materials, we implement the attention mechanism in three directions. As shown in Fig. 6 , our attention mechanism consists of three pipelines to construct three spatial attention maps. Given a two-dimensional feature map Download figure Open in new tab Fig. 6. Residual attention mechanism. f ∈ R h×w , which is obtained by applying the weighting transform on three basis material images, let us define where a 1 , b 1 and a 2 , b 2 represent the weight parameters and bias in the 1×1 convolutional layer, and sigmoid denotes the sigmoid activation function. Here, we set the initial values as a i = 1, i = 1, 2, 3, and b i = 0, i = 1, 2, 3. To apply the attention mechanism, each residual image element-wise multiply spatial attention maps and obtained feature maps would have been re-weighted, which is helpful to accelerate the convergence of the network. 2.2 Network training The proposed method was implemented using Python under the PyTorch framework. Each module was trained module-by-module, and the network was optimized using the Adam optimization method with a min-batch of nine image patches for each iteration. The objective function for each module used an MSE loss function, where x, y ∗ are the input/label data, and Θ denotes the network learnable parameters. The complete training samples were randomly shuffled, and as an empirical stopping criterion of each module, the number of training epochs was set to 1000. Comparative experiments were performed on a PC (AMD EPYCRome processor, 128 GB RAM). Training was executed on a single graphic processing Nvidia RTX A6000 with 48 GB of video memory. 3 Results Experiments were carried out to demonstrate the behavior of the proposed method, including architecture validation, for example, residual analysis and the performance of JLRM in noise suppression, reconstruction method, CNN network structure design and residual-to-residual strategy. 3.1 DL-spectral CT setup of AAPM challenge This challenge focuses on spectral CT, where the object is scanned by X-rays with two spectra, i.e., K = 2, without noise. This challenge model an ideal form of fast kVp-switching where the X-ray tube voltage alternates between two settings for consecutive projections. For each kVp setting, the beam spectrum is broad and the polychromatic nature of the X-ray beam makes quantitative imaging in CT quite challenging when only one kVp setting is used. Scanned objects are simulated for a breast model [ 50 ] that contains three tissue types ( M = 3): adipose, fibroglandular, and calcification. Truth images and simulated data are provided for 1000 cases so that participants can decide to use either a data-driven or optimization-based technique. The SCT imaging process can be seen in Fig. 7 , which shows the spectral information used in the imaging process and the linear attenuation coefficient of the material. It can be observed that the linear attenuation coefficients of the two materials are very close. This is a tricky point, as discussed in the experimental results. To be fair, the test dataset adopts 10 additional cases, which are provided in a “starting kit” with ground-truth images. The fan-beam geometric parameters of the SCT system are listed in Table 1 . The DL-spectral-CT challenge seeks the image reconstruction algorithm that provides the most accurate reconstruction of the adipose, fibroglandular, and calcification spatial maps from SCT projection data. Details about the challenge setup and results can be found on the official website. b View this table: View inline View popup Download powerpoint Table 1. System and geometric scanning parameters of AAPM DL-spectral CT challenge dataset Download figure Open in new tab Fig. 7. SCT imaging, where forward process is data collection, which is also a physical process. Inverse process is reconstruction, i.e., basis material decomposition. 3.2 Performance and analysis of JLRM We demonstrate that JLRM can be trained to accurately reconstruct basis material images from collected projection data obtained from the DL-spectral CT of the AAPM challenge. As described in section 2 , the JLRM method includes a pre-decomposition module and two iteration of the iteration process. Fig. 8 shows the basis material images of these three modules. It is difficult to visually distinguish the image quality reconstructed by each module. The last row indicates the tissue label map of the three materials, from which we can clearly see the proportion of each material in each pixel. Fig. 9 shows the different images. The accuracy of the proposed method can be further improved, and the sequence module can continuously improve the accuracy of reconstruction based on comparison with the differential images of each module. Even in the display window with almost mechanical accuracy, the difference images of the final result (2 iterations) are difficult to indicate a large error. This can verify that our method can achieve near exact reconstruction. Table 2 shows the average RMSE for quantitative evaluation, which further indicates that our method can obtain accurate reconstruction. The accuracy of the results finally submitted in the AAPM challenge is 6.8×10 − 7 . Report to the second place accuracy of 6.21 ×10 − 6 , our reconstruction accuracy is higher one order of magnitude. View this table: View inline View popup Download powerpoint Table 2. Average RMSE for quantitative evaluation. Download figure Open in new tab Fig. 8. Left to right: ground truth, results of pre-decomposition block, iteration process with 1 and 2 iterations. Display windows: [0.15, 0.35] for adipose material, [0.3, 0.7] for fibroglandular material, [0.1, 0.5] for calcification material. Last row: tissue label map with adipose (blue), fibroglandular (green), calcification (red). Download figure Open in new tab Fig. 9. Left to right: ground truth, difference images of pre-decomposition block, iteration process with 1 and 2 iterations. Display windows of difference images are [-0.00005, 0.00005]. To better understand the behavior of each module of the proposed method, Fig. 10 shows the loss function update curve of each material of each module. In the pre-decomposition module, adipose and fibroglandular material cannot reach the mechanical accuracy, but more cases of calcification material can reach the mechanical accuracy. In the iteration process, the accuracy can be well improved using the residual-to-residual strategy. Download figure Open in new tab Fig. 10. Update curves of three material loss functions. Left to right: adipose, fibroglandular, and calcification material. 3.3 Residual analysis Because the projection data of the AAPM challenge are noise-free, a crucial way of a proper solver for this DL spectral-CT problem is evaluating this difference images , which should be as low as possible. We analyze this aspect in Fig. 11 . For better analysis and observation, we reconstructed the residual images from the residual of projection. Fig. 12 displays the reconstructed residual images. We note that the residual images in the image domain also showed a decreasing trend. The results of the final iteration showed that each pixel of the residual was all within the mechanical accuracy. Download figure Open in new tab Fig. 11. Errors of projection domain for each module. Download figure Open in new tab Fig. 12. Errors of image domain for each module. Colored boxes mark trend of updates during iterative process; corresponding zoomed-in views are displayed in left corner. Some pixels with small residuals, marked by red boxes in Fig. 12 , cannot be updated effectively in the first iteration, and are shown to be more obvious in the residual image after one iteration, which facilitates further performance improvement. Some regions with large errors can continuously shrink during the iteration process, although updates still have larger errors, as marked by blue boxes. 3.4 Performance of JLRM in noise suppression To ensure universality, we study the noise data. The statistics of x-ray measurements are often described using a Poisson distribution to model the incident intensity, where I noisy,k and q k denote received intensity of detectors and noise-free projection data, respectively. The noisy projection data . Table 3 lists the accuracy of the proposed method under different noise levels. As shown in previous experimental results, the phenomenon of adipose and fibroglandular materials is also consistent, mainly because the attenuation coefficients of the two materials are very similar. Hence, the two materials are easily decomposed incorrectly, and their performance evaluation indices are basically consistent. The attenuation coefficient of calcification material is large, and its size is very small; hence, calcification material can still have mechanical accuracy with high noise levels ( I 0 = 1 × 10 5 ) and can do so quickly when the noise level is relatively low ( I 0 = 1 × 10 6 ). View this table: View inline View popup Download powerpoint Table 3. Average RMSE of dataset with different noise levels for quantitative evaluation. To further understand the effect of noise on the decomposition results of adipose and fibroglandular materials, we analyze a set of results obtained from noise-free pre-decomposition. As in the residual analysis of section 3.3 , the obtained projection domain residuals are reconstructed to obtain the results shown in Fig. 13 , where the projection residuals are obtained by performing the physical process with the pre-decomposition results minus the noisy projections, i.e., . Fig. 13 shows that it is too difficult to reflect some decomposition errors in the image when the noise is relatively large, such as those marked in the red box (zoomed-in view is shown in upper-right corner). However, in some locations where the error is smaller, the noise is small but also difficult to decompose, while the noise-free case can be obviously found, such as in the blue box (zoomed-in view shown in upper-left corner). Download figure Open in new tab Fig. 13. Residual images with different noise levels. Colored boxes mark details of images under different noise levels; corresponding zoomed-in views are displayed in upper corners. 3.5 Receptive field: small or large? As argued in CNN network structure design of section 2 increasing the receptive field will aggravate the overfitting phenomenon, which is fatal for the later iteration to obtain more accurate decomposition results. Fig. 14 shows the loss function curve update of the pre-decomposition module. During the training process of the proposed CNN, the changes of the training and test sets are essentially the same with the iterative update. For UNet, using pooling and upsampling layers causes the network to have a large receptive field. However, the experimental results show that adipose and fibroglandular materials display an obvious overfitting phenomenon after a period of training. Download figure Open in new tab Fig. 14. Update curves of three material loss functions for pre-decomposition module with networks with different receptive fields. Fig. 15 shows the performance of overfitting in the reconstructed image of adipose material, where fibroglandular material has the same phenomenon. The training set has higher accuracy for UNet, and the error in the difference image is quite small, while the test set has a significantly larger error. Download figure Open in new tab Fig. 15. Results of reconstruction of training and test sets using a larger receptive field. Display windows: [0, 1 ] for material images, and [-0.05,0.05] for difference images. 3.6 Residual-to-residual vs. image-to-residual We research the mapping strategy. Fig. 16 displays the partial results of two iterations of the image-to-residual and residual-to-residual mapping strategies for adipose and fibroglandular materials. The image-to-residual mapping strategy may bring new reconstruction errors, so that the accuracy of the final reconstruction cannot be really improved, and there exists the risk of instability. Due to the places with large errors are difficult to distinguish them in the reconstruction images. The residual-to-residual strategy can effectively improve the accuracy compared with the image-to-residual strategy. The highprecision reconstruction results can be attributed to the following: 1) It can calculate the residual in combination with the physical module; 2) The attention mechanism is used to reduce the complexity of network decomposition; 3) The residual-to-residual strategy avoids large numbers eating decimals. Download figure Open in new tab Fig. 16. Results of residual-to-residual and image-to-residual mapping strategies. Display windows: [0, 1 ] for material images and [-0.05,0.05] for different images. 4 Discussion To solve the problem of high-precision base material decomposition in spectral CT, this paper proposes an algorithm fused on a physical model, traditional mathematical iterative algorithm, and deep learning. Each part has clear functions and is built based on given problems and actual situations. The physical module, which is embedded and expressed as a network structure, can accurately describe the physical process of SCT imaging. The mathematical iterative algorithm realizes information transfer between domains. These three modules complement each other. We introduce some network skills or strategies in some modules, which are observations related to SCT problems, and can improve the reconstruction results. Examples are a residual attention mechanism and the study of the receptive field. To further illustrate the effectiveness of our method, we study it when the data are noisy. The JLRM algorithm is based on deep learning, which mixes mathematics and physics. It can obtain satisfactory decomposition results due to a large number of training datasets. In practice, it is difficult to obtain a large volume of SCT projection data, and it requires matching label data (basis material images). The current energy spectrum is based on the data generated under a single specific energy spectrum. However, the spectral curves of the actual scanning system under the same energy are not necessarily consistent. Data Availability All data produced are available online at https://dl-sparse-view-ct-challenge.eastus.cloudapp.azure.com/competitions/3#learn_the_details Acknowledgments This work was supported by the National Natural Science Foundation of China (No. 61827809) and the National Key Research and Development Program of China (No. 2020YFA0712200). The authors are grateful to the Beijing Higher Institution Engineering Research Center of Testing and Imaging and the Beijing Advanced Innovation Center for Imaging Technology for funding this research work. Footnotes ↵ a https://dl-sparse-view-ct-challenge.eastus.cloudapp.azure.com/competitions/3 ↵ b https://dl-sparse-view-ct-challenge.eastus.cloudapp.azure.com/competitions/3#learn_the_details References [1]. ↵ Xu , D. , Langan , D.A. , Wu , X. , Pack , J.D. , Benson , T.M. , Tkaczky , J.E. , Schmitz , A.M. : Dual energy ct via fast kvp switching spectrum estimation . In: Medical Imaging 2009: Physics of Medical Imaging , vol. 7258 , pp. 1198 – 1207 ( 2009 ). SPIE OpenUrl [2]. ↵ Petersilka , M. , Bruder , H. , Krauss , B. , Stierstorfer , K. , Flohr , T.G. : Technical principles of dual source ct . European journal of radiology 68 ( 3 ), 362 – 368 ( 2008 ) OpenUrl CrossRef PubMed [3]. ↵ Leng , S. , Bruesewitz , M. , Tao , S. , Rajendran , K. , Halaweish , A.F. , Campeau , N.G. , Fletcher , J.G. , McCollough , C.H. : Photon-counting detector ct: System design and clinical applications of an emerging technology . Radiographics 39 ( 3 ), 729 – 743 ( 2019 ). doi: 10.1148/rg.2019180115 OpenUrl CrossRef PubMed [4]. ↵ Willemink , M.J. , Persson , M. , Pourmorteza , A. , Pelc , N.J. , Fleischmann , D. : Photon-counting ct: Technical principles and clinical prospects . Radiology 289 ( 2 ), 293 – 312 ( 2018 ). doi: 10.1148/radiol.2018172656 OpenUrl CrossRef PubMed [5]. ↵ Alvarez , R.E. , Macovski , A. : Energy-selective reconstructions in x-ray computerised tomography . Physics in Medicine and Biology 21 ( 5 ), 733 ( 1976 ) OpenUrl CrossRef PubMed Web of Science [6]. Alvarez , R. , Seppi , E. : A comparison of noise and dose in conventional and energy selective computed tomography . IEEE Transactions on Nuclear Science 26 ( 2 ), 2853 – 2856 ( 1979 ) OpenUrl CrossRef [7]. Alvarez , R.E. , Seibert , J.A. , Thompson , S.K. : Comparison of dual energy detector system performance . Medical physics 31 ( 3 ), 556 – 565 ( 2004 ) OpenUrl CrossRef PubMed [8]. ↵ Kalender , W.A. , Perman , W. , Vetter , J. , Klotz , E. : Evaluation of a prototype dual-energy computed tomographic apparatus . i. phantom studies. Medical physics 13 ( 3 ), 334 – 339 ( 1986 ) OpenUrl [9]. ↵ Yu , L. , Leng , S. , McCollough , C.H. : Dual-energy ct–based monochromatic imaging . American journal of Roentgenology 199 ( 5 supplement ), 9 – 15 ( 2012 ) OpenUrl [10]. ↵ Brooks , R.A. , Di Chiro , G. : Beam hardening in x-ray reconstructive tomography . Physics in medicine & biology 21 ( 3 ), 390 ( 1976 ) OpenUrl [11]. ↵ Coleman , A. , Sinclair , M. : A beam-hardening correction using dual-energy computed tomography . Physics in medicine & biology 30 ( 11 ), 1251 ( 1985 ) OpenUrl [12]. Cardinal , H.N. , Fenster , A. : An accurate method for direct dual-energy calibration and decomposition . Medical physics 17 ( 3 ), 327 – 341 ( 1990 ) OpenUrl CrossRef PubMed [13]. Dong , X. , Niu , T. , Zhu , L. : Combined iterative reconstruction and image-domain decomposition for dual energy ct using total-variation regularization . Medical physics 41 ( 5 ), 051909 ( 2014 ) OpenUrl [14]. ↵ Zeng , D. , Huang , J. , Zhang , H. , Bian , Z. , Niu , S. , Zhang , Z. , Feng , Q. , Chen , W. , Ma , J. : Spectral ct image restoration via an average image-induced nonlocal means filter . IEEE Transactions on Biomedical Engineering 63 ( 5 ), 1044 – 1057 ( 2015 ) OpenUrl [15]. ↵ Stenner , P. , Berkus , T. , Kachelriess , M. : Empirical dual energy calibration (edec) for cone-beam computed tomography . Medical physics 34 ( 9 ), 3630 – 3641 ( 2007 ) OpenUrl PubMed [16]. ↵ Maaß , N. , Sawall , S. , Knaup , M. , Kachelrieß , M. : Empirical multiple energy calibration (emec) for material-selective ct . In: 2011 IEEE Nuclear Science Symposium Conference Record , pp. 4222 – 4229 ( 2011 ). IEEE [17]. ↵ Ying , Z. , Naidu , R. , Crawford , C.R. : Dual energy computed tomography for explosive detection . Journal of X-ray Science and Technology 14 ( 4 ), 235 – 256 ( 2006 ) OpenUrl [18]. ↵ Maaß , C. , Meyer , E. , Kachelrieß , M. : Exact dual energy material decomposition from inconsistent rays (mdir) . Medical physics 38 ( 2 ), 691 – 700 ( 2011 ) OpenUrl CrossRef PubMed [19]. ↵ Feng , C. , Shen , Q. , Kang , K. , Xing , Y. : An empirical material decomposition method (emdm) for spectral ct . In: 2016 IEEE Nuclear Science Symposium, Medical Imaging Conference and Room-Temperature Semiconductor Detector Workshop (NSS/MIC/RTSD) , pp. 1 – 5 ( 2016 ). IEEE [20]. ↵ Sukovic , P. , Clinthorne , N.H. : Penalized weighted least-squares image reconstruction for dual energy x-ray transmission tomography . IEEE transactions on medical imaging 19 ( 11 ), 1075 – 1081 ( 2000 ) OpenUrl PubMed [21]. Elbakri , I.A. , Fessler , J.A. : Statistical image reconstruction for polyenergetic x-ray computed tomography . IEEE transactions on medical imaging 21 ( 2 ), 89 – 99 ( 2002 ) OpenUrl CrossRef PubMed [22]. Xu , Q. , Mou , X. , Tang , S. , Hong , W. , Zhang , Y. , Luo , T. : Implementation of penalized-likelihood statistical reconstruction for polychromatic dualenergy ct . In: Medical Imaging 2009: Physics of Medical Imaging , vol. 7258 , pp. 1666 – 1674 ( 2009 ). SPIE OpenUrl [23]. Long , Y. , Fessler , J.A. : Multi-material decomposition using statistical image reconstruction for spectral ct . IEEE transactions on medical imaging 33 ( 8 ), 1614 – 1626 ( 2014 ) OpenUrl [24]. Niu , T. , Dong , X. , Petrongolo , M. , Zhu , L. : Iterative image-domain decomposition for dual-energy ct . Medical physics 41 ( 4 ), 041901 ( 2014 ) OpenUrl [25]. Zhang , R. , Thibault , J.-B. , Bouman , C.A. , Sauer , K.D. , Hsieh , J. : Modelbased iterative reconstruction for dual-energy x-ray ct using a joint quadratic likelihood model . IEEE transactions on medical imaging 33 ( 1 ), 117 – 134 ( 2013 ) OpenUrl [26]. Zhao , Y. , Zhao , X. , Zhang , P. : An extended algebraic reconstruction technique (e-art) for dual spectral ct . IEEE transactions on medical imaging 34 ( 3 ), 761 – 768 ( 2014 ) OpenUrl [27]. Hu , J. , Zhao , X. , Wang , F. : An extended simultaneous algebraic reconstruction technique (e-sart) for x-ray dual spectral computed tomography . Scanning 38 ( 6 ), 599 – 611 ( 2016 ) OpenUrl [28]. Chen , B. , Zhang , Z. , Sidky , E.Y. , Xia , D. , Pan , X. : Image reconstruction and scan configurations enabled by optimization-based algorithms in multispectral ct . Physics in Medicine & Biology 62 ( 22 ), 8763 ( 2017 ) OpenUrl [29]. Li , M. , Zhao , Y. , Zhang , P. : Accurate iterative fbp reconstruction method for material decomposition of dual energy ct . IEEE transactions on medical imaging 38 ( 3 ), 802 – 812 ( 2018 ) OpenUrl [30]. Zhao , S. , Pan , H. , Zhang , W. , Xia , D. , Zhao , X. : An oblique projection modification technique (opmt) for fast multispectral ct reconstruction . Physics in Medicine & Biology 66 ( 6 ), 065003 ( 2021 ) OpenUrl [31]. ↵ Zhang , W. , Zhao , S. , Pan , H. , Zhao , Y. , Zhao , X. : An iterative reconstruction method based on monochromatic images for dual energy ct . Medical Physics 48 ( 10 ), 6437 – 6452 ( 2021 ) OpenUrl [32]. ↵ Touch , M. , Clark , D.P. , Barber , W. , Badea , C.T. : A neural network-based method for spectral distortion correction in photon counting x-ray ct . Physics in Medicine & Biology 61 ( 16 ), 6132 ( 2016 ) OpenUrl [33]. Liao , Y. , Wang , Y. , Li , S. , He , J. , Zeng , D. , Bian , Z. , Ma , J. : Pseudo dual energy ct imaging using deep learning-based framework: basic material estimation . In: Medical Imaging 2018: Physics of Medical Imaging , vol. 10573 , pp. 1190 – 1194 ( 2018 ). SPIE OpenUrl [34]. Zhao , W. , Vernekohl , D. , Han , F. , Han , B. , Peng , H. , Yang , Y. , Xing , L. , Min , J.K. : A unified material decomposition framework for quantitative dual-and triple-energy ct imaging . Medical physics 45 ( 7 ), 2964 – 2977 ( 2018 ) OpenUrl [35]. Xu , Y. , Yan , B. , Chen , J. , Zeng , L. , Li , L. : Projection decomposition algorithm for dual-energy computed tomography via deep neural network . Journal of X-ray science and technology 26 ( 3 ), 361 – 377 ( 2018 ) OpenUrl [36]. Xu , Y. , Yan , B. , Zhang , J. , Chen , J. , Zeng , L. , Wang , L. : Image decomposition algorithm for dual-energy computed tomography via fully convolutional network . Computational and mathematical methods in medicine 2018 ( 2018 ) [37]. Hu , D. , Wu , W. , Xu , M. , Zhang , Y. , Liu , J. , Ge , R. , Chen , Y. , Luo , L. , Coatrieux , G. : Sister: Spectral-image similarity-based tensor with enhanced-sparsity reconstruction for sparse-view multi-energy ct . IEEE Transactions on Computational Imaging 6 , 477 – 490 ( 2019 ) OpenUrl [38]. Wu , X. , He , P. , Long , Z. , Guo , X. , Chen , M. , Ren , X. , Chen , P. , Deng , L. , An , K. , Li , P. , et al : Multi-material decomposition of spectral ct images via fully convolutional densenets . Journal of X-Ray Science and Technology 27 ( 3 ), 461 – 471 ( 2019 ) OpenUrl [39]. Li , D. , Li , S. , Zhu , M. , Gao , Q. , Bian , Z. , Huang , H. , Zhang , S. , Huang , J. , Zeng , D. , Ma , J. : Unsupervised data fidelity enhancement network for spectral ct reconstruction . In: Medical Imaging 2020: Physics of Medical Imaging , vol. 11312 , pp. 1081 – 1088 ( 2020 ). SPIE OpenUrl [40]. ↵ Yao , L. , Li , S. , Li , D. , Zhu , M. , Gao , Q. , Zhang , S. , Bian , Z. , Huang , J. , Zeng , D. , Ma , J. : Leveraging deep generative model for direct energyresolving ct imaging via existing energy-integrating ct images . In: Medical Imaging 2020: Physics of Medical Imaging , vol. 11312 , pp. 1190 – 1195 ( 2020 ). SPIE OpenUrl [41]. ↵ Shan , H. , Padole , A. , Homayounieh , F. , Kruger , U. , Khera , R.D. , Nitiwarangkul , C. , Kalra , M.K. , Wang , G. : Competitive performance of a modularized deep neural network compared to commercial algorithms for low-dose ct image reconstruction . Nature Machine Intelligence 1 ( 6 ), 269 – 276 ( 2019 ) OpenUrl [42]. ↵ Flohr , T.G. , McCollough , C.H. , Bruder , H. , Petersilka , M. , Gruber , K. , Süβ , C. , Grasruck , M. , Stierstorfer , K. , Krauss , B. , Raupach , R. , et al : First performance evaluation of a dual-source ct (dsct) system . European radiology 16 ( 2 ), 256 – 268 ( 2006 ) OpenUrl CrossRef PubMed Web of Science [43]. ↵ Primak , A. , Ramirez Giraldo , J. , Liu , X. , Yu , L. , McCollough , C.H. : Improved dual-energy material discrimination for dual-source ct by means of additional spectral filtration . Medical physics 36 ( 4 ), 1359 – 1369 ( 2009 ) OpenUrl CrossRef PubMed [44]. ↵ Genzel , M. , Gühring , I. , Macdonald , J. , März , M. : Near-exact recovery for tomographic inverse problems via deep learning . In: International Conference on Machine Learning , pp. 7368 – 7381 ( 2022 ). PMLR [45]. ↵ Würfl , T. , Hoffmann , M. , Christlein , V. , Breininger , K. , Huang , Y. , Unberath , M. , Maier , A.K. : Deep learning computed tomography: Learning projection-domain weights from image domain in limited angle problems . IEEE transactions on medical imaging 37 ( 6 ), 1454 – 1463 ( 2018 ) OpenUrl [46]. ↵ Syben , C. , Michen , M. , Stimpel , B. , Seitz , S. , Ploner , S. , Maier , A.K. : Pyro-nn: Python reconstruction operators in neural networks . Medical physics 46 ( 11 ), 5110 – 5115 ( 2019 ) OpenUrl [47]. Hu , J. , Shen , L. , Sun , G. : Squeeze-and-excitation networks . In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition , pp. 7132 – 7141 ( 2018 ) [48]. Vaswani , A. , Shazeer , N. , Parmar , N. , Uszkoreit , J. , Jones , L. , Gomez , A.N. , Kaiser , L. , Polosukhin , I. : Attention is all you need . Advances in neural information processing systems 30 ( 2017 ) [49]. Ma , G. , Zhang , Y. , Zhao , X. , Wang , T. , Li , H. : A neural network with encoded visible edge prior for limited-angle computed tomography reconstruction . Medical Physics 48 ( 10 ), 6464 – 6481 ( 2021 ) OpenUrl [50]. ↵ Reiser , I. , Nishikawa , R. : Task-based assessment of breast tomosynthesis: effect of acquisition parameters and quantum noise a . Medical physics 37 ( 4 ), 1591 – 1600 ( 2010 ) OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted January 23, 2024. Download PDF Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Dual-domain joint learning reconstruction method (JLRM) combined with physical process for spectral computed tomography Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Dual-domain joint learning reconstruction method (JLRM) combined with physical process for spectral computed tomography Genwei Ma , Xing Zhao medRxiv 2024.01.22.24301600; doi: https://doi.org/10.1101/2024.01.22.24301600 Share This Article: Copy Citation Tools Dual-domain joint learning reconstruction method (JLRM) combined with physical process for spectral computed tomography Genwei Ma , Xing Zhao medRxiv 2024.01.22.24301600; doi: https://doi.org/10.1101/2024.01.22.24301600 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Radiology and Imaging Subject Areas All Articles Addiction Medicine (573) Allergy and Immunology (865) Anesthesia (302) Cardiovascular Medicine (4456) Dentistry and Oral Medicine (445) Dermatology (383) Emergency Medicine (610) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1515) Epidemiology (15244) Forensic Medicine (30) Gastroenterology (1132) Genetic and Genomic Medicine (6618) Geriatric Medicine (669) Health Economics (1002) Health Informatics (4556) Health Policy (1372) Health Systems and Quality Improvement (1614) Hematology (543) HIV/AIDS (1270) Infectious Diseases (except HIV/AIDS) (15932) Intensive Care and Critical Care Medicine (1106) Medical Education (624) Medical Ethics (147) Nephrology (670) Neurology (6632) Nursing (346) Nutrition (999) Obstetrics and Gynecology (1148) Occupational and Environmental Health (957) Oncology (3347) Ophthalmology (980) Orthopedics (369) Otolaryngology (421) Pain Medicine (436) Palliative Medicine (130) Pathology (665) Pediatrics (1696) Pharmacology and Therapeutics (693) Primary Care Research (714) Psychiatry and Clinical Psychology (5463) Public and Global Health (9254) Radiology and Imaging (2210) Rehabilitation Medicine and Physical Therapy (1371) Respiratory Medicine (1197) Rheumatology (598) Sexual and Reproductive Health (715) Sports Medicine (532) Surgery (714) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a03080ca0970ad07',t:'MTc4MDAwNTMyMQ=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2024) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00