Biography
Marco Cagnazzo obtained the Laurea (equivalent to the M.S.) degree in Telecommunication Engineering from the Federico II University (Napoli, Italy) in 2002 and the Ph.D. degree in Information and Communication Technology from the Federico II University and the University of Nice-Sophia Antipolis (France) in 2005, defending a doctoral thesis entitled “Wavelet transform and three-dimensional data compression”.
He obtained research grants from the CNIT national laboratory of multimedia communication and from the Centro Regionale di Competenze sull’ICT, and was a post-doctoral fellow with the CReATIVe team at the I3S laboratory in Sophia Antipolis (France). Marco Cagnazzo was appointed full professor at Telecom-Paris in December 2018, within the Multimedia team, which he had joined as maître de conférences (roughly equivalent to associate professor) in 2008. He obtained the Habilitation à Diriger des Recherches from the Université Pierre et Marie Curie (Paris) in September 2013. He was responsible for the Multimedia team from December 2015 to September 2021. Since December 2021 he has been an Associate Professor at the University of Padua and an Invited Full Professor at Telecom-Paris.
Marco Cagnazzo has been an Associate Editor for IEEE Transactions on Circuits and Systems for Video Technology and for IEEE Signal Processing Letters and is Area Editor for Elsevier Signal Processing: Image Communication. Since 2017, he has been a member of the IEEE SPS Technical Committee on Image, Video, and Multidimensional Signal Processing (IVMSP) and of the board of the main French society on signal processing, the GRETSI (Groupe de Recherche sur le Traitement du Signal et des Images).
Moreover, he regularly serves as a reviewer for several journals (among which IEEE Transactions on Image Processing, IEEE Transactions on Circuits and Systems for Video Technology, and IEEE Transactions on Signal Processing), and as reviewer and/or area chair for such conferences as IEEE ICIP, IEEE ICASSP, Eurasip EUSIPCO, IEEE MMSP, IEEE ICME.
He has been an IEEE Senior Member since February 2011.
He has been on the organizing committees of the 2010 IEEE International Workshop MMSP (Electronic Media Chair) and of the European Workshop on Visual Information Processing EUVIP (Local Arrangement). Moreover, he served as Publicity Chair for EUSIPCO 2012 (Bucharest) and Award Chair for ICIP 2014 (Paris).
Marco Cagnazzo speaks Italian (his mother tongue), English, and French.
Research areas
Publications
2023
Garus, P.; Milovanovic, M.; Jung, J.; Cagnazzo, M.
MPEG immersive video Book Chapter
In: Immersive Video Technologies, pp. 327–356, Academic Press, 2023.
@inbook{11577_3469279,
  author     = {Garus, P. and Milovanovic, M. and Jung, J. and Cagnazzo, M.},
  title      = {{MPEG} immersive video},
  booktitle  = {Immersive Video Technologies},
  pages      = {327--356},
  publisher  = {Academic Press},
  year       = {2023},
  date       = {2023-01-01},
  doi        = {10.1016/B978-0-32-391755-1.00018-3},
  url        = {https://doi.org/10.1016/B978-0-32-391755-1.00018-3},
  urldate    = {2023-01-01},
  abstract   = {MPEG immersive video (MIV) is a novel standard, enabling the compression of volumetric video content. In this chapter, we describe MIV, its tools, and its profiles. Given that MIV is a video-based solution, the texture and geometry information is coded using available 2D video codecs, which are independent of MIV. We present the performance of MIV with several state-of-the-art 2D codecs: VVC, AV1, and AVS3, highlighting that the eventual success of MIV does not depend on the market share of any particular 2D codec. However, using suitable tools for the coding of MIV texture or depth map atlases is an important requirement for efficient compression of immersive video. In this context, we present results related to screen content coding tools of VVC and show their potential for the compression of MIV atlases.},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {inbook}
}
2022
Milovanovic, Marta; Henry, Félix; Cagnazzo, Marco
Depth Patch Selection for Decoder-Side Depth Estimation in MPEG Immersive Video Conference
Picture Coding Symposium, IEEE, 2022.
@conference{11577_3469276,
  author     = {Milovanovic, Marta and Henry, F{\'e}lix and Cagnazzo, Marco},
  title      = {Depth Patch Selection for Decoder-Side Depth Estimation in {MPEG} Immersive Video},
  booktitle  = {Picture Coding Symposium},
  pages      = {343--347},
  publisher  = {IEEE},
  year       = {2022},
  date       = {2022-01-01},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {conference}
}
Karagkioules, Theodoros; Paschos, Georgios S.; Liakopoulos, Nikolaos; Fiandrotti, Attilio; Tsilimantos, Dimitrios; Cagnazzo, Marco
Online Learning for Adaptive Video Streaming in Mobile Networks Journal Article
In: ACM TRANSACTIONS ON MULTIMEDIA COMPUTING, COMMUNICATIONS AND APPLICATIONS, vol. 18, no. 1, pp. 1–22, 2022.
@article{11577_3454207,
  author     = {Karagkioules, Theodoros and Paschos, Georgios S. and Liakopoulos, Nikolaos and Fiandrotti, Attilio and Tsilimantos, Dimitrios and Cagnazzo, Marco},
  title      = {Online Learning for Adaptive Video Streaming in Mobile Networks},
  journal    = {{ACM} Transactions on Multimedia Computing, Communications and Applications},
  volume     = {18},
  number     = {1},
  pages      = {1--22},
  publisher  = {ACM},
  year       = {2022},
  date       = {2022-01-01},
  doi        = {10.1145/3460819},
  url        = {https://dl.acm.org/doi/10.1145/3460819},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {article}
}
Vijayaratnam, Melan; Cagnazzo, Marco; Valenzise, Giuseppe; Trioux, Anthony; Kieffer, Michel
Towards zero-latency video transmission through frame extrapolation Conference
IEEE International Conference on Image Processing, 2022.
@conference{11577_3469277,
  author     = {Vijayaratnam, Melan and Cagnazzo, Marco and Valenzise, Giuseppe and Trioux, Anthony and Kieffer, Michel},
  title      = {Towards zero-latency video transmission through frame extrapolation},
  booktitle  = {IEEE International Conference on Image Processing},
  pages      = {2122--2126},
  year       = {2022},
  date       = {2022-01-01},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {conference}
}
Vijayaratnam, Melan; Cagnazzo, Marco; Valenzise, Giuseppe; Trioux, Anthony; Kieffer, Michel
Vers une transmission vidéo sans latence par l’extrapolation d’images Conference
XXVIIIème Colloque Francophone de Traitement du Signal et des Images, 2022.
@conference{11577_3469278,
  author     = {Vijayaratnam, Melan and Cagnazzo, Marco and Valenzise, Giuseppe and Trioux, Anthony and Kieffer, Michel},
  title      = {Vers une transmission vidéo sans latence par l'extrapolation d'images},
  booktitle  = {XXVIIIème Colloque Francophone de Traitement du Signal et des Images},
  year       = {2022},
  date       = {2022-01-01},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {conference}
}
2021
Chen, Zhibo; Herglotz, Christian; Cagnazzo, Marco
Editorial to the Special Section on Optimized Image/Video Coding Based on Deep Learning Journal Article
In: IEEE OPEN JOURNAL OF CIRCUITS AND SYSTEMS, vol. 2, pp. 611–612, 2021.
@article{11577_3469280,
  author     = {Chen, Zhibo and Herglotz, Christian and Cagnazzo, Marco},
  title      = {Editorial to the Special Section on Optimized Image/Video Coding Based on Deep Learning},
  journal    = {{IEEE} Open Journal of Circuits and Systems},
  volume     = {2},
  pages      = {611--612},
  publisher  = {IEEE},
  year       = {2021},
  date       = {2021-01-01},
  abstract   = {This Special Section of the IEEE Open Journal of Circuits and Systems is dedicated to a collection of articles on Optimized Image/Video Coding based on Deep Learning, to promote techniques in algorithms, implementations, and applications in this highly active field of research. This Special Section covers articles in three categories including end-to-end image/video coding optimization, learning techniques for optimizing traditional image/video codecs, and coding for machine vision applications.},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {article}
}
Hobloss, Nour; Zhang, Lu; Cagnazzo, Marco
A Multi-View Stereoscopic Video Database With Green Screen (MTF) For Video Transition Quality-of-Experience Assessment Conference
2021 13th International Conference on Quality of Multimedia Experience (QoMEX), 2021.
@conference{11577_3469283,
  author     = {Hobloss, Nour and Zhang, Lu and Cagnazzo, Marco},
  title      = {A Multi-View Stereoscopic Video Database With Green Screen ({MTF}) For Video Transition Quality-of-Experience Assessment},
  booktitle  = {2021 13th International Conference on Quality of Multimedia Experience ({QoMEX})},
  year       = {2021},
  date       = {2021-01-01},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {conference}
}
Tworski, Marcelin; Lathuilière, Stéphane; Belkarfa, Salim; Fiandrotti, Attilio; Cagnazzo, Marco
DR2S: Deep Regression with Region Selection for Camera Quality Evaluation Conference
2020 25th International Conference on Pattern Recognition (ICPR), 2021.
@conference{11577_3469285,
  author     = {Tworski, Marcelin and Lathuili{\`e}re, St{\'e}phane and Belkarfa, Salim and Fiandrotti, Attilio and Cagnazzo, Marco},
  title      = {{DR2S}: Deep Regression with Region Selection for Camera Quality Evaluation},
  booktitle  = {2020 25th International Conference on Pattern Recognition ({ICPR})},
  pages      = {6173--6180},
  year       = {2021},
  date       = {2021-01-01},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {conference}
}
Tartaglione, Enzo; Lathuilière, Stéphane; Fiandrotti, Attilio; Cagnazzo, Marco; Grangetto, Marco
HEMP: High-order entropy minimization for neural network compression Journal Article
In: NEUROCOMPUTING, vol. 461, pp. 244–253, 2021.
@article{11577_3469257,
  author     = {Tartaglione, Enzo and Lathuili{\`e}re, St{\'e}phane and Fiandrotti, Attilio and Cagnazzo, Marco and Grangetto, Marco},
  title      = {{HEMP}: High-order entropy minimization for neural network compression},
  journal    = {Neurocomputing},
  volume     = {461},
  pages      = {244--253},
  publisher  = {Elsevier},
  year       = {2021},
  date       = {2021-01-01},
  doi        = {10.1016/j.neucom.2021.07.022},
  url        = {https://doi.org/10.1016/j.neucom.2021.07.022},
  abstract   = {We formulate the entropy of a quantized artificial neural network as a differentiable function that can be plugged as a regularization term into the cost function minimized by gradient descent. Our formulation scales efficiently beyond the first order and is agnostic of the quantization scheme. The network can then be trained to minimize the entropy of the quantized parameters, so that they can be optimally compressed via entropy coding. We experiment with our entropy formulation at quantizing and compressing well-known network architectures over multiple datasets. Our approach compares favorably over similar methods, enjoying the benefits of higher order entropy estimate, showing flexibility towards non-uniform quantization (we use Lloyd-max quantization), scalability towards any entropy order to be minimized and efficiency in terms of compression. We show that HEMP is able to work in synergy with other approaches aiming at pruning or quantizing the model itself, delivering significant benefits in terms of storage size compressibility without harming the model’s performance.},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {article}
}
Trioux, Anthony; Valenzise, Giuseppe; Cagnazzo, Marco; Kieffer, Michel; Coudoux, François-Xavier; Corlay, Patrick; Gharbi, Mohamed
A Perceptual Study of the Decoding Process of the SoftCast Wireless Video Broadcast Scheme Conference
2021 IEEE 23rd International Workshop on Multimedia Signal Processing (MMSP), 2021.
@conference{11577_3469282,
  author     = {Trioux, Anthony and Valenzise, Giuseppe and Cagnazzo, Marco and Kieffer, Michel and Coudoux, Fran{\c{c}}ois-Xavier and Corlay, Patrick and Gharbi, Mohamed},
  title      = {A Perceptual Study of the Decoding Process of the {SoftCast} Wireless Video Broadcast Scheme},
  booktitle  = {2021 {IEEE} 23rd International Workshop on Multimedia Signal Processing ({MMSP})},
  year       = {2021},
  date       = {2021-01-01},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {conference}
}
Milovanovic, Marta; Jung, Joël; Cagnazzo, Marco
Patch decoder-side depth estimation in MPEG immersive video Conference
2021 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), 2021.
@conference{11577_3469284,
  author     = {Milovanovic, Marta and Jung, Jo{\"e}l and Cagnazzo, Marco},
  title      = {Patch decoder-side depth estimation in {MPEG} immersive video},
  booktitle  = {2021 {IEEE} International Conference on Acoustics, Speech and Signal Processing ({ICASSP})},
  year       = {2021},
  date       = {2021-01-01},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {conference}
}
Hobloss, N.; Zhang, L.; Lathuiliere, S.; Cagnazzo, M.; Fiandrotti, A.
Hybrid dual stream blender for wide baseline view synthesis Journal Article
In: SIGNAL PROCESSING-IMAGE COMMUNICATION, vol. 97, 2021.
@article{11577_3451587,
  author     = {Hobloss, Nour and Zhang, Lu and Lathuili{\`e}re, St{\'e}phane and Cagnazzo, Marco and Fiandrotti, Attilio},
  title      = {Hybrid dual stream blender for wide baseline view synthesis},
  journal    = {Signal Processing: Image Communication},
  volume     = {97},
  year       = {2021},
  date       = {2021-01-01},
  doi        = {10.1016/j.image.2021.116366},
  url        = {https://www.sciencedirect.com/science/article/pii/S0923596521001685},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {article}
}
2020
Nasrallah, Anthony; Guionnet, Thomas; Abdoli, Mohsen; Cagnazzo, Marco; Fiandrotti, Attilio
METHOD FOR IMAGE PROCESSING AND APPARATUS FOR IMPLEMENTING THE SAME Miscellaneous
2020.
@misc{11577_3471606,
  author     = {Nasrallah, Anthony and Guionnet, Thomas and Abdoli, Mohsen and Cagnazzo, Marco and Fiandrotti, Attilio},
  title      = {Method for Image Processing and Apparatus for Implementing the Same},
  year       = {2020},
  date       = {2020-01-01},
  abstract   = {A method of processing a first image in a first plurality of images, wherein the first image is divided into a plurality of pixel blocks, is proposed, which comprises, for a current block of the first image: selecting, in a set of a plurality of predefined interpolation filters, an interpolation filter based on a prediction of an interpolation filter determined by a supervised learning algorithm to which data related to the current block is input; and using the selected interpolation filter for calculating fractional pixel values in a second image of the plurality of images for a temporal prediction of pixels of the current block based on a reference block correlated to the current block in the second image, wherein the second image is distinct from the first image and was previously encoded according to an image encoding sequence for encoding the images of the plurality of images.},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {misc}
}
Rhammad, A El; Gioia, P; Gilles, A; Cagnazzo, Marco
Progressive hologram transmission using a view-dependent scalable compression scheme Journal Article
In: ANNALES DES TÉLÉCOMMUNICATIONS, vol. 75, no. 5-6, pp. 201–214, 2020.
@article{11577_3469271,
  author     = {El Rhammad, Anas and Gioia, Patrick and Gilles, Antonin and Cagnazzo, Marco},
  title      = {Progressive hologram transmission using a view-dependent scalable compression scheme},
  journal    = {Annales des T{\'e}l{\'e}communications},
  volume     = {75},
  number     = {5-6},
  pages      = {201--214},
  year       = {2020},
  date       = {2020-01-01},
  doi        = {10.1007/s12243-019-00741-7},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {article}
}
Zheng, Shuo; Cagnazzo, Marco; Kieffer, Michel
Channel Impulsive Noise Mitigation for Linear Video Coding Schemes Journal Article
In: IEEE TRANSACTIONS ON CIRCUITS AND SYSTEMS FOR VIDEO TECHNOLOGY, vol. 30, no. 9, pp. 3196–3209, 2020.
@article{11577_3469258,
  author     = {Zheng, Shuo and Cagnazzo, Marco and Kieffer, Michel},
  title      = {Channel Impulsive Noise Mitigation for Linear Video Coding Schemes},
  journal    = {{IEEE} Transactions on Circuits and Systems for Video Technology},
  volume     = {30},
  number     = {9},
  pages      = {3196--3209},
  year       = {2020},
  date       = {2020-01-01},
  doi        = {10.1109/TCSVT.2019.2937451},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {article}
}
Trioux, A.; Valenzise, G.; Cagnazzo, M.; Kieffer, M.; Coudoux, F. -X.; Corlay, P.; Gharbi, M.
Subjective and Objective Quality Assessment of the SoftCast Video Transmission Scheme Conference
2020 IEEE International Conference on Visual Communications and Image Processing, VCIP 2020, Institute of Electrical and Electronics Engineers Inc., 2020, ISBN: 978-1-7281-8068-7.
@conference{11577_3469351,
  author     = {Trioux, Anthony and Valenzise, Giuseppe and Cagnazzo, Marco and Kieffer, Michel and Coudoux, Fran{\c{c}}ois-Xavier and Corlay, Patrick and Gharbi, Mohamed},
  title      = {Subjective and Objective Quality Assessment of the {SoftCast} Video Transmission Scheme},
  booktitle  = {2020 {IEEE} International Conference on Visual Communications and Image Processing, {VCIP} 2020},
  pages      = {96--99},
  publisher  = {Institute of Electrical and Electronics Engineers Inc.},
  year       = {2020},
  date       = {2020-01-01},
  doi        = {10.1109/VCIP49819.2020.9301778},
  isbn       = {978-1-7281-8068-7},
  abstract   = {SoftCast-based linear video coding and transmission (LVCT) schemes have been proposed as a promising alternative to traditional video coding and transmission schemes in wireless environments. Currently, the performance of LVCT schemes is evaluated by means of traditional objective scores such as PSNR or SSIM. Nevertheless, since the compression is performed in a very different way from traditional coding schemes such as HEVC, visual artifacts are also quite different and deserve to be subjectively assessed. In this paper, we propose a subjective quality assessment of SoftCast, pioneer and standard of the LVCT schemes. This study aims to better understand the trade-offs between the LVCT parameters that can be tuned to improve the quality. These parameters, including different GoP-sizes, Compression Ratios (CR) and Channel Signal-to-Noise Ratio (CSNR), are used to generate a dataset of 85 videos. A Double Stimulus Impairment Scale (DSIS) test is performed on the received videos to assess the perceived quality. Results show that the key characteristic of SoftCast, the linear relation between CSNR and PSNR, is also observed with the Mean-Opinion Scores (MOS), except at high CSNR where the quality saturates. In addition, Bjontegaard model is used to quantify the trade-offs between CR, GoP-size and CSNR, depending on the intended application. Finally, the performance of objective metrics compared to the obtained MOS is evaluated. Results show that Multi-Scale SSIM (MS-SSIM), SSIM and Video Multimethod Assessment Fusion (VMAF) metrics offer the best correlation with the MOS values.},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {conference}
}
2019
RHAMMAD, Anas EL; Gilles, Antonin; Gioia, Patrick; Cagnazzo, Marco
METHOD AND DEVICE FOR TRANSMITTING DATA REPRESENTING A DIGITAL HOLOGRAM Miscellaneous
2019.
@misc{11577_3472307,
  author     = {El Rhammad, Anas and Gilles, Antonin and Gioia, Patrick and Cagnazzo, Marco},
  title      = {Method and Device for Transmitting Data Representing a Digital Hologram},
  year       = {2019},
  date       = {2019-01-01},
  abstract   = {A method for transmitting data representing a digital hologram (H) represented by a set of atoms (ak) each having a diffraction spectrum (Sk) in an observation plane (PO) comprising the following steps: - determining an order for the sets (ak) each comprising at least one atom (ak), as a function of a distance, in the observation plane (PO), between an observation position (O) and a position (Ck) associated with the relevant set (ak); - transmitting, for at least part of said sets (ak) and in the determined order, descriptive data of said at least one atom (ak) included in the relevant set (ak). An associated transmission device is also described.},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {misc}
}
Zheng, S; Cagnazzo, Marco; Kieffer, M
Optimal and suboptimal channel precoding and decoding matrices for linear video coding Journal Article
In: SIGNAL PROCESSING-IMAGE COMMUNICATION, vol. 78, pp. 135–151, 2019.
@article{11577_3469272,
  author     = {Zheng, Shuo and Cagnazzo, Marco and Kieffer, Michel},
  title      = {Optimal and suboptimal channel precoding and decoding matrices for linear video coding},
  journal    = {Signal Processing: Image Communication},
  volume     = {78},
  pages      = {135--151},
  year       = {2019},
  date       = {2019-01-01},
  doi        = {10.1016/j.image.2019.06.011},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {article}
}
Mitrica, I; Mercier, E; Ruellan, C; Fiandrotti, A; Cagnazzo, Marco; Pesquet-Popescu, B
Very Low Bitrate Semantic Compression of Airplane Cockpit Screen Content Journal Article
In: IEEE TRANSACTIONS ON MULTIMEDIA, vol. 21, no. 9, pp. 2157–2170, 2019.
@article{11577_3469273,
  author     = {Mitrica, I. and Mercier, E. and Ruellan, Christophe and Fiandrotti, Attilio and Cagnazzo, Marco and Pesquet-Popescu, B.},
  title      = {Very Low Bitrate Semantic Compression of Airplane Cockpit Screen Content},
  journal    = {{IEEE} Transactions on Multimedia},
  volume     = {21},
  number     = {9},
  pages      = {2157--2170},
  year       = {2019},
  date       = {2019-01-01},
  doi        = {10.1109/TMM.2019.2900168},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {article}
}
Cagnazzo, Marco; Fiandrotti, Attilio; Ruellan, Christophe
METHOD FOR COMPRESSING A SEQUENCE OF IMAGES DISPLAYING SYNTHETIC GRAPHICAL ELEMENTS OF NON-PHOTOGRAPHIC ORIGIN Miscellaneous
2019.
@misc{11577_3472305,
  author     = {Cagnazzo, Marco and Fiandrotti, Attilio and Ruellan, Christophe},
  title      = {Method for Compressing a Sequence of Images Displaying Synthetic Graphical Elements of Non-Photographic Origin},
  year       = {2019},
  date       = {2019-01-01},
  abstract   = {Method for compressing a sequence of images comprising a first image and a second image, the method comprising the steps of: generating (102) a first descriptor comprising parameters for displaying a computer-generated graphical element in the first image, the graphical element being of non-photographic origin, and the display parameters not comprising pixel values; processing the second image so as to determine (208) an event which gave rise to a potential variation in the parameters for displaying the graphical element between the first image and the second image; generating (210) a second descriptor comprising an event code indicating the determined event.},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {misc}
}
Rhammad, A. El; Gioia, P.; Gilles, A.; Cagnazzo, M.
Towards practical hologram streaming using progressive coding Conference
Proceedings of SPIE – The International Society for Optical Engineering, vol. 11137, SPIE, 2019.
@conference{11577_3469353,
  author     = {El Rhammad, A. and Gioia, P. and Gilles, A. and Cagnazzo, M.},
  title      = {Towards practical hologram streaming using progressive coding},
  booktitle  = {Proceedings of {SPIE} - The International Society for Optical Engineering},
  volume     = {11137},
  publisher  = {SPIE},
  year       = {2019},
  date       = {2019-01-01},
  doi        = {10.1117/12.2529202},
  abstract   = {Digital holography is an emerging technology for 3D visualization which is expected to dethrone conventional stereoscopic devices in the future. Aside from their specific signal properties, high quality holograms with broad viewing angles contain massive amount of data. For a reasonable transmission time, efficient scalable compression schemes are needed to bridge the gap between the overwhelming volume of data and the limited bandwidth of the communication channels. The viewpoint scalability is a powerful property since it allows to encode and transmit only the information corresponding to the observer's view. However, this approach imposes an online encoding at the server which may increase the latency of the transmission chain. To overcome this hurdle, we propose a scalable compression framework based on Gabor-wavelets decomposition, where the whole hologram is encoded offline. First, the observer plane is divided into spatial blocks. Then, the Gabor atoms are assigned to these blocks by exploiting the duality between Gabor wavelets and light rays. The atoms of each block are then classified into different layers according to their importance for the reconstruction and encoded in packets. At the decoder side, the atoms' packets are progressively decoded based on the viewer's position. Then, the corresponding sub-hologram is generated using a GPU implementation. Results show that our approach enables a practical progressive streaming of digital holograms with a low latency.},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {conference}
}
Rhammad, A. E.; Gioia, P.; Gilles, A.; Cagnazzo, M.
Scalable Coding Framework for a View-Dependent Streaming of Digital Holograms Conference
Proceedings – International Conference on Image Processing, ICIP, vol. 2019-, IEEE Computer Society, 2019.
@conference{11577_3469357,
  author     = {El Rhammad, A. and Gioia, P. and Gilles, A. and Cagnazzo, M.},
  title      = {Scalable Coding Framework for a View-Dependent Streaming of Digital Holograms},
  booktitle  = {Proceedings - International Conference on Image Processing, {ICIP}},
  pages      = {146--150},
  publisher  = {IEEE Computer Society},
  year       = {2019},
  date       = {2019-01-01},
  doi        = {10.1109/ICIP.2019.8802950},
  abstract   = {Unlike conventional images and videos, digital holograms contain large amounts of data with very low redundancy. Consequently, current communication networks may be not able to meet the bandwidth requirements for hologram transmission in reasonable time. To enable practical streaming of holographic contents, we propose a progressive coding method that combines quality scalability with viewpoint scalability. From a Gabor wavelets decomposition of the hologram, the server starts by selecting the coefficients corresponding to the user's viewpoint. Then, the selected coefficients are encoded progressively according to their importance for the reconstructed view. Experimental results reveal that our approach outperforms conventional scalable codecs and enables the streaming of holographic data with a better quality of experience.},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {conference}
}
Hobloss, N.; Purica, A.; Fiandrotti, A.; Cagnazzo, M.; Cozot, R.; Hamidouche, W.
A Hybrid Approach to Wide Baseline View Synthesis with Convolutional Neural Networks Conference
2019 International Conference on 3D Immersion, IC3D 2019 – Proceedings, vol. 2019-, Institute of Electrical and Electronics Engineers Inc., 2019, ISBN: 978-1-7281-5189-2.
@conference{11577_3469356,
  author     = {Hobloss, N. and Purica, A. and Fiandrotti, A. and Cagnazzo, M. and Cozot, R. and Hamidouche, W.},
  title      = {A Hybrid Approach to Wide Baseline View Synthesis with Convolutional Neural Networks},
  booktitle  = {2019 International Conference on 3D Immersion, {IC3D} 2019 - Proceedings},
  pages      = {1--7},
  publisher  = {Institute of Electrical and Electronics Engineers Inc.},
  year       = {2019},
  date       = {2019-01-01},
  doi        = {10.1109/IC3D48390.2019.8976000},
  isbn       = {978-1-7281-5189-2},
  abstract   = {Convolutional Neural Networks (CNN) have been recently employed for implementing complete end-to-end view synthesis architectures, from reference view warping to target view blending while dealing with occlusions as well. However, the convolutional sizes filters must increase with the distance between reference views, making all-convolutional approaches prohibitively complex for wide baseline setups. In this work we propose a hybrid approach to view synthesis where we first warp the reference views resolving the occlusions, and then we train a simpler convolutional architecture for blending the preprocessed views. By warping the reference views, we reduce the equivalent distance between reference views, allowing the use of smaller convolutional filters and thus lower network complexity. We experimentally show that our method performs favorably against both traditional and convolutional synthesis methods while retaining lower complexity with respect to the latter.},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {conference}
}
Wang, L.; Fiandrotti, A.; Purica, A.; Valenzise, G.; Cagnazzo, M.
Enhancing HEVC Spatial Prediction by Context-based Learning Conference
ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing – Proceedings, vol. 2019-, Institute of Electrical and Electronics Engineers Inc., 2019.
@conference{11577_3469355,
  author     = {Wang, L. and Fiandrotti, A. and Purica, A. and Valenzise, G. and Cagnazzo, M.},
  title      = {Enhancing {HEVC} Spatial Prediction by Context-based Learning},
  booktitle  = {{ICASSP}, {IEEE} International Conference on Acoustics, Speech and Signal Processing - Proceedings},
  pages      = {4035--4039},
  publisher  = {Institute of Electrical and Electronics Engineers Inc.},
  year       = {2019},
  date       = {2019-01-01},
  doi        = {10.1109/ICASSP.2019.8683624},
  abstract   = {Deep generative models have been recently employed to compress images, image residuals or to predict image regions. Based on the observation that state-of-the-art spatial prediction is highly optimized from a rate-distortion point of view, in this work we study how learning-based approaches might be used to further enhance this prediction. To this end, we propose an encoder-decoder convolutional network able to reduce the energy of the residuals of HEVC intra prediction, by leveraging the available context of previously decoded neighboring blocks. The proposed context-based prediction enhancement (CBPE) scheme enables to reduce the mean square error of HEVC prediction by 25% on average, without any additional signalling cost in the bitstream.},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {conference}
}
Nikitin, P.; Jung, J.; Cagnazzo, M.; Fiandrotti, A.
Exploiting View synthesis for super-multiview video compression Conference
ACM International Conference Proceeding Series, Association for Computing Machinery, 2019, ISBN: 9781450371896.
@conference{11577_3469354,
  author     = {Nikitin, P. and Jung, J. and Cagnazzo, M. and Fiandrotti, A.},
  title      = {Exploiting View synthesis for super-multiview video compression},
  booktitle  = {ACM International Conference Proceeding Series},
  pages      = {1--6},
  publisher  = {Association for Computing Machinery},
  year       = {2019},
  date       = {2019-01-01},
  doi        = {10.1145/3349801.3349820},
  isbn       = {9781450371896},
  abstract   = {Super-multiview video consists in a 2D arrangement of cameras acquiring the same scene and it is a well-suited format for immersive and free navigation video services. However, the large number of acquired viewpoints calls for extremely effective compression tools. View synthesis allows to reconstruct a viewpoint using nearby cameras texture and depth information. In this work we explore the potential of recent advances in view synthesis algorithms to enhance the compression performances of super-multiview video. Towards this end we consider five methods that replace one viewpoint with a synthesized view, possibly enhanced with some side information. Our experiments suggest that, if the geometry information (i.e. depth map) is reliable, these methods have the potential to improve rate-distortion performance with respect to traditional approaches, at least for some specific content and configuration. Moreover, our results shed some light about how to further improve compression performance by integrating new view-synthesis prediction tools within a 3D video encoder.},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {conference}
}
Mitrica, I.; Fiandrotti, A.; Cagnazzo, M.; Mercier, E.; Ruellan, C.
Cockpit Video Coding with Temporal Prediction Conference
EUVIP, vol. 2019-October, 2019.
@conference{11577_3469350,
  author     = {Mitrica, I. and Fiandrotti, A. and Cagnazzo, M. and Mercier, E. and Ruellan, C.},
  title      = {Cockpit Video Coding with Temporal Prediction},
  booktitle  = {European Workshop on Visual Information Processing ({EUVIP})},
  pages      = {28--33},
  year       = {2019},
  month      = oct,
  date       = {2019-01-01},
  doi        = {10.1109/EUVIP47703.2019.8946234},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {conference}
}
Nikitin, P.; Cagnazzo, M.; Jung, J.
Compression Improvement via Reference Organization for 2D-multiview Content Conference
ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing – Proceedings, vol. 2019-, Institute of Electrical and Electronics Engineers Inc., 2019.
@conference{11577_3469352,
  author    = {P. Nikitin and M. Cagnazzo and J. Jung},
  title     = {Compression Improvement via Reference Organization for 2D-multiview Content},
  booktitle = {ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing - Proceedings},
  pages     = {1612--1616},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  year      = {2019},
  date      = {2019-01-01},
  doi       = {10.1109/ICASSP.2019.8682999},
  abstract  = {One of the most challenging goals of future immersive services is to enable the observation of a scene from any viewpoint, thus making free-navigation possible under certain constraints. In order to provide such kind of services with smooth navigation, a huge amount of views should be available on the client's device. In particular, it is important for the case of 2D-multiview content, where cameras are positioned on a 2D grid in order to provide both horizontal and vertical parallax. This kind of content requires a large coding rate; therefore improving the compression performance of video encoders is especially relevant in this case. This paper studies how the encoder configuration affects the compression, by taking into account the spatial position of each camera. Four parameters are addressed in this work: coding order of the views, the number of reference lists, the number of reference pictures, and the ordering of pictures in the reference lists. An average of 12.0% bitrate saving is achieved for medium bitrate and 11.1% for low bitrate compared to the state of the art techniques.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}
2018
Zheng, S.; Cagnazzo, M.; Kieffer, M.
Precoding Matrix Design in Linear Video Coding Conference
ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing – Proceedings, Institute of Electrical and Electronics Engineers Inc., 2018, ISBN: 978-1-5386-4658-8.
@conference{11577_3472323,
  author    = {S. Zheng and M. Cagnazzo and M. Kieffer},
  title     = {Precoding Matrix Design in Linear Video Coding},
  booktitle = {ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing - Proceedings},
  pages     = {1198--1202},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  year      = {2018},
  date      = {2018-01-01},
  doi       = {10.1109/ICASSP.2018.8461287},
  isbn      = {978-1-5386-4658-8},
  abstract  = {Linear video coding (LVC) is a promising alternative to classical video coding when video has to be transmitted to wireless receivers experiencing different and time-varying channel conditions. This paper addresses the LVC channel precoding and decoding matrix design when the transmission channel consists of several sub-channels, each with its own power constraint. Such constraints may be found, e.g., in multi-antenna, DSL, or powerline transmission systems. In a previous paper, it has been shown that this matrix design problem may be addressed by an adaptation to LVC of a multi-level water-filling solution proposed for MIMO channels. Here, two suboptimal low-complexity multi-level water-filling techniques are proposed, with different trade-offs between complexity and efficiency. Extensive simulations show that the suboptimal solutions perform very close to the optimal one, with a sensibly reduced complexity.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}
Rhammad, A. El; Gioia, P.; Gilles, A.; Cagnazzo, M.; Pesquet-Popescu, B.
View-dependent compression of digital hologram based on matching pursuit Conference
Proceedings of SPIE – The International Society for Optical Engineering, vol. 10679, SPIE, 2018.
@conference{11577_3469360,
  author    = { A. El Rhammad and P. Gioia and A. Gilles and M. Cagnazzo and B. Pesquet-Popescu},
  title     = {View-dependent compression of digital hologram based on matching pursuit},
  booktitle = {Proceedings of SPIE - The International Society for Optical Engineering},
  volume    = {10679},
  publisher = {SPIE},
  year      = {2018},
  date      = {2018-01-01},
  doi       = {10.1117/12.2315233},
  abstract  = {In this paper we investigate the suitability of Gabor Wavelets for an adaptive partial reconstruction of holograms based on the viewer position. Matching Pursuit is used for a sparse light rays decomposition of holographic patterns. At the decoding stage, sub-holograms are generated by selecting the diffracted rays corresponding to a specific area of visualization. The use of sub-holograms has been suggested in the literature as an alternative to full compression, by degrading a hologram with respect to the directional degrees of freedom. We present our approach in a complete framework for color digital holograms compression and explain, in details, how it can be efficiently exploited in the context of holographic Head-Mounted Displays. Among other aspects, encoding, adaptive reconstruction and selective degradation are studied.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}
Valenzise, G.; Purica, A.; Hulusic, V.; Cagnazzo, M.
Quality assessment of deep-learning-based image compression Conference
2018 IEEE 20th International Workshop on Multimedia Signal Processing, MMSP 2018, Institute of Electrical and Electronics Engineers Inc., 2018, ISBN: 978-1-5386-6070-6.
@conference{11577_3469358,
  author    = { G. Valenzise and A. Purica and V. Hulusic and M. Cagnazzo},
  title     = {Quality assessment of deep-learning-based image compression},
  booktitle = {2018 IEEE 20th International Workshop on Multimedia Signal Processing, MMSP 2018},
  pages     = {1--6},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  year      = {2018},
  date      = {2018-01-01},
  doi       = {10.1109/MMSP.2018.8547064},
  isbn      = {978-1-5386-6070-6},
  abstract  = {Image compression standards rely on predictive coding, transform coding, quantization and entropy coding, in order to achieve high compression performance. Very recently, deep generative models have been used to optimize or replace some of these operations, with very promising results. However, so far no systematic and independent study of the coding performance of these algorithms has been carried out. In this paper, for the first time, we conduct a subjective evaluation of two recent deep-learning-based image compression algorithms, comparing them to JPEG 2000 and to the recent BPG image codec based on HEVC Intra. We found that compression approaches based on deep auto-encoders can achieve coding performance higher than JPEG 2000, and sometimes as good as BPG. We also show experimentally that the PSNR metric is to be avoided when evaluating the visual quality of deep-learning-based methods, as their artifacts have different characteristics from those of DCT or wavelet-based codecs. In particular, images compressed at low bitrate appear more natural than JPEG 2000 coded pictures, according to a no-reference naturalness measure. Our study indicates that deep generative models are likely to bring huge innovation into the video coding arena in the coming years.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}
Rhammad, A. El; Gioia, P.; Gilles, A.; Cagnazzo, M.; Pesquet-Popescu, B.
Color digital hologram compression based on matching pursuit Journal Article
In: Applied Optics, vol. 57, no. 17, pp. 4930–4942, 2018.
@article{11577_3469275,
  author    = {A. El Rhammad and P. Gioia and A. Gilles and M. Cagnazzo and B. Pesquet-Popescu},
  title     = {Color digital hologram compression based on matching pursuit},
  journal   = {Applied Optics},
  volume    = {57},
  number    = {17},
  pages     = {4930--4942},
  year      = {2018},
  date      = {2018-01-01},
  urldate   = {2018-01-01},
  doi       = {10.1364/AO.57.004930},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {article}
}
2017
Mora, E. G.; Cagnazzo, M.; Dufaux, F.
AVC to HEVC transcoder based on quadtree limitation Journal Article
In: Multimedia Tools and Applications, vol. 76, no. 6, pp. 8991–9015, 2017.
@article{11577_3469361,
  author    = {E. G. Mora and M. Cagnazzo and F. Dufaux},
  title     = {AVC to HEVC transcoder based on quadtree limitation},
  journal   = {Multimedia Tools and Applications},
  volume    = {76},
  number    = {6},
  pages     = {8991--9015},
  publisher = {Springer New York LLC},
  year      = {2017},
  date      = {2017-01-01},
  doi       = {10.1007/s11042-016-3498-8},
  abstract  = {Following the finalization of the state-of-the-art High Efficiency Video Coding (HEVC) standard in January 2013, several new services are being deployed in order to take advantage of the superior coding efficiency (estimated at 50 % less bitrate for the same visual quality) that this standard provides over its predecessor: H.264 / Advanced Video Coding (AVC). However, the switch from AVC to HEVC is not trivial as most video content is still encoded in AVC. Consequently, there is a growing need for fast AVC to HEVC transcoders in the market today. While a trivial transcoder can be made by simply cascading an AVC decoder and an HEVC encoder, fast transcoding cannot be achieved. In this paper, we present an AVC to HEVC transcoder where decoded AVC blocks are first fused according to their motion similarity. The resulting fusion map is then used to limit the quadtree of HEVC coded frames. AVC motion vectors are also used to determine a better starting point for integer motion estimation. Experimental results show that significant transcoder execution time savings of 63 % can be obtained with only a 1.4 % bitrate increase compared to the trivial transcoder.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {article}
}
Nikitin, P.; Jung, J.; Cagnazzo, M.; Pesquet, B.
Impact of the Compression of Reference Views on View Synthesis Performance Miscellaneous
2017.
@misc{11577_3472321,
  author       = {P. Nikitin and J. Jung and M. Cagnazzo and B. Pesquet},
  title        = {Impact of the Compression of Reference Views on View Synthesis Performance},
  howpublished = {MPEG Document 40890. MPEG meeting (Turin, Italy) July 2017},
  year         = {2017},
  date         = {2017-01-01},
  keywords     = {},
  pubstate     = {published},
  tppubtype    = {misc}
}
Fiengo, A.; Chierchia, G.; Cagnazzo, M.; Pesquet-Popescu, B.
Rate allocation in predictive video coding using a convex optimization framework Journal Article
In: IEEE Transactions on Image Processing, vol. 26, no. 1, pp. 479–489, 2017.
@article{11577_3469362,
  author    = {A. Fiengo and G. Chierchia and M. Cagnazzo and B. Pesquet-Popescu},
  title     = {Rate allocation in predictive video coding using a convex optimization framework},
  journal   = {IEEE Transactions on Image Processing},
  volume    = {26},
  number    = {1},
  pages     = {479--489},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  year      = {2017},
  date      = {2017-01-01},
  doi       = {10.1109/TIP.2016.2621666},
  abstract  = {Optimal rate allocation is among the most challenging tasks to perform in the context of predictive video coding, because of the dependencies between frames induced by motion compensation. In this paper, using a recursive rate-distortion model that explicitly takes into account these dependencies, we approach the frame-level rate allocation as a convex optimization problem. This technique is integrated into the recent HEVC encoder, and tested on several standard sequences. Experiments indicate that the proposed rate allocation ensures a better performance (in the rate-distortion sense) than the standard HEVC rate control, and with a little loss with respect to an optimal exhaustive research, which is largely compensated by a much shorter execution time.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {article}
}
2016
Calemme, Marco; Zanuttigh, Pietro; Milani, Simone; Cagnazzo, Marco; Pesquet-Popescu, Beatrice
Depth map coding with elastic contours and 3D surface prediction Proceedings Article
In: 2016 IEEE International Conference on Image Processing (ICIP), pp. 1106–1110, IEEE 2016.
@inproceedings{Calemme2016,
  author       = {Marco Calemme and Pietro Zanuttigh and Simone Milani and Marco Cagnazzo and Beatrice Pesquet-Popescu},
  title        = {Depth map coding with elastic contours and 3D surface prediction},
  booktitle    = {2016 IEEE International Conference on Image Processing (ICIP)},
  pages        = {1106--1110},
  organization = {IEEE},
  year         = {2016},
  date         = {2016-01-01},
  doi          = {10.1109/ICIP.2016.7532529},
  isbn         = {978-1-4673-9961-6},
  keywords     = {},
  pubstate     = {published},
  tppubtype    = {inproceedings}
}
Calemme, Marco; Zanuttigh, Pietro; Milani, Simone; Cagnazzo, Marco; Pesquet-Popescu, Beatrice
Depth map coding with elastic contours and 3D surface prediction Conference
Proceedings of IEEE International Conference on Image Processing (ICIP), 2016, ISBN: 978-1-4673-9961-6.
@conference{11577_3214371,
  author    = {Marco Calemme and Pietro Zanuttigh and Simone Milani and Marco Cagnazzo and Beatrice Pesquet-Popescu},
  title     = {Depth map coding with elastic contours and 3D surface prediction},
  booktitle = {Proceedings of IEEE International Conference on Image Processing (ICIP)},
  pages     = {1106--1110},
  year      = {2016},
  date      = {2016-01-01},
  doi       = {10.1109/ICIP.2016.7532529},
  isbn      = {978-1-4673-9961-6},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}
Jung, Joël; Dricot, Antoine; Cagnazzo, Marco; Pesquet-Popescu, Béatrice
METHOD AND DEVICE FOR CODING AND DECODING A MULTI-VIEW SEQUENCE Miscellaneous
2016.
@misc{11577_3472318,
  author    = {Joël Jung and Antoine Dricot and Marco Cagnazzo and Béatrice Pesquet-Popescu},
  title     = {METHOD AND DEVICE FOR CODING AND DECODING A MULTI-VIEW SEQUENCE},
  year      = {2016},
  date      = {2016-01-01},
  abstract  = {The invention relates to a method for decoding a stream of coded data representative of a video comprising at least one first view and a second view different from the first view, in which a reference image of the second view is previously reconstructed. For at least one block of a current image of the first view, termed the current block, a motion information item associated with said current block and representative of a displacement of said current block in said previously reconstructed reference image, is obtained (E64). A prediction block is obtained (E66) on the basis of said previously reconstructed reference image of said second view and of said motion information item obtained. The current block is reconstructed (E68) on the basis of the prediction block, of an decoded prediction residual information item (E650) on the basis of the stream of coded data and of a difference information item calculated between a first block associated with the first view and a second block associated with the second view and decoded (E67) on the basis of the stream of coded data.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {misc}
}
Maugey, T.; Petrazzuoli, G.; Frossard, P.; Cagnazzo, M.; Pesquet-Popescu, B.
Reference view selection in DIBR-based multiview coding Journal Article
In: IEEE Transactions on Image Processing, vol. 25, no. 4, pp. 1808–1819, 2016.
@article{11577_3469367,
  author    = {T. Maugey and G. Petrazzuoli and P. Frossard and M. Cagnazzo and B. Pesquet-Popescu},
  title     = {Reference view selection in DIBR-based multiview coding},
  journal   = {IEEE Transactions on Image Processing},
  volume    = {25},
  number    = {4},
  pages     = {1808--1819},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  year      = {2016},
  date      = {2016-01-01},
  doi       = {10.1109/TIP.2016.2530303},
  abstract  = {Augmented reality, interactive navigation in 3D scenes, multiview video, and other emerging multimedia applications require large sets of images, hence larger data volumes and increased resources compared with traditional video services. The significant increase in the number of images in multiview systems leads to new challenging problems in data representation and data transmission to provide high quality of experience on resource-constrained environments. In order to reduce the size of the data, different multiview video compression strategies have been proposed recently. Most of them use the concept of reference or key views that are used to estimate other images when there is high correlation in the data set. In such coding schemes, the two following questions become fundamental: 1) how many reference views have to be chosen for keeping a good reconstruction quality under coding cost constraints? And 2) where to place these key views in the multiview data set? As these questions are largely overlooked in the literature, we study the reference view selection problem and propose an algorithm for the optimal selection of reference views in multiview coding systems. Based on a novel metric that measures the similarity between the views, we formulate an optimization problem for the positioning of the reference views, such that both the distortion of the view reconstruction and the coding rate cost are minimized. We solve this new problem with a shortest path algorithm that determines both the optimal number of reference views and their positions in the image set. We experimentally validate our solution in a practical multiview distributed coding system and in the standardized 3D-HEVC multiview coding scheme. We show that considering the 3D scene geometry in the reference view positioning problem brings significant rate-distortion improvements and outperforms the traditional coding strategy that simply selects key frames based on the distance between cameras.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {article}
}
Schretter, C.; Bettens, S.; Blinder, D.; Pesquet-Popescu, B.; Cagnazzo, M.; Dufaux, F.; Schelkens, P.
Compressed digital holography: From micro towards macro Conference
Proceedings of SPIE – The International Society for Optical Engineering, vol. 9971, SPIE, 2016.
@conference{11577_3469675,
  author    = { C. Schretter and S. Bettens and D. Blinder and B. Pesquet-Popescu and M. Cagnazzo and F. Dufaux and P. Schelkens},
  title     = {Compressed digital holography: From micro towards macro},
  booktitle = {Proceedings of SPIE - The International Society for Optical Engineering},
  volume    = {9971},
  publisher = {SPIE},
  year      = {2016},
  date      = {2016-01-01},
  doi       = {10.1117/12.2238761},
  abstract  = {The age of computational imaging is merging the physical hardware-driven approach of photonics with advanced signal processing methods from software-driven computer engineering and applied mathematics. The compressed sensing theory in particular established a practical framework for reconstructing the scene content using few linear combinations of complex measurements and a sparse prior for regularizing the solution. Compressed sensing found direct applications in digital holography for microscopy. Indeed, the wave propagation phenomenon in free space mixes in a natural way the spatial distribution of point sources from the 3-dimensional scene. As the 3-dimensional scene is mapped to a 2-dimensional hologram, the hologram samples form a compressed representation of the scene as well. This overview paper discusses contributions in the field of compressed digital holography at the micro scale. Then, an outreach on future extensions towards the real-size macro scale is discussed. Thanks to advances in sensor technologies, increasing computing power and the recent improvements in sparse digital signal processing, holographic modalities are on the verge of practical high-quality visualization at a macroscopic scale where much higher resolution holograms must be acquired and processed on the computer.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}
Dricot, A.; Jung, J.; Cagnazzo, M.; Pesquet, B.; Dufaux, F.
Improved integral images compression based on multi-view extraction Conference
Proceedings of SPIE – The International Society for Optical Engineering, vol. 9971, SPIE, 2016.
@conference{11577_3469364,
  author    = { A. Dricot and J. Jung and M. Cagnazzo and B. Pesquet and F. Dufaux},
  title     = {Improved integral images compression based on multi-view extraction},
  booktitle = {Proceedings of SPIE - The International Society for Optical Engineering},
  volume    = {9971},
  publisher = {SPIE},
  year      = {2016},
  date      = {2016-01-01},
  doi       = {10.1117/12.2238707},
  abstract  = {Integral imaging is a technology based on plenoptic photography that captures and samples the light-field of a scene through a micro-lens array. It provides views of the scene from several angles and therefore is foreseen as a key technology for future immersive video applications. However, integral images have a large resolution and a structure based on micro-images which is challenging to encode. A compression scheme for integral images based on view extraction has previously been proposed, with average BD-rate gains of 15.7% (up to 31.3%) reported over HEVC when using one single extracted view. As the efficiency of the scheme depends on a tradeoff between the bitrate required to encode the view and the quality of the image reconstructed from the view, it is proposed to increase the number of extracted views. Several configurations are tested with different positions and different number of extracted views. Compression efficiency is increased with average BD-rate gains of 22.2% (up to 31.1%) reported over the HEVC anchor, with a realistic runtime increase.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}
Zheng, S.; Antonini, M.; Cagnazzo, M.; Guerrieri, L.; Kieffer, M.; Nemoianu, I.; Samy, R.; Zhang, B.
Softcast with per-carrier power-constrained channels Conference
Proceedings – International Conference on Image Processing, ICIP, IEEE Computer Society, 2016.
@conference{11577_3469514,
  author    = {S. Zheng and M. Antonini and M. Cagnazzo and L. Guerrieri and M. Kieffer and I. Nemoianu and R. Samy and B. Zhang},
  title     = {Softcast with per-carrier power-constrained channels},
  booktitle = {Proceedings - International Conference on Image Processing, ICIP},
  pages     = {2122--2126},
  publisher = {IEEE Computer Society},
  year      = {2016},
  date      = {2016-01-01},
  doi       = {10.1109/ICIP.2016.7532733},
  abstract  = {This paper considers the Softcast joint source-channel video coding scheme for data transmission over parallel channels with different power constraints and noise characteristics, typical in DSL or PLT channels. To minimize the mean square error at receiver, an optimal precoding matrix design problem has to be solved, which requires the solution of an inverse eigenvalue problem. Such solution is taken from the MIMO channel precoder design literature. Alternative suboptimal precoding matrices are also proposed and analyzed, showing the efficiency of the optimal precoding matrix within Softcast, which provides gains increasing with the encoded video quality.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}
Purica, A. I.; Cagnazzo, M.; Pesquet-Popescu, B.; Dufaux, F.; Ionescu, B.
View synthesis based on temporal prediction via warped motion vector fields Conference
ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing – Proceedings, Institute of Electrical and Electronics Engineers Inc., 2016.
@conference{11577_3469365,
  author    = {A. I. Purica and M. Cagnazzo and B. Pesquet-Popescu and F. Dufaux and B. Ionescu},
  title     = {View synthesis based on temporal prediction via warped motion vector fields},
  booktitle = {ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing - Proceedings},
  pages     = {1150--1154},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  year      = {2016},
  date      = {2016-01-01},
  doi       = {10.1109/ICASSP.2016.7471856},
  abstract  = {The demand for 3D content has increased over the last years as 3D displays are now widespread. View synthesis methods, such as depth-image-based-rendering, provide an efficient tool in 3D content creation or transmission, and are integrated in coding solutions for multiview video content such as 3D-HEVC. In this paper, we propose a view synthesis method that takes advantage of temporal and inter-view correlations in multiview video sequences. We use warped motion vector fields computed in reference views to obtain temporal predictions of a frame in a synthesized view and blend them with depth-image-based-rendering synthesis. Our method is shown to bring gains of 0.42dB in average when tested on several multiview sequences.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}
Calemme, M.; Cagnazzo, M.; Pesquet-Popescu, B.
Contour-Based Depth Coding: A Subjective Quality Assessment Study Conference
Proceedings – 2015 IEEE International Symposium on Multimedia, ISM 2015, Institute of Electrical and Electronics Engineers Inc., 2016, ISBN: 978-1-5090-0379-2.
@conference{11577_3469363,
  author    = { M. Calemme and M. Cagnazzo and B. Pesquet-Popescu},
  title     = {Contour-Based Depth Coding: A Subjective Quality Assessment Study},
  booktitle = {Proceedings - 2015 IEEE International Symposium on Multimedia, ISM 2015},
  pages     = {295--300},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  year      = {2016},
  date      = {2016-01-01},
  doi       = {10.1109/ISM.2015.34},
  isbn      = {978-1-5090-0379-2},
  abstract  = {Multi-view video plus depth is emerging as the most flexible format for 3D video representation, as witnessed by the current standardization efforts by ISO and ITU. The depth information allows synthesizing virtual view points, and for its compression various techniques have been proposed. It is generally recognized that a high quality view rendering at the receiver side is possible only by preserving the contour information since distortions on edges during the encoding step would cause a sensible degradation on the synthesized view and on the 3D perception. As a consequence recent approaches include contour-based coding of depths. However, the impact of contour-preserving depth-coding on the perceived quality of synthesized images has not been conveniently studied. Therefore in this paper we make an investigation by means of a subjective study to better understand the limits and the potentialities of the different techniques. Our results show that the contour information is indeed relevant in the synthesis step: preserving the contours and coding coarsely the rest typically leads to images that users cannot tell apart from the reference ones, even at low bit rate. Moreover, our results show that objective metrics that are commonly used to evaluate synthesized images may have a low correlation coefficient with MOS rates and are in general not consistent across several techniques and contents.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}
Fiengo, A.; Chierchia, G.; Cagnazzo, M.; Pesquet-Popescu, B.
Convex optimization for frame-level rate allocation in MV-HEVC Conference
Proceedings – International Conference on Image Processing, ICIP, IEEE Computer Society, 2016.
@conference{11577_3469679,
  author    = {A. Fiengo and G. Chierchia and M. Cagnazzo and B. Pesquet-Popescu},
  title     = {Convex optimization for frame-level rate allocation in MV-HEVC},
  booktitle = {Proceedings - International Conference on Image Processing, ICIP},
  pages     = {2157--2161},
  publisher = {IEEE Computer Society},
  year      = {2016},
  date      = {2016-01-01},
  doi       = {10.1109/ICIP.2016.7532740},
  abstract  = {Optimal rate allocation is among the most challenging tasks to perform in the context of multi-view video coding, because of the dependency between frames induced by motion compensation and depth image-based rendering. In this paper, using a recursive rate-distortion model that explicitly takes into account these dependencies, we approach the frame-level rate allocation as a convex optimization problem. Within this framework, we provide an efficient algorithm for exactly solving the above problem with recent convex optimization tools. Experiments on standard sequences demonstrate the interest of considering the proposed rate allocation method and confirm that our approach ensures a better performance (in rate-distortion sense) than the standard MV-HEVC rate control.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}
Purica, A. I.; Mora, E. G.; Pesquet-Popescu, B.; Cagnazzo, M.; Ionescu, B.
Multiview Plus Depth Video Coding with Temporal Prediction View Synthesis Journal Article
In: IEEE Transactions on Circuits and Systems for Video Technology, vol. 26, no. 2, pp. 360–374, 2016.
@article{11577_3469368,
  author    = {A. I. Purica and E. G. Mora and B. Pesquet-Popescu and M. Cagnazzo and B. Ionescu},
  title     = {Multiview Plus Depth Video Coding with Temporal Prediction View Synthesis},
  journal   = {IEEE Transactions on Circuits and Systems for Video Technology},
  volume    = {26},
  number    = {2},
  pages     = {360--374},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  year      = {2016},
  date      = {2016-01-01},
  doi       = {10.1109/TCSVT.2015.2389511},
  abstract  = {Multiview video (MVV) plus depths formats use view synthesis to build intermediate views from existing adjacent views at the receiver side. Traditional view synthesis exploits the disparity information to interpolate an intermediate view by considered inter-view correlations. However, temporal correlation between different frames of the intermediate view can be used to improve the synthesis. We propose a new coding scheme for 3-D High Efficiency Video Coding (HEVC) that allows us to take full advantage of temporal correlations in the intermediate view and improve the existing synthesis from adjacent views. We use optical flow techniques to derive dense motion vector fields (MVF) from the adjacent views and then warp them at the level of the intermediate view. This allows us to construct multiple temporal predictions of the synthesized frame. A second contribution is an adaptive fusion method that judiciously selects between temporal and inter-view prediction to eliminate artifacts associated with each prediction type. The proposed system is compared against the state-of-the-art view synthesis reference software 1-D Fast technique used in 3-D HEVC standardization. Three intermediary views are synthesized. Gains of up to 1.21-dB Bjontegaard Delta peak SNR are shown when evaluated on several standard MVV test sequences.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {article}
}
Purica, A. I.; Cagnazzo, M.; Pesquet-Popescu, B.; Dufaux, F.; Ionescu, B.
A distortion evaluation framework in 3D video view synthesis Conference
2015 International Conference on 3D Imaging, IC3D 2015 – Proceedings, Institute of Electrical and Electronics Engineers Inc., 2016, ISBN: 978-1-5090-1265-7.
@conference{11577_3469678,
  author    = { A. I. Purica and M. Cagnazzo and B. Pesquet-Popescu and F. Dufaux and B. Ionescu},
  title     = {A distortion evaluation framework in 3D video view synthesis},
  booktitle = {2015 International Conference on 3D Imaging, IC3D 2015 - Proceedings},
  pages     = {1--8},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  year      = {2016},
  date      = {2016-01-01},
  doi       = {10.1109/IC3D.2015.7391827},
  isbn      = {978-1-5090-1265-7},
  abstract  = {Demand for 3D content increased over the last years and more attention was dedicated to methods used in 3D content creation and transmission. View synthesis methods introduce localized artifacts when creating new virtual views. Evaluating these methods require therefore a different approach, in order to identify and emphasize synthesis artifact prone areas, while diminishing the impact, of other types of artifacts, such as those produced by quantization during the video coding. In this paper, we propose an artifact evaluation technique which was shown to provide a better differentiation of synthesis methods, while additional information can be extrapolated from the results about the spatial localization of typical synthesis artifacts and their impact on overall image quality.},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}
Greco, C.; Nemoianu, I. D.; Cagnazzo, M.; Pesquet-Popescu, B.
Rate-distortion-optimized multi-view streaming in wireless environment using network coding Journal Article
In: EURASIP Journal on Advances in Signal Processing, vol. 2016, no. 1, pp. 1–20, 2016.
@article{11577_3469269,
title = {Rate-distortion-optimized multi-view streaming in wireless environment using network coding},
author = {Greco, C. and Nemoianu, I. D. and Cagnazzo, M. and Pesquet-Popescu, B.},
doi = {10.1186/s13634-016-0308-4},
year = {2016},
date = {2016-01-01},
journal = {{EURASIP} Journal on Advances in Signal Processing},
volume = {2016},
number = {1},
pages = {1--20},
pubstate = {published},
tppubtype = {article}
}
2015
Jung, Joel; Dricot, Antoine; Cagnazzo, Marco; Pesquet-Popescu, Beatrice; Dufaux, Frederic
CODAGE/DECODAGE PREDICTIF D’IMAGES COMPORTANT UN ARTEFACT, UTILISANT UNE EXTRAPOLATION Miscellaneous
2015.
@misc{11577_3472320,
title = {CODAGE/DECODAGE PREDICTIF D'IMAGES COMPORTANT UN ARTEFACT, UTILISANT UNE EXTRAPOLATION},
author = {Jung, Joel and Dricot, Antoine and Cagnazzo, Marco and Pesquet-Popescu, Beatrice and Dufaux, Frederic},
year = {2015},
date = {2015-01-01},
abstract = {L'invention concerne un codage/décodage par prédiction d'un bloc courant d'au moins une image courante, dans lequel on obtient un vecteur de mouvement (mv) pointant vers un bloc de référence (bref) d'une zone de pixels préalablement décodée, ladite zone de pixels comportant un artéfact ayant une position déterminée. En particulier : - on détermine (S3), en fonction de la position de l'artéfact dans ladite zone de pixels, si le bloc de référence comporte au moins une partie de l'artéfact, - le cas échéant, on corrige (S4) le bloc de référence en corrigeant des pixels au moins de ladite partie de l'artéfact par extrapolation à partir d'autres pixels de ladite zone de pixels, et - on utilise le bloc de référence corrigé (bref*) pour le décodage (S6) par prédiction.},
pubstate = {published},
tppubtype = {misc}
}
Dricot, A.; Jung, J.; Cagnazzo, M.; Pesquet, B.; Dufaux, F.; Kovacs, P. T.; Adhikarla, V. K.
Subjective evaluation of Super Multi-View compressed contents on high-end light-field 3D displays Journal Article
In: Signal Processing: Image Communication, vol. 39, pp. 369–385, 2015.
@article{11577_3469366,
title = {Subjective evaluation of {Super Multi-View} compressed contents on high-end light-field {3D} displays},
author = {Dricot, A. and Jung, J. and Cagnazzo, M. and Pesquet, B. and Dufaux, F. and Kovacs, P. T. and Adhikarla, V. K.},
doi = {10.1016/j.image.2015.04.012},
year = {2015},
date = {2015-01-01},
journal = {Signal Processing: Image Communication},
volume = {39},
pages = {369--385},
publisher = {Elsevier B.V.},
abstract = {Super Multi-View (SMV) video content is composed of tens or hundreds of views that provide a light-field representation of a scene. This representation allows a glass-free visualization and eliminates many causes of discomfort existing in current available 3D video technologies. Efficient video compression of SMV content is a key factor for enabling future 3D video services. This paper first compares several coding configurations for SMV content and several inter-view prediction structures are also tested and compared. The experiments mainly suggest that large differences in coding efficiency can be observed from one configuration to another. Several ratios for the number of coded and synthesized views are compared, both objectively and subjectively. It is reported that view synthesis significantly affects the coding scheme. The amount of views to skip highly depends on the sequence and on the quality of the associated depth maps. Reported ranges of bitrates required to obtain a good quality for the tested SMV content are realistic and coherent with future 4 K/8 K needs. The reliability of the PSNR metric for SMV content is also studied. Objective and subjective results show that PSNR is able to reflect increase or decrease in subjective quality even in the presence of synthesized views. However, depending on the ratio of coded and synthesized views, the order of magnitude of the effective quality variation is biased by PSNR. Results indicate that PSNR is less tolerant to view synthesis artifacts than human viewers. Finally, preliminary observations are initiated. First, the light-field conversion step does not seem to alter the objective results for compression. Secondly, the motion parallax does not seem to be impacted by specific compression artifacts. The perception of the motion parallax is only altered by variations of the typical compression artifacts along the viewing angle, in cases where the subjective image quality is already low. 
To the best of our knowledge, this paper is the first to carry out subjective experiments and to report results of SMV compression for light-field 3D displays. It provides first results showing that improvement of compression efficiency is required, as well as depth estimation and view synthesis algorithms improvement, but that the use of SMV appears realistic according to next generation compression technology requirements.},
pubstate = {published},
tppubtype = {article}
}
Maugey, T.; Petrazzuoli, G.; Frossard, P.; Cagnazzo, M.; Pesquet-Popescu, B.
Key view selection in distributed multiview coding Conference
2014 IEEE Visual Communications and Image Processing Conference, VCIP 2014, Institute of Electrical and Electronics Engineers Inc., 2015, ISBN: 978-1-4799-6139-9.
@inproceedings{11577_3469672,
title = {Key view selection in distributed multiview coding},
author = {Maugey, T. and Petrazzuoli, G. and Frossard, P. and Cagnazzo, M. and Pesquet-Popescu, B.},
doi = {10.1109/VCIP.2014.7051612},
isbn = {978-1-4799-6139-9},
year = {2015},
date = {2015-01-01},
booktitle = {2014 IEEE Visual Communications and Image Processing Conference, VCIP 2014},
pages = {486--487},
publisher = {Institute of Electrical and Electronics Engineers Inc.},
abstract = {Multiview image and video systems with large number of views lead to new problems in data representation, transmission and user interaction. In order to reduce the data volumes, most distributed multiview coding schemes exploit the inter-view redundancies at the decoder side, using view synthesis from key views. In the situation where many views are considered, the two following questions become fundamental: i) how many key views have to be chosen for keeping a good reconstruction quality with reasonable coding cost? ii) where to place them optimally in the multiview sequences? We propose in this paper an algorithm for selecting the key views in a distributed multiview coding scheme. Based on a novel metric for the correlation between the views, we formulate an optimization problem for the positioning of the key views such that both the distortion of the reconstruction and the coding rate cost are effectively minimized. We then propose a new optimization strategy based on shortest path algorithm that permits to determine both the optimal number of key views and their positions in the image set. We experimentally validate our solution in a practical distributed multiview coding system and we show that considering the 3D scene geometry in the key view positioning brings significant rate-distortion improvements compared to distance-based key view selection as it is commonly done in the literature.},
pubstate = {published},
tppubtype = {conference}
}