% Book chapter record; the key and url point at the documentation.ird.fr catalogue entry.
% NOTE(review): "numero" is a non-standard field kept verbatim from the export; it is
% ignored by standard styles. Presumably the number within the series -- confirm before
% renaming it to "number".
% NOTE(review): the export carried an empty editor field, dropped here; add the volume
% editors once verified against the publisher record.
@incollection{fdi:010073007,
  title     = {Cleaning, integrating, and warehousing genomic data from biomedical resources},
  author    = {Moussouni, F. and Berti-Equille, Laure},
  language  = {ENG},
  abstract  = {In this chapter, the authors review the literature on data integration in the life sciences with a particular focus on the approaches that have been proposed to handle biological data quality problems. They propose a classification of data quality problems in biomedical resources and present some of preprocessing solutions that can be practically implemented before any data-mining task. Based on their previous work on data cleaning, integration, and warehousing of biomedical data, they present the lessons they have learned and the approaches implemented in practice. Finally, they conclude with some challenging research directions for biomedical data preprocessing and integration.},
  keywords  = {INFORMATIQUE SCIENTIFIQUE ; BANQUE DE DONNEES ; TRAITEMENT DE DONNEES ; QUALITE ; BIOLOGIE ; SANTE ; BIOINFORMATIQUE ; GENOMIQUE ; ONTOLOGIE},
  booktitle = {Biological knowledge discovery handbook},
  numero    = {23},
  pages     = {35--58},
  address   = {Hoboken},
  publisher = {Wiley},
  series    = {Wiley Book Series on Bioinformatics},
  year      = {2014},
  doi       = {10.1002/9781118617151.ch02},
  isbn      = {978-1-118-13273-9},
  url       = {https://www.documentation.ird.fr/hor/fdi:010073007},
}