@article{fdi:010073027, title = {{D}raft genome and reference transcriptomic resources for the urticating pine defoliator {T}haumetopoea pityocampa ({L}epidoptera : {N}otodontidae)}, author = {{G}schloessl, {B}. and {D}orkeld, {F}. and {B}erges, {H}. and {B}eydon, {G}. and {B}ouchez, {O}. and {B}ranco, {M}. and {B}retaudeau, {A}. and {B}urban, {C}. and {D}ubois, {E}. and {G}authier, {P}hilippe and {L}huillier, {E}. and {N}ichols, {J}. and {N}idelet, {S}. and {R}ocha, {S}. and {S}aune, {L}. and {S}treiff, {R}. and {G}autier, {M}. and {K}erdelhue, {C}.}, editor = {}, language = {{ENG}}, abstract = {{T}he pine processionary moth {T}haumetopoea pityocampa ({L}epidoptera: {N}otodontidae) is the main pine defoliator in the {M}editerranean region. {I}ts urticating larvae cause severe human and animal health concerns in the invaded areas. {T}his species shows a high phenotypic variability for various traits, such as phenology, fecundity and tolerance to extreme temperatures. {T}his study presents the construction and analysis of extensive genomic and transcriptomic resources, which are an obligate prerequisite to understand their underlying genetic architecture. {U}sing a well-studied population from {P}ortugal with peculiar phenological characteristics, the karyotype was first determined and a first draft genome of 537{M}b total length was assembled into 68,292 scaffolds ({N}50 = 164kb). {F}rom this genome assembly, 29,415 coding genes were predicted. {T}o circumvent some limitations for fine-scale physical mapping of genomic regions of interest, a 3{X} coverage {BAC} library was also developed. {I}n particular, 11 {BAC}s from this library were individually sequenced to assess the assembly quality. {A}dditionally, de novo transcriptomic resources were generated from various developmental stages sequenced with {H}i{S}eq and {M}i{S}eq {I}llumina technologies. {T}he reads were de novo assembled into 62,376 and 63,175 transcripts, respectively. {T}hen, a robust subset of the genome-predicted coding genes, the de novo transcriptome assemblies and previously published 454/{S}anger data were clustered to obtain a high-quality and comprehensive reference transcriptome consisting of 29,701 bona fide unigenes. {T}hese sequences covered 99% of the cegma and 88% of the busco highly conserved eukaryotic genes and 84% of the busco arthropod gene set. {M}oreover, 90% of these transcripts could be localized on the draft genome. {T}he described information is available via a genome annotation portal (}, keywords = {{BAC} library ; de novo assembly ; gene prediction ; genome ; {L}epidoptera ; transcriptome}, booktitle = {}, journal = {{M}olecular {E}cology {R}esources}, volume = {18}, numero = {3}, pages = {602--619}, ISSN = {1755-098{X}}, year = {2018}, DOI = {10.1111/1755-0998.12756}, URL = {https://www.documentation.ird.fr/hor/fdi:010073027}, }