@article{641, author = {Zaid Zada and Samuel Nastase and Bobbi Aubrey and Itamar Jalon and Sebastian Michelmann and Haocheng Wang and Liat Hasenfratz and Werner Doyle and Daniel Friedman and Patricia Dugan and Lucia Melloni and Sasha Devore and Adeen Flinker and Orrin Devinsky and Ariel Goldstein and Uri Hasson}, title = {The "Podcast" ECoG dataset for modeling neural activity during natural language comprehension.}, abstract = {
Naturalistic electrocorticography (ECoG) data are a rare but essential resource for studying the brain{\textquoteright}s linguistic capabilities. ECoG offers high temporal resolution suitable for investigating processes at multiple temporal timescales and frequency bands. It also provides broad spatial coverage, often along critical language areas. Here, we share a dataset of nine ECoG participants with 1,330 electrodes listening to a 30-minute audio podcast. The richness of this naturalistic stimulus can be used for various research questions, from auditory perception to narrative integration. In addition to the neural data, we extracted linguistic features of the stimulus ranging from phonetic information to large language model word embeddings. We use these linguistic features in encoding models that relate stimulus properties to neural activity. Finally, we provide detailed tutorials for preprocessing raw data, extracting stimulus features, and running encoding analyses that can serve as a pedagogical resource or a springboard for new research.
}, year = {2025}, journal = {Scientific data}, volume = {12}, pages = {1135}, month = {07/2025}, issn = {2052-4463}, doi = {10.1038/s41597-025-05462-2}, language = {eng}, }