<?xml version='1.0' encoding='UTF-8'?><rss xmlns:atom="http://www.w3.org/2005/Atom" xmlns:openSearch="http://a9.com/-/spec/opensearchrss/1.0/" xmlns:blogger="http://schemas.google.com/blogger/2008" xmlns:georss="http://www.georss.org/georss" xmlns:gd="http://schemas.google.com/g/2005" xmlns:thr="http://purl.org/syndication/thread/1.0" version="2.0"><channel><atom:id>tag:blogger.com,1999:blog-8099840</atom:id><lastBuildDate>Sun, 15 Feb 2026 00:00:39 +0000</lastBuildDate><category>Genomics</category><category>Staphylococcus aureus</category><category>Bacteria</category><category>Modernising Medical Microbiology</category><category>Selection</category><category>GWAS</category><category>COVID-19</category><category>Statistics</category><category>Antibiotics</category><category>Campylobacter jejuni</category><category>Derrick Crook</category><category>Mycobacterium tuberculosis</category><category>Postdoc</category><category>Recruitment</category><category>Virulogenomics</category><category>Clostridium difficile</category><category>Evolution</category><category>Microbiology</category><category>Nicolas Arning</category><category>Phylogenetics</category><category>Bernadette Young</category><category>Big Data Institute</category><category>Harmonic mean p-value</category><category>Nuffield Department of Medicine</category><category>Antimicrobial resistance</category><category>Machine learning</category><category>Population Genetics</category><category>Recombination</category><category>Royal Society</category><category>SMBE</category><category>Sam Sheppard</category><category>Transmission</category><category>Bethany Dearlove</category><category>CRyPTIC</category><category>David Eyre</category><category>Doublethink</category><category>Epidemiology</category><category>Escherichia coli</category><category>Helen Fryer</category><category>Oxford</category><category>PLoS Genetics</category><category>PNAS</category><category>Public Engagement</category><category>Public Health England</category><category>Publishing</category><category>Rory Bowden</category><category>Ruth Massey</category><category>UK Biobank</category><category>Wellcome Trust</category><category>omegaMap</category><category>BEAST</category><category>Bill &amp; Melinda Gates Foundation</category><category>Bonferroni correction</category><category>David Wyllie</category><category>Drosophila</category><category>FDR</category><category>FWER</category><category>HIV</category><category>Hepatitis C</category><category>Human Evolution</category><category>Jessie Wu</category><category>Lab business</category><category>MRC</category><category>PLoS Computational Biology</category><category>PLoS Pathogens</category><category>Peter Andolfatto</category><category>PhD studentship</category><category>Presentations</category><category>Sarah Walker</category><category>Tim Peto</category><category>Adaptation</category><category>Andrew Rambaut</category><category>Artificial intelligence</category><category>Bioinformatics</category><category>COVID-19 Host Genetics Initiative</category><category>Cheltenham Science Festival</category><category>Christophe Fraser</category><category>Claudia Lindemann</category><category>Conference</category><category>David Clifton</category><category>Jessica Hedge</category><category>Martin Fraunholz</category><category>Martin Maiden</category><category>Metagenomics</category><category>Microbial Genomics</category><category>Molecular Biology and Evolution</category><category>Molly Przeworski</category><category>Neisseria meningitidis</category><category>New England Journal of Medicine</category><category>Newton Fund</category><category>Nicola De Maio</category><category>Nuffield Department of Population Health</category><category>Oxford Martin School</category><category>PLoS Biology</category><category>Petra Mullner</category><category>Phylogeography</category><category>Pseudomonas aeruginosa</category><category>Research</category><category>SCOTTI</category><category>Sarah Earle</category><category>Society for Molecular Biology and Evolution</category><category>Stephen Bentley</category><category>Tanya Golubchik</category><category>Teaching</category><category>Xavier Dideleot</category><category>correction</category><category>eLife</category><category>malaria</category><category>norovirus</category><category>software</category><category>Adam Eyre-Walker</category><category>Adi Alon</category><category>Ashleigh Griffin</category><category>Ashley Robinson</category><category>Association Studies</category><category>Australia</category><category>BBSRC</category><category>Benjamini-Hochberg procedure</category><category>Beth Gibson</category><category>BioHPC</category><category>British Museum</category><category>Cambodia</category><category>Campylobacter coli</category><category>Carina Brehony</category><category>Caroline Buckee</category><category>Catrin Moore</category><category>Chris Spencer</category><category>Christoph Tang</category><category>ClonalFrameML</category><category>Coalescent</category><category>Continuing Education</category><category>Daniel Falush</category><category>Data Science</category><category>Dominic Kwiatkowski</category><category>Down&#39;s syndrome</category><category>Ebola</category><category>Ed Feil</category><category>Edith Gabriel</category><category>Eduardo Rocha</category><category>Eukaryotes</category><category>ExWAS</category><category>Faculty of 1000</category><category>Festival of Genomics</category><category>Food-borne disease</category><category>Genome Biology</category><category>Graham Coop</category><category>Grenoble</category><category>Hutterites</category><category>IJ Good</category><category>ISME Journal</category><category>Infection</category><category>Institut Pasteur</category><category>Institute for Emerging Infections</category><category>Jane Charlesworth</category><category>John Lees</category><category>Journal Club</category><category>Kathleen O&#39;Reilly</category><category>Kilifi</category><category>Klebsiella pneumoniae</category><category>Kyle Knox</category><category>Lancaster</category><category>Lev Landau</category><category>Liz Batty</category><category>Lluis Quintana-Murci</category><category>Luis Barreiro</category><category>Madeleine Cule</category><category>Mark Smeltzer</category><category>Me</category><category>NERC</category><category>NIHR</category><category>Nanopore</category><category>Nature Communications</category><category>Nature Microbiology</category><category>Nature Reviews Genetics</category><category>Nature Reviews Microbiology</category><category>Neolithic</category><category>New York</category><category>Nicholas Thompson</category><category>Nicole Stoesser</category><category>Nigel French</category><category>Olduvai Gorge</category><category>Oliver Pybus</category><category>OxBRC</category><category>Oxford Tropical Network</category><category>PLoS ONE</category><category>Palaeontology</category><category>Panton Valentine Leukocidin</category><category>Paul Keim</category><category>Paul Sharp</category><category>Peer Review</category><category>Peter Ralph</category><category>Phillipe Glaser</category><category>Pierre Mahe</category><category>Prize</category><category>ProbGen</category><category>Proceedings B</category><category>Pseudogenes</category><category>Resistance</category><category>Review</category><category>Richard Everitt</category><category>Robertson Foundation</category><category>Rosalind Harding</category><category>Ryan Hernandez</category><category>Salmonella enterica</category><category>Science</category><category>Science Bomb</category><category>Science Museum</category><category>Simes procedure</category><category>Sir Henry Dale Fellowship</category><category>Society for General Microbiology</category><category>St. John&#39;s College</category><category>Statistical Genomics Summer School</category><category>Streptococcus pneumoniae</category><category>Sudip Das</category><category>Summer Science Exhibition</category><category>Talk</category><category>Tarek Msadek</category><category>Toll-like receptors</category><category>Tool Use</category><category>Trends in Microbiology</category><category>Vibrio cholerae</category><category>Vibrionaceae</category><category>Viruses</category><category>Wellcome Open Research</category><category>Wellcome Trust Sanger Institute</category><category>World Health Day</category><category>Xavier Didelot</category><category>Zika virus</category><category>Zoonosis</category><category>antigens</category><category>codeml</category><category>combined tests</category><category>doubling time</category><category>false discovery rate</category><category>family-wise error rate</category><category>gammaMap</category><category>genomegaMap</category><category>hypothesis testing</category><category>lockdown</category><category>lyre bird</category><category>mGen</category><category>macaques</category><category>meiosis</category><category>meningitis</category><category>mkprf</category><category>mutation</category><category>p-values</category><category>pedigrees</category><category>pyomyositis</category><category>vaccines</category><category>var</category><category>vin</category><title>Daniel Wilson&#39;s Blog</title><description>Research in Population Genomics</description><link>http://blog.danielwilson.me.uk/</link><managingEditor>noreply@blogger.com (Daniel Wilson)</managingEditor><generator>Blogger</generator><openSearch:totalResults>100</openSearch:totalResults><openSearch:startIndex>1</openSearch:startIndex><openSearch:itemsPerPage>25</openSearch:itemsPerPage><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-5789335442300850984</guid><pubDate>Mon, 05 Jan 2026 09:37:00 +0000</pubDate><atom:updated>2026-01-05T03:37:03.354-06:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">COVID-19</category><category domain="http://www.blogger.com/atom/ns#">Doublethink</category><category domain="http://www.blogger.com/atom/ns#">ExWAS</category><category domain="http://www.blogger.com/atom/ns#">Helen Fryer</category><category domain="http://www.blogger.com/atom/ns#">Nicolas Arning</category><category domain="http://www.blogger.com/atom/ns#">UK Biobank</category><title>New paper: Identifying direct risk factors for COVID-19 hospitalization in UK Biobank using Doublethink</title><description>&lt;p&gt;This week sees publication of our new paper&amp;nbsp;&lt;b&gt;&lt;a href=&quot;https://www.pnas.org/doi/full/10.1073/pnas.2514138122&quot;&gt;Identifying direct risk factors in UK Biobank via simultaneous Bayesian-frequentist model-averaged hypothesis testing using Doublethink&lt;/a&gt;&lt;/b&gt; in&amp;nbsp;&lt;i&gt;Proceedings of the National Academy of Sciences (PNAS)&lt;/i&gt;. This work was joint with &lt;a href=&quot;https://www.google.com/url?sa=t&amp;amp;source=web&amp;amp;rct=j&amp;amp;opi=89978449&amp;amp;url=https://de.linkedin.com/in/nicolas-arning&amp;amp;ved=2ahUKEwjohab1i_SRAxUvWkEAHeHHDpAQFnoECBwQAQ&amp;amp;usg=AOvVaw0ZzXaAmFq9AiCY6byS02ix&quot;&gt;Nicolas Arning&lt;/a&gt; and &lt;a href=&quot;https://www.linkedin.com/in/helen-fryer-626b564a&quot;&gt;Helen Fryer&lt;/a&gt;.&lt;/p&gt;&lt;p&gt;In this study we applied a novel approach called &lt;a href=&quot;https://www.danielwilson.me.uk/abstracts/fryer_etal_2024.html&quot;&gt;Doublehthink&lt;/a&gt; to implement an exposome-wide association study (ExWAS) of non-genetic risk factors that influence risk of COVID-19 hospitalization in UK Biobank (UKB). Inspired by Bayesian model averaging, our approach enhances power by testing both individual variables and arbitrary groups of variables.&lt;/p&gt;&lt;p&gt;We employed Doublethink to reveal exposome-wide significant signals across nine individual variables and seven groups of variables, notably factors like aging, dementia and prior infection overlooked by 85% of previous studies of the UK Biobank. We found significant direct effects among some commonly reported risk factors like age, sex, and obesity, but not others like cardiovascular disease. The effects of hypertension, depression, and diabetes appeared to be mediated via general comorbidity.&amp;nbsp;&lt;/p&gt;&lt;p&gt;&lt;a href=&quot;https://www.pnas.org/doi/full/10.1073/pnas.2514138122#fig01&quot;&gt;&lt;img alt=&quot;Graph of variables with direct effects on COVID-19 hospitalization risk in UK Biobank, quantified by log sub 10 posterior odds and adjusted P-value.&quot; data-index=&quot;0&quot; data-open=&quot;viewer&quot; data-target=&quot;core-fv-fig01&quot; height=&quot;357&quot; loading=&quot;lazy&quot; src=&quot;https://www.pnas.org/cms/10.1073/pnas.2514138122/asset/e2a54cbd-b112-4746-a3e3-762282025bdf/assets/images/large/pnas.2514138122fig01.jpg&quot; width=&quot;640&quot; /&gt;&lt;/a&gt;&lt;/p&gt;&lt;p&gt;Biobank-scale epidemiology has transformed the study of common diseases, particularly through the discovery of genetic risk factors using genome-wide association studies (GWAS) methods. ExWAS applies similiar logic to pursue agnostic, data-driven discovery of non-genetic risk factors.&lt;/p&gt;&lt;p&gt;Doublethink offers an ExWAS method that can test thousands of variables in hundreds of thousands of UK Biobank participants. It controls both Bayesian (false discovery rate; FDR) and classical (familywise error rate; FWER) measures of false positives. Its Bayesian model-averaging approach enables an agnostic approach to variable selection, but it also addresses drawbacks of Bayesian methods like computational burden and reliance on prior assumptions for its false positive control.&lt;/p&gt;&lt;p&gt;Through its capacity to interpret biobank-scale data, our new Doublethink-based ExWAS approach paves the way for future systematic analyses of risk factors for infectious and chronic diseases in UK Biobank and beyond.&lt;/p&gt;</description><link>http://blog.danielwilson.me.uk/2026/01/new-paper-identifying-direct-risk.html</link><author>noreply@blogger.com (Daniel Wilson)</author><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-2481872185514402810</guid><pubDate>Tue, 14 Oct 2025 09:47:00 +0000</pubDate><atom:updated>2025-10-14T04:48:51.104-05:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">David Eyre</category><category domain="http://www.blogger.com/atom/ns#">Genome Biology</category><category domain="http://www.blogger.com/atom/ns#">Machine learning</category><category domain="http://www.blogger.com/atom/ns#">Nicolas Arning</category><category domain="http://www.blogger.com/atom/ns#">Sam Sheppard</category><category domain="http://www.blogger.com/atom/ns#">Statistics</category><title>New paper: Machine learning and statistical inference in microbial population genomics</title><description>&lt;p&gt;We have published a new &lt;a href=&quot;https://genomebiology.biomedcentral.com/articles/10.1186/s13059-025-03775-4&quot;&gt;review article in Genome Biology&lt;/a&gt; contrasting machine learning and statistics in microbial genomics. This is joint work with &lt;a href=&quot;https://www.biology.ox.ac.uk/people/samuel-sheppard&quot;&gt;Sam Sheppard&lt;/a&gt;, &lt;a href=&quot;https://www.danielwilson.me.uk/lab.html&quot;&gt;Nick Arning&lt;/a&gt; and &lt;a href=&quot;https://www.bdi.ox.ac.uk/Team/david-eyre&quot;&gt;David Eyre&lt;/a&gt;.&lt;/p&gt;&lt;p&gt;The availability of large genome datasets has changed the microbiology research landscape. Analyzing such data requires computationally demanding analyses, and new approaches have come from different data analysis philosophies. Machine learning and statistical inference have overlapping knowledge discovery aims and approaches.&lt;/p&gt;&lt;p&gt;In this review, we highlight how machine learning focuses on optimizing prediction, whereas statistical inference focuses on understanding the processes relating variables. We outline the different aims, assumptions, and resulting methodologies, with examples from microbial genomics. These approaches are essentially complementary, and we argue that exploiting both machine learning and statistics - selecting the right tool for the job - has the greatest potential for advancing pathogen research in the big data era.&lt;/p&gt;</description><link>http://blog.danielwilson.me.uk/2025/10/new-paper-machine-learning-and.html</link><author>noreply@blogger.com (Daniel Wilson)</author><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-5928892906370478409</guid><pubDate>Mon, 12 May 2025 10:16:00 +0000</pubDate><atom:updated>2025-05-20T00:56:22.558-05:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">Doublethink</category><category domain="http://www.blogger.com/atom/ns#">FDR</category><category domain="http://www.blogger.com/atom/ns#">FWER</category><category domain="http://www.blogger.com/atom/ns#">Harmonic mean p-value</category><category domain="http://www.blogger.com/atom/ns#">Helen Fryer</category><category domain="http://www.blogger.com/atom/ns#">hypothesis testing</category><category domain="http://www.blogger.com/atom/ns#">Nicolas Arning</category><category domain="http://www.blogger.com/atom/ns#">Statistics</category><title>Doublethink: simultaneous Bayesian-frequentist model-averaged hypothesis testing</title><description>Helen Fryer, Nick Arning and I have posted our new preprint to &lt;a href=&quot;https://arxiv.org/abs/2312.17566&quot; target=&quot;_blank&quot;&gt;arxiv&lt;/a&gt;. This is the first version of the paper that we have submitted for peer review. Doublethink addresses some long-standing questions in assessing evidence for the purposes of hypothesis testing.&lt;div&gt;&lt;br /&gt;&lt;/div&gt;&lt;div&gt;Hypothesis testing is central to scientific enquiry, but conclusions can be heavily influenced by model specification, particularly which variables are included. Bayesian model-averaged hypothesis testing offers a solution, but the sensitivity of posterior odds and Bayesian false discovery rate (FDR) guarantees to prior assumptions limit the appeal. In hypothesis testing, we lack unifying results – like Bernstein-von-Mises’ Theorem – that predict convergence of Bayesian and frequentist results, even in large samples.&lt;/div&gt;&lt;div&gt;&lt;br /&gt;&lt;/div&gt;&lt;div&gt;Our paper introduces new theory and a practical method, &lt;i&gt;Doublethink&lt;/i&gt;, motivated by these issues:&lt;/div&gt;&lt;div&gt;&lt;ul style=&quot;text-align: left;&quot;&gt;&lt;li&gt;A key, and perhaps surprising, result is that Bayesian model-averaged hypothesis testing natively controls not only the Bayesian FDR, but also the frequentist strong-sense familywise error rate (FWER). This duality – which is general – seems to be unknown, or forgotten.&lt;/li&gt;&lt;li&gt;For practical application, we derive large-sample asymptotic theory to quantify the rate at which the FWER is controlled. Specifically, we use a BIC-like model to characterize the tail probability of the model-averaged posterior odds via a chi-squared distribution.&lt;/li&gt;&lt;/ul&gt;&lt;div class=&quot;separator&quot; style=&quot;clear: both; text-align: center;&quot;&gt;&lt;a href=&quot;#define-variables&quot; style=&quot;margin-left: 1em; margin-right: 1em;&quot;&gt;&lt;img border=&quot;0&quot; data-original-height=&quot;190&quot; data-original-width=&quot;1460&quot; height=&quot;53&quot; src=&quot;https://blogger.googleusercontent.com/img/b/R29vZ2xl/AVvXsEiOwQIIOEMLlhoaase7IV3Zp98FXcWKlx-Om4jXd4BXGpcRY_j1Z7Uun8VSGUAEmAPIF03rCeDBCHMl356C3tpLhTiltJ4tF2U1Y18XF3Yb-50-zN1kV3GlM3T9zigM3srULvUUTvPKKHvUgWyLxxuSpnh4Sr3PvzGuhe_VRfQd8u_SMPtTUl3c/w400-h53/Screenshot%202025-05-12%20at%2011.06.04.png&quot; width=&quot;400&quot; /&gt;&lt;/a&gt;&lt;/div&gt;&lt;ul style=&quot;text-align: left;&quot;&gt;&lt;li&gt;This result enables simultaneous control of Bayesian FDR and frequentist FWER at quantifiable levels and – equivalently – simultaneous reporting of posterior odds and asymptotic &lt;i&gt;p&lt;/i&gt;-values.&lt;/li&gt;&lt;li&gt;We explore the method’s benefits – like&lt;i&gt; post-hoc&lt;/i&gt; variable selection – and limitations – like inflation – through a Mendelian Randomization study and detailed simulations, comparing Doublethink to Lasso, stepwise regression, the Benjamini-Hochberg procedure and &lt;i&gt;e&lt;/i&gt;-values.&lt;/li&gt;&lt;/ul&gt;&lt;/div&gt;&lt;div&gt;Besides the practical benefits of model-averaged hypothesis testing with frequentist guarantees, and the implications that entails for objective Bayesian hypothesis testing, these results offer fundamental insights likely to trigger renewed discussion of FDR, FWER and the reconcilability of &lt;i&gt;p&lt;/i&gt;-values with evidence.&lt;/div&gt;&lt;div&gt;&lt;br /&gt;&lt;/div&gt;&lt;div&gt;&lt;div&gt;Doublethink is a novel addition to the emerging class of heavy-tailed combination tests. Since 2019, methods like the Cauchy combination test and harmonic mean &lt;i&gt;p&lt;/i&gt;-value have surfaced as powerful tools for combining hypothesis tests despite inter-test dependence. Doublethink improves on these methods by allowing model uncertainty in the null hypothesis and by improving power.&lt;/div&gt;&lt;div&gt;&lt;br /&gt;&lt;/div&gt;&lt;div&gt;We believe this paper will be of broad interest, addressing questions of importance to statistical methodology, big data analysis and scientific enquiry more generally.&lt;/div&gt;&lt;/div&gt;&lt;h4 id=&quot;define-variables&quot; style=&quot;text-align: left;&quot;&gt;Explanation of variables above&lt;/h4&gt;&lt;div&gt;&lt;ul style=&quot;text-align: left;&quot;&gt;&lt;li&gt;The model-averaged &lt;i&gt;p&lt;/i&gt;-value, adjusted for multiple testing, is &lt;i&gt;p*&lt;/i&gt;.&lt;/li&gt;&lt;li&gt;The model-averaged posterior odds, calculated from a Bayesian analysis, is &lt;i&gt;PO&lt;/i&gt;.&lt;/li&gt;&lt;li&gt;The number of variables in the analysis is &lt;i&gt;ν&lt;/i&gt;.&lt;/li&gt;&lt;li&gt;The prior odds of including each variable are&amp;nbsp;&lt;i&gt;μ&lt;/i&gt;.&lt;/li&gt;&lt;li&gt;The sample size &lt;i&gt;n&lt;/i&gt; is represented by&amp;nbsp;&lt;i&gt;ξ&lt;sub&gt;n&lt;/sub&gt;&lt;/i&gt;, which decreases as&amp;nbsp;√&lt;i&gt;n&lt;/i&gt; increases.&lt;/li&gt;&lt;/ul&gt;&lt;/div&gt;</description><link>http://blog.danielwilson.me.uk/2025/05/doublethink-simultaneous-bayesian.html</link><author>noreply@blogger.com (Daniel Wilson)</author><media:thumbnail xmlns:media="http://search.yahoo.com/mrss/" url="https://blogger.googleusercontent.com/img/b/R29vZ2xl/AVvXsEiOwQIIOEMLlhoaase7IV3Zp98FXcWKlx-Om4jXd4BXGpcRY_j1Z7Uun8VSGUAEmAPIF03rCeDBCHMl356C3tpLhTiltJ4tF2U1Y18XF3Yb-50-zN1kV3GlM3T9zigM3srULvUUTvPKKHvUgWyLxxuSpnh4Sr3PvzGuhe_VRfQd8u_SMPtTUl3c/s72-w400-h53-c/Screenshot%202025-05-12%20at%2011.06.04.png" height="72" width="72"/><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-268474630859071129</guid><pubDate>Wed, 02 Apr 2025 10:14:00 +0000</pubDate><atom:updated>2025-04-02T05:14:04.363-05:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">Artificial intelligence</category><category domain="http://www.blogger.com/atom/ns#">Conference</category><category domain="http://www.blogger.com/atom/ns#">David Eyre</category><category domain="http://www.blogger.com/atom/ns#">Genomics</category><category domain="http://www.blogger.com/atom/ns#">Machine learning</category><category domain="http://www.blogger.com/atom/ns#">Microbiology</category><category domain="http://www.blogger.com/atom/ns#">Nicolas Arning</category><category domain="http://www.blogger.com/atom/ns#">Sam Sheppard</category><category domain="http://www.blogger.com/atom/ns#">Statistics</category><title>Machine Learning versus Statistical Inference in Microbial Genomics</title><description>My talk given today at the 2025 Microbiology Society Conference in Liverpool:

&lt;iframe width=&quot;686&quot; height=&quot;386&quot; src=&quot;https://www.youtube.com/embed/rLAFyZMieIs?t=11&quot; title=&quot;Machine Learning versus Statistical Inference in Microbial Genomics&quot; frameborder=&quot;0&quot; allow=&quot;accelerometer; autoplay; clipboard-write; encrypted-media; gyroscope; picture-in-picture; web-share&quot; referrerpolicy=&quot;strict-origin-when-cross-origin&quot; allowfullscreen&gt;&lt;/iframe&gt;

&lt;h3&gt;Abstract&lt;/h3&gt;
The advent of vast genomic datasets has transformed microbiology, presenting opportunities and challenges for data analysis. The distinct philosophies of machine learning (ML) and statistical inference gives them complementarity strengths and weaknesses in tackling big data problems in pathogen research. While statistical inference prioritizes understanding underlying relationships, ML focuses on optimizing predictive performance. In this talk I will contrast the approaches and offer a view on their relative utility for three problems: source attribution, bacterial genome-wide association studies, and predicting antimicrobial resistance phenotypes from whole genome sequences.
</description><link>http://blog.danielwilson.me.uk/2025/04/machine-learning-versus-statistical.html</link><author>noreply@blogger.com (Daniel Wilson)</author><media:thumbnail xmlns:media="http://search.yahoo.com/mrss/" url="https://img.youtube.com/vi/rLAFyZMieIs/default.jpg" height="72" width="72"/><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-2544548877614125369</guid><pubDate>Fri, 15 Nov 2024 12:07:00 +0000</pubDate><atom:updated>2024-11-15T06:08:08.565-06:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">Harmonic mean p-value</category><title>What Google AI thinks about the harmonic mean p-value method.</title><description>&lt;p&gt;Thanks to Jeff Chen who asked Google NotebookLM to produce this radio-style audio description of the harmonic mean &lt;i&gt;p&lt;/i&gt;-value paper: &lt;a href=&quot;https://github.com/danny-wilson/danny-wilson.github.io/raw/657c80714f237d31f86159a4d02999296e112d49/files/hmp-google-notebooklm.m4a&quot;&gt;hmp-google-notebooklm.m4a&lt;/a&gt;&lt;/p&gt;</description><link>http://blog.danielwilson.me.uk/2024/11/what-google-ai-thinks-about-harmonic.html</link><author>noreply@blogger.com (Daniel Wilson)</author><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-7345585506632115195</guid><pubDate>Tue, 30 Jul 2024 03:40:00 +0000</pubDate><atom:updated>2024-07-29T22:40:46.910-05:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">Doublethink</category><category domain="http://www.blogger.com/atom/ns#">FDR</category><category domain="http://www.blogger.com/atom/ns#">FWER</category><category domain="http://www.blogger.com/atom/ns#">Helen Fryer</category><category domain="http://www.blogger.com/atom/ns#">Nicolas Arning</category><category domain="http://www.blogger.com/atom/ns#">Statistics</category><title>Doublethink methods paper</title><description>&lt;p&gt;Today we release the first full draft of the &lt;a href=&quot;https://www.danielwilson.me.uk/abstracts/fryer_etal_2024.html&quot;&gt;Doublethink methods paper&lt;/a&gt;. This is an evolution of what was originally conceived as the supplement to the &lt;a href=&quot;https://www.danielwilson.me.uk/abstracts/arning_etal_2024.html&quot;&gt;Doublethink COVID-19 paper&lt;/a&gt;. The wider significance of the results persuaded us to separate the two, which now focus on:&lt;/p&gt;&lt;p&gt;&lt;/p&gt;&lt;ul style=&quot;text-align: left;&quot;&gt;&lt;li&gt;&lt;b&gt;Doublethink methods paper:&lt;/b&gt; Broad connections between Bayesian and classical hypothesis testing that we hope bring the best of both world by enabling scientists to simultaneously control the Bayesian false discovery rate and the classical familywise error rate, in big data settings.&lt;/li&gt;&lt;li&gt;&lt;b&gt;Doublethink COVID-19 paper:&lt;/b&gt; Identifying direct risk factors for COVID-19 hospitalization among 2000 candidate variables in 200,000 UK Biobank participants. Compares results to the literature and considers the limitations imposed by mediation and complex &#39;exposome-wide&#39; association studies.&lt;/li&gt;&lt;/ul&gt;&lt;div&gt;After soliciting colleagues for comments and another round of editing, we will move toward submission in later this year.&lt;/div&gt;&lt;p&gt;&lt;/p&gt;</description><link>http://blog.danielwilson.me.uk/2024/07/doublethink-methods-paper.html</link><author>noreply@blogger.com (Daniel Wilson)</author><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-369236332749138269</guid><pubDate>Tue, 23 Jan 2024 16:09:00 +0000</pubDate><atom:updated>2024-01-23T10:09:08.547-06:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">Antimicrobial resistance</category><category domain="http://www.blogger.com/atom/ns#">Festival of Genomics</category><category domain="http://www.blogger.com/atom/ns#">GWAS</category><category domain="http://www.blogger.com/atom/ns#">Mycobacterium tuberculosis</category><category domain="http://www.blogger.com/atom/ns#">Staphylococcus aureus</category><category domain="http://www.blogger.com/atom/ns#">Virulogenomics</category><title>Festival of Genomics 2024</title><description>&lt;p&gt;I will be talking at the Festival of Genomics on Wednesday 24 January about Identifying virulence and antimicrobial resistance genes in bacterial using genome-wide association studies. You can preview my talk here.&lt;/p&gt;

&lt;iframe allow=&quot;autoplay&quot; allowfullscreen=&quot;&quot; aria-label=&quot;Panopto Embedded Video Player&quot; height=&quot;405&quot; src=&quot;https://ox.cloud.panopto.eu/Panopto/Pages/Embed.aspx?id=5b7e6857-42a1-492f-8453-b10000f2bdb3&amp;amp;autoplay=false&amp;amp;offerviewer=true&amp;amp;showtitle=true&amp;amp;showbrand=true&amp;amp;captions=false&amp;amp;interactivity=all&quot; style=&quot;border: 1px solid #464646;&quot; width=&quot;720&quot;&gt;&lt;/iframe&gt;
</description><link>http://blog.danielwilson.me.uk/2024/01/festival-of-genomics-2024.html</link><author>noreply@blogger.com (Daniel Wilson)</author><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-2940722230892843044</guid><pubDate>Wed, 03 Jan 2024 14:18:00 +0000</pubDate><atom:updated>2024-01-03T10:13:50.358-06:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">COVID-19</category><category domain="http://www.blogger.com/atom/ns#">Doublethink</category><category domain="http://www.blogger.com/atom/ns#">FDR</category><category domain="http://www.blogger.com/atom/ns#">FWER</category><category domain="http://www.blogger.com/atom/ns#">Helen Fryer</category><category domain="http://www.blogger.com/atom/ns#">Nicolas Arning</category><category domain="http://www.blogger.com/atom/ns#">UK Biobank</category><title>Introducing Doublethink: joint Bayesian-frequentist model-averaged hypothesis testing</title><description>&lt;p&gt;This week Nick Arning, Helen Fryer and I released two related preprints describing a new method called Doublethink, and its application to identifying risk factors for COVID-19 hospitalization in UK Biobank:&lt;/p&gt;&lt;p&gt;&lt;/p&gt;&lt;ul style=&quot;text-align: left;&quot;&gt;&lt;li&gt;&lt;a href=&quot;https://www.danielwilson.me.uk/abstracts/fryer_etal_2024.html&quot;&gt;Doublethink: simultaneous Bayesian-frequentist model-averaged hypothesis testing&lt;/a&gt;. Fryer, Arning, Wilson (2023)&amp;nbsp;&lt;i&gt;arXiv&lt;/i&gt;&amp;nbsp;&lt;b&gt;doi&lt;/b&gt;: 10.48550/arXiv.2312.17566&lt;/li&gt;&lt;/ul&gt;&lt;ul style=&quot;text-align: left;&quot;&gt;&lt;li&gt;&lt;a href=&quot;https://www.danielwilson.me.uk/abstracts/arning_etal_2024.html&quot;&gt;Identifying direct risk factors in UK Biobank with simultaneous Bayesian-frequentist model-averaged hypothesis testing using Doublethink&lt;/a&gt;. Arning, Fryer, Wilson (2024)&amp;nbsp;&lt;i&gt;medRxiv&lt;/i&gt; &lt;b&gt;doi&lt;/b&gt;: 10.1101/2024.01.01.24300687&lt;/li&gt;&lt;/ul&gt;&lt;h4 style=&quot;text-align: left;&quot;&gt;Doublethink: Bayesian-frequentist model-averaged hypothesis testing&lt;/h4&gt;&lt;div&gt;Doublethink enables joint Bayesian and frequentist hypothesis testing when there is model uncertainty by interconverting Bayesian posterior odds and classical (frequentist)&amp;nbsp;&lt;i&gt;p&lt;/i&gt;-values. It has broad implications because (i) it reveals connections between the Bayesian approach to model averaging and the classical approach to multiple testing, and (ii) it brings the benefits of Bayesian model averaging to classical statistics.&lt;/div&gt;&lt;div&gt;Doublethink addresses two fundamental problems in hypothesis testing:&lt;/div&gt;&lt;div&gt;&lt;ol style=&quot;text-align: left;&quot;&gt;&lt;li&gt;In classical tests, the statistical evidence that one variable directly affects an outcome generally depends on which other variables are assumed to directly affect it.&lt;/li&gt;&lt;li&gt;In Bayesian tests, the statistical evidence that one variable directly affects an outcome depends on the prior assumptions.&lt;/li&gt;&lt;/ol&gt;&lt;/div&gt;&lt;div&gt;These issues are addressed by computing &lt;i&gt;p&lt;/i&gt;-values from Bayesian model-averaged posterior odds, which (1) account for model uncertainty and (2) are theoretically invariant to prior assumptions, assuming large sample sizes.&lt;/div&gt;&lt;div&gt;Doublethink simultaneously controls the frequentist family-wise error rate (&lt;a href=&quot;https://en.wikipedia.org/wiki/Family-wise_error_rate&quot;&gt;FWER&lt;/a&gt;) and the Bayesian false discovery rate (&lt;a href=&quot;https://doi.org/10.1214/009053606000001460&quot;&gt;FDR&lt;/a&gt;). It builds on &lt;a href=&quot;https://web.stat.tamu.edu/~vjohnson/&quot;&gt;Johnson&#39;s&lt;/a&gt; Bayesian tests based on likelihood ratio statistics, and &lt;a href=&quot;https://en.wikipedia.org/wiki/Jovan_Karamata&quot;&gt;Karamata&#39;s&lt;/a&gt; theory of regular variation.&lt;/div&gt;&lt;div&gt;&lt;h4&gt;Identifying direct risk factors in UK Biobank with Doublethink&lt;/h4&gt;&lt;/div&gt;&lt;div&gt;We applied Doublethink to identify direct risk factors for COVID-19 hospitalization in UK Biobank. This is a well-studied problem but we took an &#39;exposome-wide&#39; approach in which we evaluated whether 1,900 variables measured in the UK Biobank each affected the outcome. This is still an under-utilized approach in epidemiology, which usually focuses on candidate risk factors.&lt;/div&gt;&lt;div&gt;Exposome-wide approaches have potential benefits over candidate risk factor approaches, including:&lt;/div&gt;&lt;div&gt;&lt;ul style=&quot;text-align: left;&quot;&gt;&lt;li&gt;The ability to discover unexpected results.&lt;/li&gt;&lt;li&gt;Stringent control for multiple testing.&lt;/li&gt;&lt;li&gt;Avoidance of bias in choosing candidate risk factors or deciding to publish.&lt;/li&gt;&lt;/ul&gt;&lt;div&gt;However, we only studied the direct effects of variables on the outcome. This means we cannot make statements about the total (direct and indirect) effects of a variable, e.g. smoking, on the outcome, which are needed in applications like assessing potential interventions.&lt;/div&gt;&lt;/div&gt;&lt;div&gt;We identified individual variables and groups of variables that were &#39;exposome-wide significant&#39; at 9% FDR and 0.05% FWER, after accounting for the direct effects of all other variables.&lt;/div&gt;&lt;div&gt;&lt;br /&gt;&lt;/div&gt;&lt;div class=&quot;separator&quot; style=&quot;clear: both; text-align: center;&quot;&gt;&lt;a href=&quot;https://blogger.googleusercontent.com/img/b/R29vZ2xl/AVvXsEgUyXxGT1JLVehheG2OWFrVHIbMOuvchxQK8bLZDVbxZbZwRI6xywNBJUOdX7wKT_r1fCfT13ukaWJdoiuBoDTt4TpQLZLIY-ZHfZFQ1YsgpDklQbUD98g-ThFM9Y83Tcc6hyuLCdBoWn-lXK1SRtG1XY-7dNcBMZKcX3qPKXHlPmVprv0agrzW/s1092/Figure1.png&quot; style=&quot;margin-left: 1em; margin-right: 1em;&quot;&gt;&lt;img border=&quot;0&quot; data-original-height=&quot;590&quot; data-original-width=&quot;1092&quot; height=&quot;346&quot; src=&quot;https://blogger.googleusercontent.com/img/b/R29vZ2xl/AVvXsEgUyXxGT1JLVehheG2OWFrVHIbMOuvchxQK8bLZDVbxZbZwRI6xywNBJUOdX7wKT_r1fCfT13ukaWJdoiuBoDTt4TpQLZLIY-ZHfZFQ1YsgpDklQbUD98g-ThFM9Y83Tcc6hyuLCdBoWn-lXK1SRtG1XY-7dNcBMZKcX3qPKXHlPmVprv0agrzW/w640-h346/Figure1.png&quot; width=&quot;640&quot; /&gt;&lt;/a&gt;&lt;/div&gt;&lt;div&gt;Comparing our results to over 100 published studies of COVID-19 in UK Biobank, we&lt;/div&gt;&lt;div&gt;&lt;ul style=&quot;text-align: left;&quot;&gt;&lt;li&gt;Recapitulated several commonly reported direct risk factors, e.g. age, sex, and obesity.&lt;/li&gt;&lt;li&gt;Excluded others, e.g. diabetes, cardiovascular disease, and hypertension, which might be mediated through other variables that measure general comorbidity.&lt;/li&gt;&lt;li&gt;Identified some infrequently reported direct risk factors, both individually, e.g. lung infection, and as groups, e.g. constipation/urinary tract infection, which might reflect underlying kidney disease.&lt;/li&gt;&lt;/ul&gt;&lt;/div&gt;&lt;div&gt;The ability to test groups of variables, which increases sensitivity, was one of the benefits of Doublethink&#39;s model-averaging approach. It is particularly helpful in large biobanks that measure thousands of variables, because correlation between variables is pervasive, and can dilute the significance of individual variables that measure similar phenomena, like the numerous types of deprivation index. It serves as a flexible alternative to pre-analysis variable filtering algorithms, while controlling the risk of false positives by pre-defining significance thresholds for all possible tests.&lt;/div&gt;&lt;div&gt;To read more, please check out the preprints&amp;nbsp;&lt;a href=&quot;https://www.danielwilson.me.uk/abstracts/fryer_etal_2024.html&quot;&gt;here&lt;/a&gt;&amp;nbsp;and&amp;nbsp;&lt;a href=&quot;https://www.danielwilson.me.uk/abstracts/arning_etal_2024.html&quot;&gt;here&lt;/a&gt;.&lt;/div&gt;&lt;p&gt;&lt;/p&gt;</description><link>http://blog.danielwilson.me.uk/2024/01/introducing-doublethink-joint-bayesian.html</link><author>noreply@blogger.com (Daniel Wilson)</author><media:thumbnail xmlns:media="http://search.yahoo.com/mrss/" url="https://blogger.googleusercontent.com/img/b/R29vZ2xl/AVvXsEgUyXxGT1JLVehheG2OWFrVHIbMOuvchxQK8bLZDVbxZbZwRI6xywNBJUOdX7wKT_r1fCfT13ukaWJdoiuBoDTt4TpQLZLIY-ZHfZFQ1YsgpDklQbUD98g-ThFM9Y83Tcc6hyuLCdBoWn-lXK1SRtG1XY-7dNcBMZKcX3qPKXHlPmVprv0agrzW/s72-w640-h346-c/Figure1.png" height="72" width="72"/><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-2446431935516555799</guid><pubDate>Wed, 28 Sep 2022 13:38:00 +0000</pubDate><atom:updated>2022-09-28T08:41:00.510-05:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">Continuing Education</category><category domain="http://www.blogger.com/atom/ns#">COVID-19</category><category domain="http://www.blogger.com/atom/ns#">Talk</category><title>Rewley House Lecture: Role of data science in the pandemic</title><description>&lt;p&gt;This year I was invited to give the &lt;a href=&quot;https://www.conted.ox.ac.uk/about/rewley-house-lecture-series&quot;&gt;Rewley House Lecture&lt;/a&gt;, a multidisciplinary research talk open to all, at the &lt;a href=&quot;https://www.conted.ox.ac.uk&quot;&gt;Department for Continuing Education&lt;/a&gt;, where I am Director of Studies in &lt;a href=&quot;https://www.conted.ox.ac.uk/about/computing-and-mathematics-and-data-science&quot;&gt;Data Science&lt;/a&gt;.&lt;/p&gt;&lt;p&gt;I talked about how data science has been used during the COVID-19 pandemic, spanning vaccine design, clinical trials, surveillance and policy advice, and highlighting the identification of risk factors for disease.&lt;/p&gt;&lt;p&gt;If you like this talk, you might be interested in the following courses available this academic year:&lt;/p&gt;&lt;p&gt;&lt;/p&gt;&lt;ul style=&quot;text-align: left;&quot;&gt;&lt;li&gt;&lt;a href=&quot;https://www.conted.ox.ac.uk/courses/infectious-disease-modelling-mathematical-techniques?code=O22P764COW&quot;&gt;Infectious Disease Modelling: Mathematical Techniques&lt;/a&gt;&amp;nbsp;(September 2022)&lt;/li&gt;&lt;li&gt;&lt;a href=&quot;https://www.conted.ox.ac.uk/courses/infectious-disease-modelling-applied-methods-in-r?code=O22P771COW&quot;&gt;Infectious Disease Modelling: Applied Methods in R&lt;/a&gt;&amp;nbsp;(January 2023)&lt;/li&gt;&lt;li&gt;&lt;a href=&quot;https://www.conted.ox.ac.uk/courses/pandemic-data-science?code=O22P781COW&quot;&gt;Pandemic Data Science&lt;/a&gt;&amp;nbsp;(April 2023)&lt;/li&gt;&lt;/ul&gt;&lt;p&gt;&lt;/p&gt;&lt;div class=&quot;separator&quot; style=&quot;clear: both; text-align: center;&quot;&gt;&lt;iframe allowfullscreen=&quot;&quot; class=&quot;BLOG_video_class&quot; height=&quot;359&quot; src=&quot;https://www.youtube.com/embed/pfqh3pdcF-0&quot; width=&quot;479&quot; youtube-src-id=&quot;pfqh3pdcF-0&quot;&gt;&lt;/iframe&gt;&lt;/div&gt;&lt;br /&gt;</description><link>http://blog.danielwilson.me.uk/2022/09/rewley-house-lecture-role-of-data.html</link><author>noreply@blogger.com (Daniel Wilson)</author><media:thumbnail xmlns:media="http://search.yahoo.com/mrss/" url="https://img.youtube.com/vi/pfqh3pdcF-0/default.jpg" height="72" width="72"/><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-3097086397686886467</guid><pubDate>Thu, 25 Aug 2022 15:37:00 +0000</pubDate><atom:updated>2022-08-25T10:37:47.136-05:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">Antibiotics</category><category domain="http://www.blogger.com/atom/ns#">Antimicrobial resistance</category><category domain="http://www.blogger.com/atom/ns#">Bill &amp; Melinda Gates Foundation</category><category domain="http://www.blogger.com/atom/ns#">CRyPTIC</category><category domain="http://www.blogger.com/atom/ns#">MRC</category><category domain="http://www.blogger.com/atom/ns#">Newton Fund</category><category domain="http://www.blogger.com/atom/ns#">PLoS Biology</category><category domain="http://www.blogger.com/atom/ns#">Wellcome Trust</category><title>Identifying resistance genes in tuberculosis</title><description>&lt;p&gt;Newly published in &lt;a href=&quot;https://journals.plos.org/plosbiology/article?id=10.1371/journal.pbio.3001755&quot;&gt;&lt;i&gt;PLOS Biology&lt;/i&gt; is our work identifying genes that confer resistance to common and last-resort antibiotics&lt;/a&gt; in bacteria that cause tuberculosis. Resistance to these drugs contributes to mortality and sickness on a pandemic scale every year, and disproportionately affects the poorest people in the world.&lt;/p&gt;&lt;p&gt;This new article is one of a series presenting results generated by more than 100 scientists across 23 countries across 5+ years as part of a collaboration called &lt;a href=&quot;http://www.crypticproject.org&quot;&gt;CRyPTIC&lt;/a&gt;.&lt;/p&gt;&lt;p&gt;Our role in CRyPTIC&amp;nbsp;was the discovery of genes and mutations likely to cause drug resistance by applying a tool known as a genome-wide association study (GWAS), an approach we&amp;nbsp;&lt;a href=&quot;http://blog.danielwilson.me.uk/2016/04/making-most-of-bacterial-gwas-new-paper.html&quot;&gt;helped adapt to bacteria&lt;/a&gt;.&lt;/p&gt;&lt;p&gt;Using GWAS, we identified previously uncatalogued genes and mutations underlying resistance to every one of the 13 drugs we investigated. These include new and repurposed drugs, as well as the first- and second-line drugs more often used to treat tuberculosis.&lt;/p&gt;&lt;p&gt;Thanks to its generous funders, CRyPTIC dedicated scale (10,000+ genomes) and technical innovation (new high-throughput MIC assays) to help decode the DNA blueprint of antibiotic resistance. Pushing these boundaries has yielded a steep increase of up to 36% in the variation in resistance attributable to the genome for the important and previously understudied new and repurposed drugs.&lt;/p&gt;&lt;p&gt;Science at this scale can produce a seemingly overwhelming wealth of new information. We avoided the temptation to over-emphasize any individual result for the sake of simple narrative. Instead, we highlighted discoveries of uncatalogued genes or genetic variants that we found for every drug investigated:&lt;/p&gt;&lt;p&gt;•&lt;span class=&quot;Apple-tab-span&quot; style=&quot;white-space: pre;&quot;&gt;	&lt;/span&gt;The amidase AmiA2 and GTPase Era for bedaquiline.&lt;/p&gt;&lt;p&gt;•&lt;span class=&quot;Apple-tab-span&quot; style=&quot;white-space: pre;&quot;&gt;	&lt;/span&gt;The cytochrome P450 enzyme Cyp142 for clofazimine.&lt;/p&gt;&lt;p&gt;•&lt;span class=&quot;Apple-tab-span&quot; style=&quot;white-space: pre;&quot;&gt;	&lt;/span&gt;The serine/threonine protein kinase PknH for delaminid.&lt;/p&gt;&lt;p&gt;•&lt;span class=&quot;Apple-tab-span&quot; style=&quot;white-space: pre;&quot;&gt;	&lt;/span&gt;The antitoxin VapB20 for linezolid.&lt;/p&gt;&lt;p&gt;•&lt;span class=&quot;Apple-tab-span&quot; style=&quot;white-space: pre;&quot;&gt;	&lt;/span&gt;The PPE-motif family outer membrane protein PPE42 for amikacin and kanamycin.&lt;/p&gt;&lt;p&gt;•&lt;span class=&quot;Apple-tab-span&quot; style=&quot;white-space: pre;&quot;&gt;	&lt;/span&gt;The antibiotic-induced transcriptional regulator WhiB7 for ethionamide.&lt;/p&gt;&lt;p&gt;•&lt;span class=&quot;Apple-tab-span&quot; style=&quot;white-space: pre;&quot;&gt;	&lt;/span&gt;The rRNA methylase TlyA for levofloxacin.&lt;/p&gt;&lt;p&gt;•&lt;span class=&quot;Apple-tab-span&quot; style=&quot;white-space: pre;&quot;&gt;	&lt;/span&gt;The DNA gyrase subunit B GyrB for moxifloxacin.&lt;/p&gt;&lt;p&gt;•&lt;span class=&quot;Apple-tab-span&quot; style=&quot;white-space: pre;&quot;&gt;	&lt;/span&gt;The putative rhodaneses CysA2 and CysA3 for rifabutin.&lt;/p&gt;&lt;p&gt;•&lt;span class=&quot;Apple-tab-span&quot; style=&quot;white-space: pre;&quot;&gt;	&lt;/span&gt;The tRNA/rRNA methylase SpoU for ethambutol and rifampicin.&lt;/p&gt;&lt;p&gt;•&lt;span class=&quot;Apple-tab-span&quot; style=&quot;white-space: pre;&quot;&gt;	&lt;/span&gt;The multidrug efflux transport system repressor Rv1219 for isoniazid.&lt;/p&gt;&lt;p&gt;All these hits passed stringent evidence thresholds that take into account the large amount of data crunched. For each hit, we identified possible relationships between gene functions, such as they are known, and the mechanism of action of the antibiotics.&lt;/p&gt;&lt;p&gt;Beyond the biological discoveries of primary interest, this new paper unveils methodological advances in bacterial GWAS. We introduced a systematic, whole-genome approach to analysing not just short DNA sequences (so called oligonucleotide or “kmer”-based approaches), but also short sequences of the proteins that the DNA codes for (an oligopeptide-based approach). We have released our software on an &lt;a href=&quot;https://github.com/danny-wilson/kmer_pipeline&quot;&gt;open-source GitHub repository&lt;/a&gt;.&lt;/p&gt;&lt;p&gt;We also discovered a relationship that may help disentangle a technical issue in bacterial GWAS where the co-occurence of traits can trick us into thinking that a gene influences one trait when it influences another instead. For antimicrobial resistance, this issue is known as artefactual cross resistance. We observed that true associations tended to produce larger associations (as measured by the &#39;coefficient&#39;, rather than the &lt;i&gt;p&lt;/i&gt;-value), providing a possible way to prioritize signals in the future.&lt;/p&gt;&lt;p&gt;This paper was published alongside the CRyPTIC &lt;a href=&quot;https://journals.plos.org/plosbiology/article?id=10.1371/journal.pbio.3001721&quot;&gt;Data Compendium in &lt;i&gt;PLOS Biology&lt;/i&gt;&lt;/a&gt;, in which we released our data open source to the community, with resources provided by the &lt;a href=&quot;http://ftp.ebi.ac.uk/pub/databases/cryptic/release_june2022/&quot;&gt;European Bioinformatics Institute&lt;/a&gt;.&lt;/p&gt;&lt;p&gt;Some of the results of CRyPTIC have already been rushed into service by the &lt;a href=&quot;https://www.who.int/publications/i/item/9789240028173&quot;&gt;World Health Organization&lt;/a&gt; on the grounds of exceptional importance based on a candidate gene approach; this includes the DNA gyrase subunit B – moxifloxacin association spotlighted above (&lt;a href=&quot;https://www.thelancet.com/journals/lanmic/article/PIIS2666-5247(21)00301-3/fulltext&quot;&gt;Walker et al 2022&lt;/a&gt;). However, the new results go beyond a candidate gene approach, detecting a range of previously uncatalogued genes via its agnostic, whole-genome strategy.&lt;/p&gt;&lt;p&gt;Unpicking the genetics of antimicrobial resistance is a priority for improving rapid susceptibility tests for individual patients, selecting drug regimens that inhibit the evolution of multidrug resistance, and developing improved treatment options. The need is particularly great in &lt;i&gt;M. tuberculosis&lt;/i&gt;, which killed 1.4 million people in 2019, owing to the slow (6-12 week) turnaround of traditional susceptibility testing, and the alarming threat of multidrug resistant tuberculosis. The discovery of many new candidate resistance variants therefore represents an advance that we hope will contribute to progress in reducing the burden of disease.&lt;/p&gt;</description><link>http://blog.danielwilson.me.uk/2022/08/identifying-resistance-genes-in.html</link><author>noreply@blogger.com (Daniel Wilson)</author><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-5032409258565440721</guid><pubDate>Wed, 23 Feb 2022 09:20:00 +0000</pubDate><atom:updated>2022-02-23T03:20:36.085-06:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">Big Data Institute</category><category domain="http://www.blogger.com/atom/ns#">Genomics</category><category domain="http://www.blogger.com/atom/ns#">Infection</category><category domain="http://www.blogger.com/atom/ns#">Postdoc</category><category domain="http://www.blogger.com/atom/ns#">Recruitment</category><category domain="http://www.blogger.com/atom/ns#">Statistics</category><title>Seeking Postdoc in Statistical Genetics and Infectious Disease</title><description>&lt;p&gt;I am seeking a &lt;a href=&quot;https://my.corehr.com/pls/uoxrecruit/erq_jobspec_version_4.display_form?p_company=10&amp;amp;p_internal_external=E&amp;amp;p_display_in_irish=N&amp;amp;p_process_type=&amp;amp;p_applicant_no=&amp;amp;p_form_profile_detail=&amp;amp;p_display_apply_ind=Y&amp;amp;p_refresh_search=Y&amp;amp;p_recruitment_id=156258&quot;&gt;senior postdoc in Statistical Genetics and Infectious Disease&lt;/a&gt; to join my research group at the Big Data Institute, University of Oxford. Our research into Infectious Disease Genomics is focused on developing and applying big data methods to identify genetic risk factors for disease, both microbial virulence factors and human susceptibility genes. We are focused on a range of bacterial and viral diseases including staphylococcal sepsis and COVID-19.&lt;/p&gt;&lt;p&gt;The &lt;a href=&quot;https://www.bdi.ox.ac.uk&quot;&gt;Big Data Institute&lt;/a&gt;, part of &lt;a href=&quot;https://www.ndph.ox.ac.uk&quot;&gt;Oxford Population Health&lt;/a&gt;, provides an excellent environment for multi-disciplinary research and teaching. Situated on the modern Old Road Campus in the heart of the medical sciences neighbourhood of Headington, we benefit from outstanding facilities and opportunities to collaborate with world-leading scientists and clinicians to help expand knowledge and improve global health.&lt;/p&gt;&lt;p&gt;As a Senior Postdoc the post-holder will work closely with me to jointly lead the implementation, design and application of new statistical tools for genome-wide association studies, and to lead the biological interpretation of key findings. They will develop novel methodologies for analysis and data collection, take the lead in the production of scientific reports and publications and supervise junior group members.&lt;/p&gt;&lt;p&gt;To be considered applicants will have a PhD and post-doctoral experience in a relevant subject, with direct experience in statistical genetics, demonstrable expertise and knowledge of the statistical genetics literature or a closely related, relevant discipline and a publication record as first author, in statistical genetics.&lt;/p&gt;&lt;p&gt;The position is full time (part time considered) and fixed-term for 3 years.&lt;/p&gt;&lt;p&gt;&lt;b&gt;The closing date for application is 12.00 noon GMT on 18th March.&lt;/b&gt;&lt;/p&gt;&lt;div&gt;&lt;a href=&quot;https://my.corehr.com/pls/uoxrecruit/erq_jobspec_version_4.display_form?p_company=10&amp;amp;p_internal_external=E&amp;amp;p_display_in_irish=N&amp;amp;p_process_type=&amp;amp;p_applicant_no=&amp;amp;p_form_profile_detail=&amp;amp;p_display_apply_ind=Y&amp;amp;p_refresh_search=Y&amp;amp;p_recruitment_id=156258&quot;&gt;Click here&lt;/a&gt; for more information including how to apply.&lt;/div&gt;</description><link>http://blog.danielwilson.me.uk/2022/02/seeking-postdoc-in-statistical-genetics.html</link><author>noreply@blogger.com (Daniel Wilson)</author><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-7010064572816128856</guid><pubDate>Wed, 23 Feb 2022 08:09:00 +0000</pubDate><atom:updated>2022-02-23T02:13:31.292-06:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">Statistical Genomics Summer School</category><category domain="http://www.blogger.com/atom/ns#">Teaching</category><title>Announcing the Oxford Statistical Genomics Summer School 2022</title><description>&lt;p&gt;Join us at St Hilda&#39;s College Oxford, overlooking the River Cherwell and Christ Church Meadow, for an &lt;a href=&quot;https://www.conted.ox.ac.uk/courses/oxford-statistical-genomics-summer-school?code=O22I410SGS&quot;&gt;immersive week-long residential post-graduate summer school on Statistical Genomics&lt;/a&gt;&amp;nbsp;on 19th-24th June 2022. This course aims to connect post-graduate and post-doctoral researchers from academia and industry with experts at Oxford&#39;s Big Data Institute, Wellcome Centre for Human Genetics, and Department of Statistics.&lt;/p&gt;&lt;p&gt;Our friendly tutors, internationally recognised for their scientific expertise, will offer specialist instruction and hands-on computer practicals across five broad areas of Statistical Genomics: Next-generation Sequence Data Analysis, Gene and Variant Association Testing, Genomics of Infectious Diseases, Genealogical Inference and Analysis, and Medical Genomics.&lt;/p&gt;&lt;p&gt;The course is aimed at trainee scientists actively engaged in statistical genomics research, who wish to expand their knowledge of concepts and techniques.&lt;/p&gt;&lt;p&gt;&lt;a href=&quot;https://www.conted.ox.ac.uk/courses/oxford-statistical-genomics-summer-school?code=O22I410SGS&quot;&gt;Click here&lt;/a&gt; for more information including how to apply.&lt;/p&gt;&lt;div class=&quot;separator&quot; style=&quot;clear: both; text-align: center;&quot;&gt;&lt;a href=&quot;https://blogger.googleusercontent.com/img/a/AVvXsEhn5TnR6c7bDg8zHztc5MZna6-FRartPmbVKbyKiDW5x2yT0GHDiAIRzajelH-4A5gWoMkhxn6Uc2f9rAVsrKFbgAvXm3paPAYh25iNg26n7sBHURyBIrqnWaNTL0BJignTqcW0hu3tJYORqnrLRc7cIhIBAPRKBs1a25iATiCz33TMRys8AA=s1600&quot; style=&quot;margin-left: 1em; margin-right: 1em;&quot;&gt;&lt;img border=&quot;0&quot; data-original-height=&quot;1066&quot; data-original-width=&quot;1600&quot; height=&quot;426&quot; src=&quot;https://blogger.googleusercontent.com/img/a/AVvXsEhn5TnR6c7bDg8zHztc5MZna6-FRartPmbVKbyKiDW5x2yT0GHDiAIRzajelH-4A5gWoMkhxn6Uc2f9rAVsrKFbgAvXm3paPAYh25iNg26n7sBHURyBIrqnWaNTL0BJignTqcW0hu3tJYORqnrLRc7cIhIBAPRKBs1a25iATiCz33TMRys8AA=w640-h426&quot; width=&quot;640&quot; /&gt;&lt;/a&gt;&lt;/div&gt;&lt;br /&gt;&lt;p&gt;&lt;br /&gt;&lt;/p&gt;</description><link>http://blog.danielwilson.me.uk/2022/02/announcing-oxford-statistical-genomics.html</link><author>noreply@blogger.com (Daniel Wilson)</author><media:thumbnail xmlns:media="http://search.yahoo.com/mrss/" url="https://blogger.googleusercontent.com/img/a/AVvXsEhn5TnR6c7bDg8zHztc5MZna6-FRartPmbVKbyKiDW5x2yT0GHDiAIRzajelH-4A5gWoMkhxn6Uc2f9rAVsrKFbgAvXm3paPAYh25iNg26n7sBHURyBIrqnWaNTL0BJignTqcW0hu3tJYORqnrLRc7cIhIBAPRKBs1a25iATiCz33TMRys8AA=s72-w640-h426-c" height="72" width="72"/><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-1439978819152502760</guid><pubDate>Wed, 26 Jan 2022 10:26:00 +0000</pubDate><atom:updated>2022-01-26T04:26:15.130-06:00</atom:updated><title>Postdoctoral and Ph.D. positions in the group</title><description>&lt;p&gt;If you are interested in joining the group, please contact me (&lt;a href=&quot;http://www.danielwilson.me.uk/contact.html&quot;&gt;details here&lt;/a&gt;) with a brief explanation and a copy of an up-to-date CV.&lt;/p&gt;</description><link>http://blog.danielwilson.me.uk/2022/01/postdoctoral-and-phd-positions-in-group.html</link><author>noreply@blogger.com (Daniel Wilson)</author><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-4829692579662920826</guid><pubDate>Tue, 25 Jan 2022 14:26:00 +0000</pubDate><atom:updated>2022-01-25T08:26:47.551-06:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">Conference</category><category domain="http://www.blogger.com/atom/ns#">GWAS</category><category domain="http://www.blogger.com/atom/ns#">Population Genetics</category><category domain="http://www.blogger.com/atom/ns#">ProbGen</category><category domain="http://www.blogger.com/atom/ns#">Selection</category><category domain="http://www.blogger.com/atom/ns#">Statistics</category><title>Announcing ProbGen22 in Oxford 28-30 March</title><description>&lt;p&gt;The organizing committee is pleased to announce the 7th Probabilistic Modeling in Genomics Conference (ProbGen22) to be held at the Blavatnik School of Government and Somerville College Oxford from 28th-30th March 2022.&lt;/p&gt;&lt;p&gt;The meeting will be a hybrid in-person and online event. Talk sessions will feature live speakers, both in-person and online, and will take place during the afternoons (making live attendance feasible for US timezones). Talks will be recorded and made available to registrants for a period of one month. Poster sessions will be held online during the evenings.&lt;/p&gt;&lt;p&gt;The conference will cover probabilistic models, algorithms, and statistical methods across a broad range of applications in genetics and genomics. We invite abstract submissions on a range of topics including population genetics, natural selection, Quantitative genetics, Methods for GWAS, Applications to cancer and other diseases, Causal inference in genetic studies, Functional genomics, Assembly and variant identification, Phylogenetics, Single cell &#39;omics, Deep learning in genomics and Pathogen genomics.&lt;/p&gt;&lt;p&gt;&lt;b&gt;The registration deadline is 28th February 2022.&lt;/b&gt;&lt;/p&gt;&lt;p&gt;For more details &lt;a href=&quot;https://probgen22.github.io&quot;&gt;visit the conference website.&lt;/a&gt;&amp;nbsp;&lt;/p&gt;</description><link>http://blog.danielwilson.me.uk/2022/01/announcing-probgen22-in-oxford-28-30.html</link><author>noreply@blogger.com (Daniel Wilson)</author><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-8367112291038402300</guid><pubDate>Tue, 07 Dec 2021 13:16:00 +0000</pubDate><atom:updated>2021-12-07T07:19:27.927-06:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">Big Data Institute</category><category domain="http://www.blogger.com/atom/ns#">Bioinformatics</category><category domain="http://www.blogger.com/atom/ns#">GWAS</category><category domain="http://www.blogger.com/atom/ns#">Postdoc</category><category domain="http://www.blogger.com/atom/ns#">Recruitment</category><category domain="http://www.blogger.com/atom/ns#">Statistics</category><title>Two new positions: Senior Statistical Geneticist and Bioinformatician</title><description>&lt;p&gt;Two new positions are available in my &lt;a href=&quot;http://www.danielwilson.me.uk/index.html&quot;&gt;Infectious Disease Genomics group&lt;/a&gt; at the Big Data Institute, University of Oxford.&lt;/p&gt;&lt;p&gt;A &lt;a href=&quot;https://my.corehr.com/pls/uoxrecruit/erq_jobspec_version_4.display_form?p_company=10&amp;amp;p_internal_external=E&amp;amp;p_display_in_irish=N&amp;amp;p_process_type=&amp;amp;p_applicant_no=&amp;amp;p_form_profile_detail=&amp;amp;p_display_apply_ind=Y&amp;amp;p_refresh_search=Y&amp;amp;p_recruitment_id=154256&quot;&gt;Senior Postdoctoral Statistical Geneticist&lt;/a&gt; to jointly lead the implementation, design and application of new statistical tools for genome-wide association studies, lead the biological interpretation of key findings, develop methodologies and supervise junior group members. This post would suit a candidate with a PhD and relevant post-doctoral experience including direct experience in statistical genetics. Candidates without post-doctoral experience may be considered for a less senior appointment.&lt;/p&gt;&lt;p&gt;A &lt;a href=&quot;https://my.corehr.com/pls/uoxrecruit/erq_jobspec_version_4.display_form?p_company=10&amp;amp;p_internal_external=E&amp;amp;p_display_in_irish=N&amp;amp;p_process_type=&amp;amp;p_applicant_no=&amp;amp;p_form_profile_detail=&amp;amp;p_display_apply_ind=Y&amp;amp;p_refresh_search=Y&amp;amp;p_recruitment_id=154255&quot;&gt;Bioinformatician&lt;/a&gt; to provide expertise for computationally intensive analyses including genome-wide association studies and RNAseq studies of differential gene expression, as well as contributing to informatics projects as part of a wider collaboration with national biomedical cohorts. This post would suit a candidate with either a post-graduate degree related to Bioinformatics, Statistics, and Computing or equivalent experience in industry.&lt;/p&gt;&lt;p&gt;The application deadline for both posts is Noon GMT on &lt;b&gt;Friday 7th January 2022&lt;/b&gt;.&lt;/p&gt;&lt;p&gt;&lt;/p&gt;</description><link>http://blog.danielwilson.me.uk/2021/12/two-new-positions-senior-statistical.html</link><author>noreply@blogger.com (Daniel Wilson)</author><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-6993243609130828138</guid><pubDate>Tue, 07 Dec 2021 12:08:00 +0000</pubDate><atom:updated>2021-12-07T06:14:18.672-06:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">Campylobacter jejuni</category><category domain="http://www.blogger.com/atom/ns#">David Clifton</category><category domain="http://www.blogger.com/atom/ns#">Machine learning</category><category domain="http://www.blogger.com/atom/ns#">Nicolas Arning</category><category domain="http://www.blogger.com/atom/ns#">PLoS Genetics</category><category domain="http://www.blogger.com/atom/ns#">Sam Sheppard</category><category domain="http://www.blogger.com/atom/ns#">Transmission</category><title>New paper: Machine learning to predict the source of campylobacteriosis using whole genome data</title><description>&lt;p&gt;This study, published in October in &lt;i&gt;&lt;a href=&quot;https://journals.plos.org/plosgenetics/article?id=10.1371/journal.pgen.1009436&quot;&gt;PLOS Genetics&lt;/a&gt;&lt;/i&gt;, brings together machine learning, large bacterial isolate collections and whole genome sequencing to address the general problem of how to trace the source of human infections.&lt;/p&gt;&lt;p&gt;Specifically, we investigated &lt;a href=&quot;https://en.wikipedia.org/wiki/Campylobacteriosis&quot;&gt;campylobacteriosis&lt;/a&gt;, a common infection of animal origin causing ~1.5 million cases of gastroenteritis and 10,000 hospitalizations every year in the United States alone. We show that our combined machine learning/genomics analyses:&lt;/p&gt;&lt;p&gt;&lt;/p&gt;&lt;ul style=&quot;text-align: left;&quot;&gt;&lt;li&gt;Improve the accuracy with which infections can be traced back to farm reservoirs.&lt;/li&gt;&lt;li&gt;Identify evolutionary shifts in bacterial affinity for livestock host species.&lt;/li&gt;&lt;li&gt;Detect changes in human infection capability within related strains.&lt;/li&gt;&lt;/ul&gt;&lt;p&gt;&lt;/p&gt;&lt;p&gt;These results will improve understanding not only of&lt;i&gt; Campylobacter&lt;/i&gt;, but more generally as these technologies can readily be applied to other important bacterial pathogen species.&lt;/p&gt;&lt;div class=&quot;separator&quot; style=&quot;clear: both; text-align: center;&quot;&gt;&lt;a href=&quot;https://journals.plos.org/plosgenetics/article?id=10.1371/journal.pgen.1009436&quot; style=&quot;margin-left: 1em; margin-right: 1em;&quot;&gt;&lt;img border=&quot;0&quot; data-original-height=&quot;1665&quot; data-original-width=&quot;1670&quot; height=&quot;319&quot; src=&quot;https://blogger.googleusercontent.com/img/a/AVvXsEg5IaGadnQr7wCxPK-m3PQk6YrGwI4n4WDEcPtLhsRrQvBZP3ovcq5uOI3M-pw78WS3niSIJd7rYeqH79D07-7DqRgO_DMOECY3Q04S2NotmlgqnlGCEprPF383hc0wTyVRdDPdhdxWLx85bQOa-Hxs97yi2yLh7_NymGNTZLrx1Y_nrqrDNw=s320&quot; width=&quot;320&quot; /&gt;&lt;/a&gt;&lt;/div&gt;&lt;p&gt;This paper builds on previous work published by the group, including our well cited &lt;i&gt;Tracing the source of campylobacteriosis&lt;/i&gt; (&lt;a href=&quot;https://journals.plos.org/plosgenetics/article?id=10.1371/journal.pgen.1000203&quot;&gt;Wilson et al 2008, &lt;i&gt;PLOS Genetics 4&lt;/i&gt;:e1000203&lt;/a&gt;). The use of these methods for tracing infection has influenced public health policy and &lt;a href=&quot;http://blog.danielwilson.me.uk/2009/11/campylobacter-source-attribution-in-new.html&quot;&gt;contributed to reducing disease burden&lt;/a&gt;.&lt;/p&gt;&lt;p&gt;This work demonstrates the potential for modern genomics and artificial intelligence approaches to address common and serious problems that affect our everyday lives. The awareness of the importance of infection to society has rarely been higher than in 2021, and while the current pandemic imposes an acute global problem, other infections continue to present long-term threats to health and productivity.&lt;/p&gt;&lt;div&gt;This work was led by &lt;a href=&quot;https://scholar.google.co.uk/citations?user=AJ3a3JkAAAAJ&amp;amp;hl=en&quot;&gt;Nicolas Arning&lt;/a&gt;, in collaboration with &lt;a href=&quot;https://eng.ox.ac.uk/people/david-clifton/&quot;&gt;David Clifton&lt;/a&gt; and &lt;a href=&quot;https://sheppardlab.com&quot;&gt;Sam Sheppard&lt;/a&gt;.&lt;/div&gt;&lt;div&gt;&lt;br /&gt;&lt;/div&gt;</description><link>http://blog.danielwilson.me.uk/2021/12/new-paper-machine-learning-to-predict.html</link><author>noreply@blogger.com (Daniel Wilson)</author><media:thumbnail xmlns:media="http://search.yahoo.com/mrss/" url="https://blogger.googleusercontent.com/img/a/AVvXsEg5IaGadnQr7wCxPK-m3PQk6YrGwI4n4WDEcPtLhsRrQvBZP3ovcq5uOI3M-pw78WS3niSIJd7rYeqH79D07-7DqRgO_DMOECY3Q04S2NotmlgqnlGCEprPF383hc0wTyVRdDPdhdxWLx85bQOa-Hxs97yi2yLh7_NymGNTZLrx1Y_nrqrDNw=s72-c" height="72" width="72"/><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-3849771563401722970</guid><pubDate>Tue, 07 Dec 2021 11:54:00 +0000</pubDate><atom:updated>2021-12-07T06:14:08.292-06:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">Antimicrobial resistance</category><category domain="http://www.blogger.com/atom/ns#">Bernadette Young</category><category domain="http://www.blogger.com/atom/ns#">GWAS</category><category domain="http://www.blogger.com/atom/ns#">Microbial Genomics</category><category domain="http://www.blogger.com/atom/ns#">Modernising Medical Microbiology</category><category domain="http://www.blogger.com/atom/ns#">Staphylococcus aureus</category><category domain="http://www.blogger.com/atom/ns#">Virulogenomics</category><title>New paper: Antimicrobial resistance determinants are associated with Staphylococcus aureus bacteraemia and adaptation to the healthcare environment</title><description>&lt;p&gt;&lt;i&gt;Staphylococcus aureus&lt;/i&gt;&amp;nbsp;is a leading cause of infectious disease deaths in all countries, with bloodstream infection leading to sepsis a major concern. This new study, published in November in &lt;i&gt;&lt;a href=&quot;https://www.microbiologyresearch.org/content/journal/mgen/10.1099/mgen.0.000700&quot;&gt;Microbial Genomics&lt;/a&gt;&lt;/i&gt;,&amp;nbsp;reports genes and genetic variants in &lt;i&gt;Staph.&amp;nbsp;aureus&lt;/i&gt; associated severe disease &lt;i&gt;vs&lt;/i&gt;&amp;nbsp;asymptomatic carriage, and healthcare &lt;i&gt;vs&lt;/i&gt;&amp;nbsp;community carriage.&lt;/p&gt;&lt;p&gt;Our genome-wide association study of 2000 bacterial genomes showed that antibiotic resistance in &lt;i&gt;Staph. aureus&lt;/i&gt; is associated with severe disease and the hospital environment:&lt;/p&gt;&lt;p&gt;&lt;/p&gt;&lt;ul style=&quot;text-align: left;&quot;&gt;&lt;li&gt;A mutation conferring trimethoprim resistance (&lt;i&gt;dfrB&amp;nbsp;&lt;/i&gt;F99Y) and the presence of a gene conferring methicillin resistance (&lt;i&gt;mecA&lt;/i&gt;) were both associated with bloodstream infection &lt;i&gt;vs&lt;/i&gt;&amp;nbsp;asymptomatic nose carriage.&lt;/li&gt;&lt;li&gt;Separately, we demonstrated that a mutation conferring fluoroquinolone resistance (&lt;i&gt;gyrA&lt;/i&gt;&amp;nbsp;L84S) and variation in a gene involved in resistance to multiple antibiotics (&lt;i&gt;prsA&lt;/i&gt;) were preferentially associated with healthcare-associated carriage&amp;nbsp;&lt;i&gt;vs&lt;/i&gt; community-acquired carriage.&lt;/li&gt;&lt;/ul&gt;&lt;p&gt;&lt;/p&gt;&lt;div&gt;The implication – that antibiotic resistance genes may provide survival advantages which mechanistically contribute to the development of disease – is important in the face of the continued global rise of&amp;nbsp;antibiotic resistance.&lt;/div&gt;&lt;div&gt;&lt;br /&gt;&lt;/div&gt;&lt;div class=&quot;separator&quot; style=&quot;clear: both; text-align: center;&quot;&gt;&lt;a href=&quot;https://www.microbiologyresearch.org/content/journal/mgen/10.1099/mgen.0.000700&quot; style=&quot;margin-left: 1em; margin-right: 1em;&quot;&gt;&lt;img border=&quot;0&quot; data-original-height=&quot;1983&quot; data-original-width=&quot;2048&quot; height=&quot;310&quot; src=&quot;https://blogger.googleusercontent.com/img/a/AVvXsEizC2MAVlUUS0AQ-TgcBncOFVncRkgXiB9XfnBD7tji0KVPKZ_L1AOMgWLbmrT-Z9Te5Di6bmeNxjZzx3O_IDroiXyu9F_BjC09O0H9QoBLa3XONhIlQqqPBdrTqSRIPmFnS9msIji5x5fmEFDlljrhzz6DcLHFaVWXaB44getCLlnVjttwtw=s320&quot; width=&quot;320&quot; /&gt;&lt;/a&gt;&lt;/div&gt;&lt;br /&gt;&lt;div&gt;We were also able to shed light on a controversy as to whether different strains of &lt;i&gt;Staph. aureus&lt;/i&gt;&amp;nbsp;differ in their propensity to cause severe disease. Interest in this question dates back decades in the literature, and contradictory studies, often based on modest sample sizes, have reached different conclusions. Our comparatively large study, using a whole-genome method that we previously published in &lt;i&gt;&lt;a href=&quot;https://pubmed.ncbi.nlm.nih.gov/27572646/&quot;&gt;Nature Microbiology&lt;/a&gt;&lt;/i&gt;, found that all strains of&amp;nbsp;&lt;i&gt;Staph. aureus&lt;/i&gt;&amp;nbsp;are equally likely to cause severe disease &lt;i&gt;vs&lt;/i&gt;&amp;nbsp;asymptomatic carriage.&lt;/div&gt;&lt;p&gt;&lt;br /&gt;&lt;/p&gt;&lt;p&gt;&lt;br /&gt;&lt;/p&gt;&lt;p&gt;&lt;br /&gt;&lt;/p&gt;</description><link>http://blog.danielwilson.me.uk/2021/12/new-paper-antimicrobial-resistance.html</link><author>noreply@blogger.com (Daniel Wilson)</author><media:thumbnail xmlns:media="http://search.yahoo.com/mrss/" url="https://blogger.googleusercontent.com/img/a/AVvXsEizC2MAVlUUS0AQ-TgcBncOFVncRkgXiB9XfnBD7tji0KVPKZ_L1AOMgWLbmrT-Z9Te5Di6bmeNxjZzx3O_IDroiXyu9F_BjC09O0H9QoBLa3XONhIlQqqPBdrTqSRIPmFnS9msIji5x5fmEFDlljrhzz6DcLHFaVWXaB44getCLlnVjttwtw=s72-c" height="72" width="72"/><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-7172144444987765708</guid><pubDate>Tue, 07 Dec 2021 11:19:00 +0000</pubDate><atom:updated>2021-12-07T06:14:30.175-06:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">Christoph Tang</category><category domain="http://www.blogger.com/atom/ns#">GWAS</category><category domain="http://www.blogger.com/atom/ns#">Martin Maiden</category><category domain="http://www.blogger.com/atom/ns#">Neisseria meningitidis</category><category domain="http://www.blogger.com/atom/ns#">PLoS Pathogens</category><category domain="http://www.blogger.com/atom/ns#">Sarah Earle</category><category domain="http://www.blogger.com/atom/ns#">Virulogenomics</category><title>New paper: Genome-wide association studies reveal the role of polymorphisms affecting factor H binding protein expression in host invasion by Neisseria meningitidis</title><description>&lt;p&gt;In this paper, published in October in &lt;i&gt;&lt;a href=&quot;https://journals.plos.org/plospathogens/article?id=10.1371/journal.ppat.1009992&quot;&gt;PLOS Pathogens&lt;/a&gt;&lt;/i&gt;, we discovered a novel genetic association between life-threatening invasive &lt;a href=&quot;https://en.wikipedia.org/wiki/Meningococcal_disease&quot;&gt;meningococcal disease&lt;/a&gt; (IMD) and bacterial genetic variation in factor H binding protein (fHbp) through two bacterial genome-wide association studies (&lt;a href=&quot;https://en.wikipedia.org/wiki/Genome-wide_association_study&quot;&gt;GWAS&lt;/a&gt;), which we validated experimentally. This was a collaboration with the groups of&amp;nbsp;&lt;a href=&quot;https://www.path.ox.ac.uk/content/christoph-tang&quot;&gt;Chris Tang&lt;/a&gt;&amp;nbsp;and&amp;nbsp;&lt;a href=&quot;https://www.zoo.ox.ac.uk/people/professor-martin-maiden?filter_types-1889262[]=&amp;amp;filter_series-1889262[]=&quot;&gt;Martin Maiden&lt;/a&gt;, with the work in my group led by &lt;a href=&quot;https://www.researchgate.net/profile/Sarah-Earle-2&quot;&gt;Sarah Earle&lt;/a&gt;.&lt;/p&gt;&lt;p&gt;fHbp is an important component of meningococcal vaccines that directly interacts with human complement factor H (CFH). Intriguingly, our discovery that bacterial genetic variation in fHbp associates with increased virulence mirrors an earlier discovery that human genetic variation in CFH associates with increased susceptibility to IMD (&lt;a href=&quot;https://pubmed.ncbi.nlm.nih.gov/20694013/&quot;&gt;&lt;i&gt;Nature Genetics&lt;/i&gt; 42: 772&lt;/a&gt;).&lt;/p&gt;&lt;p&gt;Our experiments showed that the fHbp risk allele increased expression. Interestingly, increased susceptibility to IMD has been previously associated with elevated CFH expression. Therefore over-expression of either fHbp by the bacterium or CFH by the host appears to increase the risk of IMD. Since complement evasion is necessary for pathogenesis, these insights offer new leads for improving treatment.&lt;/p&gt;&lt;p&gt;Key results from the paper:&lt;/p&gt;&lt;p&gt;&lt;/p&gt;&lt;ul style=&quot;text-align: left;&quot;&gt;&lt;li&gt;A GWAS for IMD in 261 meningococci from the Czech Republic highlighted a highly polygenic architecture of meningococcal virulence (see Figure), including capsule biosynthesis genes, the meningococcal disease association island and the new signal near the &lt;i&gt;fba&lt;/i&gt;&amp;nbsp;and&amp;nbsp;&lt;i&gt;fHbp&lt;/i&gt; genes.&lt;/li&gt;&lt;li&gt;A replication GWAS for IMD in 1295 meningococcal genomes belonging to strain ST41/44 downloaded from &lt;a href=&quot;http://pubMLST.org&quot;&gt;pubMLST.org&lt;/a&gt; validated the novel signal of association near &lt;i&gt;fba&lt;/i&gt; and &lt;i&gt;fHbp&lt;/i&gt;.&lt;/li&gt;&lt;li&gt;SHAPE reactivity analyses revealed that IMD-associated variation in the regulatory region of &lt;i&gt;fHbp&lt;/i&gt; disrupted the ability of the cell machinery to commence gene expression.&lt;/li&gt;&lt;li&gt;Flow cytometry assays of newly constructed genetically engineered strains, in different temperatures and in the presence and absence of human serum, attributed changes in gene expression to a non-synonymous candidate mutation in the &lt;i&gt;fHbp&lt;/i&gt; gene.&lt;/li&gt;&lt;/ul&gt;&lt;p&gt;&lt;/p&gt;&lt;p&gt;In this study, our GWAS relied exclusively on publicly available genome sequences and metadata, highlighting the untapped potential of large-scale open source databases like &lt;a href=&quot;http://pubMLST.org&quot;&gt;pubMLST.org&lt;/a&gt;, and the value of big data for improving our understanding of disease.&lt;/p&gt;&lt;div class=&quot;separator&quot; style=&quot;clear: both; text-align: center;&quot;&gt;&lt;a href=&quot;https://journals.plos.org/plospathogens/article?id=10.1371/journal.ppat.1009992&quot; style=&quot;margin-left: 1em; margin-right: 1em;&quot;&gt;&lt;img border=&quot;0&quot; data-original-height=&quot;1511&quot; data-original-width=&quot;2048&quot; height=&quot;472&quot; src=&quot;https://blogger.googleusercontent.com/img/a/AVvXsEjQN_5reKJtPGPOjmK8_dkorLf6gGsY0987whsubI4r1T42S8TrGx7PodzHmNfdbXOZIPGNtk9JdHcjH6ESmb0YCbTKFHF6WgqEG4aSs7HdgpyFucbqUYBBH8tpHMDy_ZvkoyA7fbflSsmgAP80_kohACJUHaDDYX-vSgvbYIjpYxXV4OWxyw=w640-h472&quot; width=&quot;640&quot; /&gt;&lt;/a&gt;&lt;/div&gt;&lt;br /&gt;&lt;div&gt;&lt;br /&gt;&lt;/div&gt;</description><link>http://blog.danielwilson.me.uk/2021/12/new-paper-genome-wide-association.html</link><author>noreply@blogger.com (Daniel Wilson)</author><media:thumbnail xmlns:media="http://search.yahoo.com/mrss/" url="https://blogger.googleusercontent.com/img/a/AVvXsEjQN_5reKJtPGPOjmK8_dkorLf6gGsY0987whsubI4r1T42S8TrGx7PodzHmNfdbXOZIPGNtk9JdHcjH6ESmb0YCbTKFHF6WgqEG4aSs7HdgpyFucbqUYBBH8tpHMDy_ZvkoyA7fbflSsmgAP80_kohACJUHaDDYX-vSgvbYIjpYxXV4OWxyw=s72-w640-h472-c" height="72" width="72"/><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-4488636967422177624</guid><pubDate>Tue, 13 Apr 2021 09:19:00 +0000</pubDate><atom:updated>2021-04-13T04:19:30.552-05:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">Big Data Institute</category><category domain="http://www.blogger.com/atom/ns#">Data Science</category><category domain="http://www.blogger.com/atom/ns#">Harmonic mean p-value</category><category domain="http://www.blogger.com/atom/ns#">Postdoc</category><category domain="http://www.blogger.com/atom/ns#">Public Health England</category><category domain="http://www.blogger.com/atom/ns#">Recruitment</category><title>New positions: Data Scientist in Public Health Epidemiology and Postdoc in Statistical Methods</title><description>&lt;p&gt;I am looking to fill two positions at the&amp;nbsp;&lt;a href=&quot;https://www.bdi.ox.ac.uk&quot;&gt;Big Data Institute&lt;/a&gt;,&amp;nbsp;&lt;a href=&quot;https://www.ndph.ox.ac.uk&quot;&gt;Nuffield Department of Population Health&lt;/a&gt;,&amp;nbsp;&lt;a href=&quot;http://www.ox.ac.uk&quot;&gt;University of Oxford&lt;/a&gt;:&amp;nbsp;a &lt;a href=&quot;https://my.corehr.com/pls/uoxrecruit/erq_jobspec_version_4.display_form?p_company=10&amp;amp;p_internal_external=E&amp;amp;p_display_in_irish=N&amp;amp;p_process_type=&amp;amp;p_applicant_no=&amp;amp;p_form_profile_detail=&amp;amp;p_display_apply_ind=Y&amp;amp;p_refresh_search=Y&amp;amp;p_recruitment_id=149906&quot;&gt;Data Scientist in Public Health Epidemiology&lt;/a&gt; and&amp;nbsp;a &lt;a href=&quot;https://my.corehr.com/pls/uoxrecruit/erq_jobspec_version_4.display_form?p_company=10&amp;amp;p_internal_external=E&amp;amp;p_display_in_irish=N&amp;amp;p_process_type=&amp;amp;p_applicant_no=&amp;amp;p_form_profile_detail=&amp;amp;p_display_apply_ind=Y&amp;amp;p_refresh_search=Y&amp;amp;p_recruitment_id=149868&quot;&gt;Postdoctoral Researcher in Statistical Methods&lt;/a&gt;.&lt;/p&gt;&lt;p&gt;The Big Data Institute (BDI) is an interdisciplinary research centre that develops, evaluates and deploys efficient methods for acquiring and analysing biomedical data at scale and for exploiting the opportunities arising from such studies. The Nuffield Department of Population Health (NDPH), a key partner in the BDI, contains world-renowned population health research groups and is an excellent environment for multi-disciplinary teaching and research. &amp;nbsp;&lt;/p&gt;&lt;p&gt;The role of the&amp;nbsp;&lt;a href=&quot;https://my.corehr.com/pls/uoxrecruit/erq_jobspec_version_4.display_form?p_company=10&amp;amp;p_internal_external=E&amp;amp;p_display_in_irish=N&amp;amp;p_process_type=&amp;amp;p_applicant_no=&amp;amp;p_form_profile_detail=&amp;amp;p_display_apply_ind=Y&amp;amp;p_refresh_search=Y&amp;amp;p_recruitment_id=149906&quot;&gt;Data Scientist in Public Health Epidemiology&lt;/a&gt;&amp;nbsp;is to help pilot a project developing systems for continuous record linkage between a large &lt;a href=&quot;https://www.gov.uk/government/organisations/public-health-england&quot;&gt;Public Health England&lt;/a&gt; (PHE) data source and other population health records, with the aim of facilitating research into infectious diseases.&lt;/p&gt;&lt;p&gt;The post holder will manage and develop record linkage algorithms comparing records with relational databases containing health records via appropriate anonymization protocols, and manage and develop systems for identifying incoming records of interest, for near-real time updating of SQL databases, and for issuing email and SMS alerts in response to these events. The responsibilities will also include contributing to large-scale statistical studies using public health records to investigate disease epidemiology, and analysing and interpreting results, reviewing and refining working hypotheses, writing reports and presenting findings to colleagues.&lt;/p&gt;&lt;p&gt;To be considered, applicants will hold a degree in Computer Science, Data Science, Statistics, or another relevant subject with a strong quantitative component, or have equivalent experience. They will also need an understanding of relational database construction and SQL queries, experience coding in at least one common programming language (e.g. C#, Java, Python) and good interpersonal skills with the ability to work closely with others as part of a team, while taking personal responsibility for assigned tasks.&lt;/p&gt;&lt;p&gt;The role of the&amp;nbsp;&lt;a href=&quot;https://my.corehr.com/pls/uoxrecruit/erq_jobspec_version_4.display_form?p_company=10&amp;amp;p_internal_external=E&amp;amp;p_display_in_irish=N&amp;amp;p_process_type=&amp;amp;p_applicant_no=&amp;amp;p_form_profile_detail=&amp;amp;p_display_apply_ind=Y&amp;amp;p_refresh_search=Y&amp;amp;p_recruitment_id=149868&quot;&gt;Postdoctoral Researcher in Statistical Methods&lt;/a&gt;&amp;nbsp;is to develop statistical methods based on the &lt;a href=&quot;http://www.danielwilson.me.uk/abstracts/wilson_2019.html&quot;&gt;harmonic mean &lt;i&gt;p&lt;/i&gt;-value&lt;/a&gt; (HMP) approach. The HMP bridges classical and Bayesian approaches to model-averaged hypothesis testing, with applications to very large-scale data analysis problems in biomedical science.&lt;/p&gt;&lt;p&gt;The post holder will join a team with expertise in statistical inference, population genetics, genomics, evolution, epidemiology and infectious disease. The responsibilities will include developing statistical methods based on the HMP, undertaking research under the direction of the principal investigator, helping with supervision within the project as required, driving forward manuscripts for publication in collaboration with group members and disseminating results through other means such as academic conferences.&lt;/p&gt;&lt;p&gt;To be considered, applicants will hold, or be close to completion of, a PhD/DPhil involving statistical methods development and a track record of publication-quality methods development in statistical theory or methods development. The ability to work independently in pursuing the goals of an agreed research plan and excellent interpersonal skills and the ability to work closely with others as a team are also essential.&lt;/p&gt;&lt;p&gt;&lt;b&gt;The closing date for both positions is noon on the 5th May 2021&lt;/b&gt;. Only applications received through the online system will be considered:&lt;/p&gt;&lt;p&gt;&lt;/p&gt;&lt;ul style=&quot;text-align: left;&quot;&gt;&lt;li&gt;Click here to apply for the&amp;nbsp;&lt;a href=&quot;https://my.corehr.com/pls/uoxrecruit/erq_jobspec_version_4.display_form?p_company=10&amp;amp;p_internal_external=E&amp;amp;p_display_in_irish=N&amp;amp;p_process_type=&amp;amp;p_applicant_no=&amp;amp;p_form_profile_detail=&amp;amp;p_display_apply_ind=Y&amp;amp;p_refresh_search=Y&amp;amp;p_recruitment_id=149906&quot;&gt;Data Scientist in Public Health Epidemiology&lt;/a&gt;&amp;nbsp;position&lt;/li&gt;&lt;li&gt;Click here to apply for the&amp;nbsp;&lt;a href=&quot;https://my.corehr.com/pls/uoxrecruit/erq_jobspec_version_4.display_form?p_company=10&amp;amp;p_internal_external=E&amp;amp;p_display_in_irish=N&amp;amp;p_process_type=&amp;amp;p_applicant_no=&amp;amp;p_form_profile_detail=&amp;amp;p_display_apply_ind=Y&amp;amp;p_refresh_search=Y&amp;amp;p_recruitment_id=149868&quot;&gt;Postdoctoral Researcher in Statistical Methods&lt;/a&gt;&amp;nbsp;position&lt;/li&gt;&lt;/ul&gt;&lt;p&gt;&lt;/p&gt;</description><link>http://blog.danielwilson.me.uk/2021/04/new-positions-data-scientist-in-public.html</link><author>noreply@blogger.com (Daniel Wilson)</author><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-6572981457781929413</guid><pubDate>Tue, 13 Apr 2021 09:06:00 +0000</pubDate><atom:updated>2021-04-13T04:06:49.920-05:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">COVID-19</category><category domain="http://www.blogger.com/atom/ns#">COVID-19 Host Genetics Initiative</category><category domain="http://www.blogger.com/atom/ns#">Presentations</category><title>Presentation: Genome-wide association studies of COVID-19</title><description>&lt;p&gt;An updated version of this talk given at the Nuffield Department for Population Health&#39;s annual symposium 2021:&lt;/p&gt;
&lt;iframe allow=&quot;accelerometer; autoplay; clipboard-write; encrypted-media; gyroscope; picture-in-picture&quot; allowfullscreen=&quot;&quot; frameborder=&quot;0&quot; height=&quot;315&quot; src=&quot;https://www.youtube.com/embed/DCqrz1nZZAM&quot; title=&quot;YouTube video player&quot; width=&quot;560&quot;&gt;&lt;/iframe&gt;
</description><link>http://blog.danielwilson.me.uk/2021/04/presentation-genome-wide-association.html</link><author>noreply@blogger.com (Daniel Wilson)</author><media:thumbnail xmlns:media="http://search.yahoo.com/mrss/" url="https://img.youtube.com/vi/DCqrz1nZZAM/default.jpg" height="72" width="72"/><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-6382574023546435359</guid><pubDate>Mon, 07 Sep 2020 09:47:00 +0000</pubDate><atom:updated>2020-09-07T04:47:51.111-05:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">Genomics</category><category domain="http://www.blogger.com/atom/ns#">Postdoc</category><category domain="http://www.blogger.com/atom/ns#">Recruitment</category><category domain="http://www.blogger.com/atom/ns#">Statistics</category><title>Postdoc position available in Statistical Genomics</title><description>&lt;p&gt;I am seeking someone with a track record in methods development for Statistical Genomics and an interest in Infectious Disease to join the group. The aim of the post is to conduct innovative research within the group&#39;s range of interests and to make use of the opportunities afforded by our outstanding collaborators. I would welcome candidates who wish to use the opportunity as a stepping stone to independent funding.&lt;/p&gt;&lt;p&gt;The postdoc will join a team with expertise in microbiology, genomics, evolution, population genetics and statistical inference. Responsibilities will include planning a research project and milestones with help and guidance from the group, preparing manuscripts for publication, keeping records of results and methods and tracking milestones, and disseminating results, including through academic conferences.&lt;/p&gt;&lt;p&gt;We will consider applicants who hold, or are close to completion of, a PhD/DPhil involving statistical methods development, and who have experience of large-scale statistical data analysis, evidence of originating and executing independent academic research ideas, excellent interpersonal skills and the ability to work closely with others in a team.&lt;/p&gt;&lt;p&gt;The position is advertised to 31 December 2021. The application deadline is noon on Thursday 1st October 2020. &lt;a href=&quot;https://my.corehr.com/pls/uoxrecruit/erq_jobspec_details_form.jobspec?p_id=147494&quot;&gt;Visit the University recruitment page to apply&lt;/a&gt;.&lt;/p&gt;</description><link>http://blog.danielwilson.me.uk/2020/09/postdoc-position-available-in.html</link><author>noreply@blogger.com (Daniel Wilson)</author><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-2596218484259200329</guid><pubDate>Fri, 21 Aug 2020 17:38:00 +0000</pubDate><atom:updated>2020-08-21T12:38:10.861-05:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">COVID-19</category><category domain="http://www.blogger.com/atom/ns#">Presentations</category><category domain="http://www.blogger.com/atom/ns#">UK Biobank</category><title>Presentation: Genome-wide Association Studies of COVID-19</title><description>&lt;p&gt;An online recording of the talk about Genome-wide Association Studies of COVID-19 at the UK Biobank 2020 meeting on 23 June 2020. The &lt;a href=&quot;https://gateway.on24.com/wcc/eh/2386491/Scientific+Conference+2020&quot;&gt;full conference&lt;/a&gt; is also online.&lt;/p&gt;&lt;div class=&quot;separator&quot; style=&quot;clear: both; text-align: center;&quot;&gt;&lt;iframe allowfullscreen=&quot;&quot; class=&quot;BLOG_video_class&quot; height=&quot;480&quot; src=&quot;https://www.youtube.com/embed/d7khyysm-As&quot; width=&quot;640&quot; youtube-src-id=&quot;d7khyysm-As&quot;&gt;&lt;/iframe&gt;&lt;/div&gt;&lt;p&gt;&lt;br /&gt;&lt;/p&gt;</description><link>http://blog.danielwilson.me.uk/2020/08/presentation-genome-wide-association.html</link><author>noreply@blogger.com (Daniel Wilson)</author><media:thumbnail xmlns:media="http://search.yahoo.com/mrss/" url="https://img.youtube.com/vi/d7khyysm-As/default.jpg" height="72" width="72"/><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-590332985273532077</guid><pubDate>Fri, 21 Aug 2020 17:30:00 +0000</pubDate><atom:updated>2020-08-21T12:33:10.315-05:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">COVID-19</category><category domain="http://www.blogger.com/atom/ns#">COVID-19 Host Genetics Initiative</category><category domain="http://www.blogger.com/atom/ns#">Epidemiology</category><category domain="http://www.blogger.com/atom/ns#">GWAS</category><category domain="http://www.blogger.com/atom/ns#">Machine learning</category><category domain="http://www.blogger.com/atom/ns#">Microbial Genomics</category><category domain="http://www.blogger.com/atom/ns#">New England Journal of Medicine</category><category domain="http://www.blogger.com/atom/ns#">Public Health England</category><category domain="http://www.blogger.com/atom/ns#">Statistics</category><category domain="http://www.blogger.com/atom/ns#">UK Biobank</category><category domain="http://www.blogger.com/atom/ns#">Wellcome Open Research</category><title>The group&#39;s research response to COVID-19</title><description>&lt;p&gt;&lt;span style=&quot;font-family: inherit;&quot;&gt;This is an update on the group&#39;s research response to the COVID-19 pandemic. As an infectious disease group we have been keen to contribute to the international research effort where we could be useful, while recognising the need to continue our research on other important infections where possible.&lt;/span&gt;&lt;/p&gt;&lt;ul&gt;&lt;li style=&quot;margin-left: 15px;&quot;&gt;&lt;span&gt;&lt;b style=&quot;caret-color: rgb(34, 34, 34); color: #222222; font-family: inherit;&quot;&gt;Bugbank&lt;/b&gt;&lt;span style=&quot;color: #222222; font-family: inherit;&quot;&gt;&lt;span style=&quot;caret-color: rgb(34, 34, 34);&quot;&gt;. Thanks to a pre-existing collaboration between our group, &lt;a href=&quot;https://www.gov.uk/government/organisations/public-health-england&quot;&gt;Public Health England&lt;/a&gt; and &lt;a href=&quot;https://www.ukbiobank.ac.uk&quot;&gt;UK Biobank&lt;/a&gt;, we were in a position to help rapidly facilitate COVID-19 research via SARS-CoV-2 PCR-based swab test results. Beginning mid-March, we worked to provide regular (usually weekly) updates of tests results, which were made available to all UK Biobank researchers beginning April 17th. This is &lt;a href=&quot;http://www.bbc.co.uk/news/health-52243605&quot;&gt;one of several resources&lt;/a&gt; &lt;/span&gt;&lt;/span&gt;&lt;span style=&quot;color: #222222; font-family: inherit;&quot;&gt;&lt;span style=&quot;caret-color: rgb(34, 34, 34);&quot;&gt;on COVID-19 linked to UK Biobank. Beginning in May we provided feeds to other cohorts:&amp;nbsp;&lt;/span&gt;&lt;/span&gt;&lt;span style=&quot;color: #222222;&quot;&gt;&lt;span style=&quot;caret-color: rgb(34, 34, 34);&quot;&gt;&lt;a href=&quot;www.donor- health-btru.nihr.ac.uk&quot;&gt;INTERVAL&lt;/a&gt;, &lt;a href=&quot;www.donor- health-btru.nihr.ac.uk&quot;&gt;COMPARE&lt;/a&gt;, &lt;a href=&quot;www.genesand- health.org&quot;&gt;Genes &amp;amp; Health&lt;/a&gt; and the &lt;a href=&quot;bioresource.nihr. ac.uk&quot;&gt;NIHR BioResource&lt;/a&gt;.&lt;/span&gt;&lt;/span&gt;&lt;span style=&quot;color: #222222; font-family: inherit;&quot;&gt;&lt;span style=&quot;caret-color: rgb(34, 34, 34);&quot;&gt;&amp;nbsp;We provide updates on this work through the project website&amp;nbsp;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;a data-saferedirecturl=&quot;https://www.google.com/url?q=http://www.bugbank.uk&amp;amp;source=gmail&amp;amp;ust=1598109203600000&amp;amp;usg=AFQjCNFfq0x-WO3D3nhydDMBgRVeW5wigA&quot; href=&quot;http://www.bugbank.uk/&quot; style=&quot;caret-color: rgb(34, 34, 34); color: #1155cc; font-family: inherit;&quot; target=&quot;_blank&quot;&gt;www.bugbank.uk&lt;/a&gt;&lt;span style=&quot;caret-color: rgb(34, 34, 34); color: #222222; font-family: inherit;&quot;&gt;. We have published a paper describing the dynamic data linkage in &lt;a href=&quot;https://www.microbiologyresearch.org/content/journal/mgen/10.1099/mgen.0.000397&quot; style=&quot;font-style: italic;&quot;&gt;Microbial Genomics&lt;/a&gt;&amp;nbsp;(&lt;a href=&quot;https://microbiologysociety.org/news/press-releases/repurposing-public-health-systems-to-decode-covid-19.html&quot;&gt;press release&lt;/a&gt;).&lt;/span&gt;&lt;span style=&quot;caret-color: rgb(34, 34, 34); color: #222222; font-family: inherit;&quot;&gt;&amp;nbsp;Key collaborators in this project are &lt;a href=&quot;https://www.bdi.ox.ac.uk/Team/jacob-armstrong&quot;&gt;Jacob Armstrong&lt;/a&gt;&amp;nbsp;(Big Data Institute)&amp;nbsp;&lt;a href=&quot;https://www.ndph.ox.ac.uk/team/naomi-allen&quot;&gt;Naomi Allen&lt;/a&gt;&amp;nbsp;(UK Biobank) and&amp;nbsp;&lt;a href=&quot;https://www.ndm.ox.ac.uk/principal-investigators/researcher/david-wyllie&quot;&gt;David Wyllie&lt;/a&gt; and Anne Marie O&#39;Connell (Public Health England).&lt;/span&gt;&lt;/li&gt;&lt;/ul&gt;&lt;div&gt;&lt;span style=&quot;color: #222222;&quot;&gt;&lt;span style=&quot;caret-color: rgb(34, 34, 34);&quot;&gt;&lt;br /&gt;&lt;/span&gt;&lt;/span&gt;&lt;/div&gt;&lt;ul style=&quot;caret-color: rgb(34, 34, 34); color: #222222;&quot;&gt;&lt;li style=&quot;margin-left: 15px;&quot;&gt;&lt;span style=&quot;font-family: inherit;&quot;&gt;&lt;b&gt;COVID-19 Host Genetics Initiative&lt;/b&gt;. Along with groups at &lt;a href=&quot;https://www.mcgill.ca/genepi/&quot;&gt;McGill&lt;/a&gt; and the&amp;nbsp;&lt;a href=&quot;https://www.broadinstitute.org/bios/benjamin-neale&quot;&gt;Broad Institute&lt;/a&gt;, I have contributed analyses of UK Biobank&lt;/span&gt;&lt;span style=&quot;font-family: inherit;&quot;&gt;&amp;nbsp;to investigate genetic risk factors for COVID-19. The &lt;a href=&quot;https://www.nature.com/articles/s41431-020-0636-6&quot;&gt;Host Genetics Initiative&lt;/a&gt; is drawing on more than 200 cohorts from around the world to conduct&amp;nbsp;&lt;/span&gt;&lt;span style=&quot;font-family: inherit;&quot;&gt;meta-analysis to tackle questions such as &lt;a href=&quot;https://www.washingtonpost.com/opinions/2020/04/27/covid-19-quickly-kills-some-while-others-dont-show-symptoms-can-genetics-explain-this/&quot;&gt;why some people suffer severe COVID-19&lt;/a&gt; while others get mild or asymptomatic infection (&lt;a href=&quot;https://www.ft.com/content/50006fa2-f99c-4da8-b817-abb2379565ce&quot;&gt;media coverage&lt;/a&gt;). The meta-analysis results are &lt;a href=&quot;https://www.covid19hg.org/results/&quot;&gt;publicly released&lt;/a&gt; periodically. This led to the independent replication of a genetic risk factor on chromosome 3 discovered by a Spanish-Italian cohort and published in the &lt;i&gt;&lt;a href=&quot;https://www.nejm.org/doi/full/10.1056/NEJMoa2020283&quot;&gt;New England Journal of Medicine&lt;/a&gt;&lt;/i&gt;.&lt;/span&gt;&lt;/li&gt;&lt;/ul&gt;&lt;div&gt;&lt;span style=&quot;color: #222222;&quot;&gt;&lt;span style=&quot;caret-color: rgb(34, 34, 34);&quot;&gt;&lt;br /&gt;&lt;/span&gt;&lt;/span&gt;&lt;/div&gt;&lt;ul style=&quot;caret-color: rgb(34, 34, 34); color: #222222;&quot;&gt;&lt;li style=&quot;margin-left: 15px;&quot;&gt;&lt;b&gt;Epidemiological risk factors for COVID-19&lt;/b&gt;. Graduate&amp;nbsp;student &lt;a href=&quot;https://www.bdi.ox.ac.uk/Team/nicolas-arning&quot;&gt;Nicolas Arning&lt;/a&gt; and I are developing an approach to quantify the effects of lifestyle and medical risk factors for COVID-19 in the UK Biobank that accounts for inherent uncertainty in which risk factors to consider. The new method employs the &lt;a href=&quot;https://www.pnas.org/content/116/4/1195&quot;&gt;harmonic mean &lt;i&gt;p&lt;/i&gt;-value&lt;/a&gt;, a model-averaging approach for big data that we published&amp;nbsp;previously. We are in the process of evaluating the performance of the approach, comparing it to machine learning, and interpreting the results.&lt;/li&gt;&lt;/ul&gt;&lt;div&gt;&lt;span style=&quot;color: #222222;&quot;&gt;&lt;span style=&quot;caret-color: rgb(34, 34, 34);&quot;&gt;&lt;br /&gt;&lt;/span&gt;&lt;/span&gt;&lt;/div&gt;&lt;ul style=&quot;caret-color: rgb(34, 34, 34); color: #222222;&quot;&gt;&lt;li style=&quot;margin-left: 15px;&quot;&gt;&lt;span style=&quot;font-family: inherit;&quot;&gt;&lt;b&gt;Antibody testing for the UK Government&lt;/b&gt;. Postdoc &lt;a href=&quot;https://oxford.academia.edu/JustineRudkin&quot;&gt;Justine Rudkin&lt;/a&gt; has been working in the lab with &lt;a href=&quot;https://www.ndm.ox.ac.uk/principal-investigators/researcher/derrick-crook&quot;&gt;Derrick Crook&lt;/a&gt;, &lt;a href=&quot;https://www.medsci.ox.ac.uk/divisional-services/staff/regius&quot;&gt;Sir John Bell&lt;/a&gt; and others to measure the efficacy of antibody tests for the UK Government. They have tested many hundreds of kits to establish the sensitivity and specificity of the tests to help evaluate the utility of a national testing programme. This work was crucial in demonstrating the &lt;a href=&quot;https://www.theguardian.com/world/2020/apr/09/uk-government-urged-to-abandon-poor-finger-prick-antibody-tests-coronavirus&quot;&gt;limitations&lt;/a&gt; of early blood-spot based tests, and the credibility of subsequent generations of antibody tests. The work has been published in &lt;a href=&quot;https://wellcomeopenresearch.org/articles/5-139&quot;&gt;&lt;i&gt;Wellcome Open Research&lt;/i&gt;&lt;/a&gt;.&lt;/span&gt;&lt;/li&gt;&lt;/ul&gt;&lt;div&gt;&lt;span style=&quot;color: #222222;&quot;&gt;&lt;span style=&quot;caret-color: rgb(34, 34, 34);&quot;&gt;&lt;br /&gt;&lt;/span&gt;&lt;/span&gt;&lt;/div&gt;&lt;ul style=&quot;caret-color: rgb(34, 34, 34); color: #222222;&quot;&gt;&lt;li style=&quot;margin-left: 15px;&quot;&gt;&lt;span style=&quot;font-family: inherit;&quot;&gt;&lt;b&gt;Office of National Statistics Antibody Survey&lt;/b&gt;. Justine has also been working in the lab with &lt;a href=&quot;https://www.ndm.ox.ac.uk/team/ann-sarah-walker&quot;&gt;Sarah Walker&lt;/a&gt; to set up robots for her large &lt;a href=&quot;https://www.express.co.uk/news/uk/1274486/coronavirus-test-uk-expert-warning-covid-19-update-boris-johnson&quot;&gt;antibody testing cohort study&lt;/a&gt;. Sarah is leading an infection survey with the &lt;a href=&quot;https://www.ons.gov.uk/peoplepopulationandcommunity/healthandsocialcare/conditionsanddiseases/bulletins/coronaviruscovid19infectionsurveypilot/englandandwales21august2020&quot;&gt;Office of National Statistics&lt;/a&gt; to investigate exposure to SARS-CoV-2 in England and Wales.&lt;/span&gt;&lt;/li&gt;&lt;/ul&gt;&lt;div&gt;&lt;span style=&quot;color: #222222;&quot;&gt;&lt;span style=&quot;caret-color: rgb(34, 34, 34);&quot;&gt;&lt;br /&gt;&lt;/span&gt;&lt;/span&gt;&lt;/div&gt;&lt;div&gt;&lt;span style=&quot;caret-color: rgb(34, 34, 34); color: #222222;&quot;&gt;Work on other infections that has continued during the lockdown. Postdoc &lt;a href=&quot;https://twitter.com/sgearle?lang=en&quot;&gt;Sarah Earle&lt;/a&gt; continues research into pathogen genetic risk factors for diseases including tuberculosis and meningococcal meningitis, while &lt;a href=&quot;https://www.well.ox.ac.uk/current-students/shang-kuan-lin&quot;&gt;Steven Lin&lt;/a&gt; has continued to pursue work on hepatitis C virus genetics and epidemiology. Many of our close collaborators are infection doctors and they have of course been recalled to clinical duties. Laboratory work in the group has been severely disrupted, particularly several of Justine&#39;s &lt;i&gt;Staphylococcus aureus&lt;/i&gt;&amp;nbsp;projects. We are keen to pick up on those projects where we left off when the chance arrives.&lt;/span&gt;&lt;/div&gt;</description><link>http://blog.danielwilson.me.uk/2020/08/the-groups-research-response-to-covid-19.html</link><author>noreply@blogger.com (Daniel Wilson)</author><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-1254851838825467009</guid><pubDate>Fri, 21 Aug 2020 17:21:00 +0000</pubDate><atom:updated>2020-08-21T12:21:26.426-05:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">COVID-19</category><category domain="http://www.blogger.com/atom/ns#">Epidemiology</category><category domain="http://www.blogger.com/atom/ns#">lockdown</category><category domain="http://www.blogger.com/atom/ns#">Phylogenetics</category><category domain="http://www.blogger.com/atom/ns#">Teaching</category><category domain="http://www.blogger.com/atom/ns#">Zika virus</category><title>Teaching: Online lectures and practical on Phylogenetics in Practice</title><description>&lt;p&gt;On March 16th, we were in the interesting position of running an infectious disease course at the Big Data Institute on the day the &lt;a href=&quot;https://www.gov.uk/government/speeches/pm-statement-on-coronavirus-16-march-2020&quot;&gt;national lockdown was announced&lt;/a&gt; in response to the COVID-19 pandemic. As a result, we were among the first in the university to do remote teaching, something &lt;a href=&quot;https://www.bdi.ox.ac.uk/Team/katrina-lythgoe&quot;&gt;Katrina Lythgoe&lt;/a&gt; and the rest of us had prepared for in anticipation of the lockdown a week earlier &lt;a href=&quot;https://www.theguardian.com/world/2020/jun/10/uk-coronavirus-lockdown-20000-lives-boris-johnson-neil-ferguson&quot;&gt;that never happened&lt;/a&gt;.&lt;/p&gt;&lt;p&gt;These are the two online lectures in the &lt;a href=&quot;https://www.ox.ac.uk/admissions/graduate/courses/health-data-science&quot;&gt;Health Data Sciences CDT&lt;/a&gt; that I gave called &lt;i&gt;Phylogenetics in Practice&lt;/i&gt;.&lt;/p&gt;&lt;div class=&quot;separator&quot; style=&quot;clear: both; text-align: center;&quot;&gt;&lt;iframe allowfullscreen=&quot;&quot; class=&quot;BLOG_video_class&quot; height=&quot;281&quot; src=&quot;https://www.youtube.com/embed/OHiYkeeKN2Y&quot; width=&quot;640&quot; youtube-src-id=&quot;OHiYkeeKN2Y&quot;&gt;&lt;/iframe&gt;&lt;/div&gt;&lt;div class=&quot;separator&quot; style=&quot;clear: both; text-align: center;&quot;&gt;&lt;br /&gt;&lt;/div&gt;&lt;div class=&quot;separator&quot; style=&quot;clear: both; text-align: center;&quot;&gt;&lt;iframe allowfullscreen=&quot;&quot; class=&quot;BLOG_video_class&quot; height=&quot;281&quot; src=&quot;https://www.youtube.com/embed/OjbXutZ1IC8&quot; width=&quot;640&quot; youtube-src-id=&quot;OjbXutZ1IC8&quot;&gt;&lt;/iframe&gt;&lt;/div&gt;&lt;p&gt;The online practical, which applies phylogenetics approaches to understand the Zika virus epidemic, is implemented as a &lt;a href=&quot;https://hub.docker.com/repository/docker/dannywilson/teaching-phylogenetics&quot;&gt;Docker container&lt;/a&gt;, and available &lt;a href=&quot;http://www.popgen101.com/2018/11/phylogenetics-i-zika-virus-outbreak.html&quot;&gt;here&lt;/a&gt;.&lt;/p&gt;</description><link>http://blog.danielwilson.me.uk/2020/08/teaching-online-lectures-and-practical.html</link><author>noreply@blogger.com (Daniel Wilson)</author><media:thumbnail xmlns:media="http://search.yahoo.com/mrss/" url="https://img.youtube.com/vi/OHiYkeeKN2Y/default.jpg" height="72" width="72"/><thr:total>0</thr:total></item><item><guid isPermaLink="false">tag:blogger.com,1999:blog-8099840.post-4125501348553039444</guid><pubDate>Fri, 21 Aug 2020 14:30:00 +0000</pubDate><atom:updated>2020-08-21T09:52:55.234-05:00</atom:updated><category domain="http://www.blogger.com/atom/ns#">COVID-19</category><category domain="http://www.blogger.com/atom/ns#">Presentations</category><category domain="http://www.blogger.com/atom/ns#">Public Health England</category><title>Presentation on identifying COVID-19 inpatients from Public Health England data</title><description>&lt;p&gt;This is a presentation I gave at the &lt;a href=&quot;https://www.covid19hg.org&quot;&gt;COVID-19 Host Genetics Initiative&lt;/a&gt; meeting on &lt;a href=&quot;https://www.covid19hg.org/blog/2020-07-02-july-2-2020-meeting/&quot;&gt;2nd July 2020&lt;/a&gt; about using Public Health England&#39;s Second Generation Surveillance System to identify COVID-19 inpatients among SARS-CoV-2 positive individuals in England.&lt;/p&gt;&lt;div class=&quot;separator&quot; style=&quot;clear: both; text-align: center;&quot;&gt;&lt;iframe allowfullscreen=&quot;&quot; class=&quot;BLOG_video_class&quot; height=&quot;346&quot; src=&quot;https://www.youtube.com/embed/BySQxUMZWRo&quot; width=&quot;640&quot; youtube-src-id=&quot;BySQxUMZWRo&quot;&gt;&lt;/iframe&gt;&lt;/div&gt;&lt;p&gt;For further information, please see this &lt;a href=&quot;https://news.bugbank.uk/2020/08/identifying-inpatients-comparison-to.html&quot;&gt;bugbank blog post&lt;/a&gt; comparing inpatients identified using SGSS and Hospital Episode Statistics.&lt;/p&gt;</description><link>http://blog.danielwilson.me.uk/2020/08/presentation-on-identifying-covid-19.html</link><author>noreply@blogger.com (Daniel Wilson)</author><media:thumbnail xmlns:media="http://search.yahoo.com/mrss/" url="https://img.youtube.com/vi/BySQxUMZWRo/default.jpg" height="72" width="72"/><thr:total>0</thr:total></item></channel></rss>