<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    <title>DataBytes Podcast</title>
    <description>Website for DataBytes podcast.</description>
    <link>https://databytespodcast.github.io/</link>
    <atom:link href="https://databytespodcast.github.io/sitemap.xml" rel="self" type="application/rss+xml"/>
    <pubDate>Thu, 23 Jan 2020 02:32:19 +0000</pubDate>
    <lastBuildDate>Thu, 23 Jan 2020 02:32:19 +0000</lastBuildDate>
    <generator>Jekyll v3.8.5</generator>
    
      <item>
        <title>Episode 49: Extreme Classification: Going at MACH Speed (Part 1)</title>
        <description>&lt;p&gt;In this episode, Dr. Derek Feng drops by to chat about a recent paper on a divide-and-conquer approach (Merged-Averaged Classifiers via Hashing) to massive classification problems. In part 1 (of 2 episodes), we describe the general problem solved by and strategy taken by MACH, wherein the original large classification problem is broken down into smaller-sized classification problems. Next week in the second episode, we talk about more technical details of how the division of labor works, and why it works.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/49-Extreme-Classification-Going-at-MACH-Speed-Part-1-ea7uiq&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h2 id=&quot;sources&quot;&gt;Sources&lt;/h2&gt;

&lt;ul&gt;
  &lt;li&gt;&lt;a href=&quot;https://arxiv.org/pdf/1910.13830.pdf&quot;&gt;NeurIPS 2019: MACH paper&lt;/a&gt;&lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 17 Jan 2020 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2020/01/17/mach1.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2020/01/17/mach1.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 48: Where Moneyball Meets Footy</title>
        <description>&lt;p&gt;We’ve long heard about the waves that statistics has made in baseball. But what about soccer? In this episode, we summarize a few applications of statistics in European football (or American soccer).&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/48-Where-Moneyball-Meets-Footy-e9h18p&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h2 id=&quot;sources&quot;&gt;Sources&lt;/h2&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://fivethirtyeight.com/features/down-at-halftime-in-a-soccer-game-use-your-subs/&quot;&gt;FiveThirtyEight.com: Down At Halftime In A Soccer Game? Use Your Subs.&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.espn.com/soccer/english-premier-league/23/blog/post/3733383/premier-league-teams-rarely-use-all-their-substitutes-why-dont-they-take-advantage-of-such-fresh-legs&quot;&gt;ESPN.com blog: Premier League teams rarely use all their substitutes. Why don’t they take advantage of such fresh legs?&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.nytimes.com/2019/05/22/magazine/soccer-data-liverpool.html&quot;&gt;NYT Magazine: How Data (and Some Breathtaking Soccer) Brought Liverpool to the Cusp of Glory&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;http://freakonomics.com/podcast/london-live/&quot;&gt;Freakonomics Podcast: Can Britain Get Its “Great” Back? (Ep. 393)&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.independent.co.uk/sport/football/transfers/takumi-minamino-liverpool-transfer-news-salzburg-melissa-reddy-latest-a9243881.html&quot;&gt;The Independent: Takumi Minamino: How RB Salzburg scouted the perfect Liverpool player&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 13 Dec 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/12/13/footy-moneyball.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/12/13/footy-moneyball.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 47: Domoic Acid Testing -- A Crabshoot?</title>
        <description>&lt;p&gt;Domoic acid has plagued shellfish and other wildlife along the Pacific coastline in recent years. Testing for domoic acid concentration in crabs on a regular basis has become important for determining when crabs and their viscera can be safely consumed. Unlike many other common hypothesis tests, the setup used for domoic acid testing is based on the sample maximum rather than the sample mean. In this episode, we critique the testing methodology.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/47-Domoic-Acid-Testing----A-Crabshoot-e991fc&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h2 id=&quot;sources&quot;&gt;Sources&lt;/h2&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://en.wikipedia.org/wiki/Domoic_acid&quot;&gt;Wikipedia.com: Domoic acid&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.sfchronicle.com/food/article/The-secret-Richmond-lab-where-Bay-Area-crab-14869631.php&quot;&gt;SF Chronicle: The secret Richmond lab where Bay Area crab season annually learns its fate&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.cdph.ca.gov/Programs/CEH/DFDCS/CDPH%20Document%20Library/FDB/FoodSafetyProgram/DomoicAcid/4.%20Crab%20DA%20Web%20Results%20July%201%202019%20to%20November%2020%202019.pdf&quot;&gt;California Department of Public Health: Domoic Acid Data for July-November 2019&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.kqed.org/news/10868506/acid-flashback-santa-cruz-bird-frenzy-hitchcock-and-a-biological-whodunit&quot;&gt;KQED News: Acid Flashback: Santa Cruz Bird Frenzy, Hitchcock and a Biological Whodunit&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Sat, 30 Nov 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/11/30/crabbing-domoic-acid.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/11/30/crabbing-domoic-acid.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 46: Finding Your (Niche) Board Games</title>
        <description>&lt;p&gt;In this episode, we discuss how two statisticians used data from BoardGameGeek.com to put together their own board game recommendation engine, specifically designed to stay away from mainstream recommendations.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/46-Finding-Your-Niche-Board-Games-e8smo8&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h2 id=&quot;sources&quot;&gt;Sources&lt;/h2&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://rss.onlinelibrary.wiley.com/doi/10.1111/j.1740-9713.2019.01317.x&quot;&gt;Significance.com article: Mining the BoardGameGeek&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://trythesegames.com&quot;&gt;TryTheseGames&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://en.wikipedia.org/wiki/Eurogame&quot;&gt;Eurogame Wikipedia Entry&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;

</description>
        <pubDate>Fri, 08 Nov 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/11/08/board-games.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/11/08/board-games.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 45: Learning Publicly, with Private Data</title>
        <description>&lt;p&gt;In this episode, Dr. Derek Feng discusses the general issue of data privacy in the age of big data, including topics of differential privacy and federated learning.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/45-Learning-Publicly--with-Private-Data-e8gfkg&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h2 id=&quot;sources&quot;&gt;Sources&lt;/h2&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://arxiv.org/pdf/cs/0610105.pdf&quot;&gt;Research article: Robust De-anonymization of Large Datasets&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://blog.cryptographyengineering.com/2016/06/15/what-is-differential-privacy/&quot;&gt;Blogpost: What is Differential Privacy&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.apple.com/privacy/docs/Differential_Privacy_Overview.pdf&quot;&gt;Apple.com: Differential Privacy Overview&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.wired.com/2016/06/apples-differential-privacy-collecting-data/&quot;&gt;Wired.com: Apple’s Differential Privacy is About Collecting Your Data&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://arxiv.org/pdf/1902.01046.pdf&quot;&gt;Research article: Towards Federated Learning At Scale: System Design&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://federated.withgoogle.com/&quot;&gt;Federated Learning with Google&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://medium.com/syncedreview/federated-learning-the-future-of-distributed-machine-learning-eec95242d897&quot;&gt;Medium.com: Federated Learning: The Future of Distributed Machine Learning&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://ai.googleblog.com/2017/04/federated-learning-collaborative.html&quot;&gt;Google AI Blog on Federated Learning&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://arxiv.org/pdf/1812.02903.pdf&quot;&gt;Research Article: Applied Federated Learning: Improving Google Keyboard Query Suggestions&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 01 Nov 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/11/01/data-privacy.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/11/01/data-privacy.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 44: A Conversation with Jon Krohn</title>
        <description>&lt;p&gt;We sit down with Dr. Jon Krohn to chat about his work as a Chief Data Scientist at untapt, his newly published bestseller “Deep Learning Illustrated”, and his teaching/research.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/44-A-Conversation-with-Jon-Krohn-e81bra&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h2 id=&quot;link&quot;&gt;Link&lt;/h2&gt;

&lt;ul&gt;
  &lt;li&gt;&lt;a href=&quot;https://www.deeplearningillustrated.com/&quot;&gt;Deep Learning Illustrated website&lt;/a&gt;&lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 25 Oct 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/10/25/jon-krohn.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/10/25/jon-krohn.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 43: To Google and Back</title>
        <description>&lt;p&gt;In this episode, Professor Albert Y. Kim of Smith College describes his post-PhD journey, which included a stint at Google Adwords before academic posts at Reed College, Middlebury College, Amherst College, and Smith College.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/43-To-Google-and-Back-e5ofvi&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

</description>
        <pubDate>Fri, 04 Oct 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/10/04/to-google-and-back.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/10/04/to-google-and-back.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 42: Black in the Box</title>
        <description>&lt;p&gt;Dr. Derek Feng joins us again to discuss the two metrics by which we align all statistical/machine learning methods – interpretability versus predictive ability. In a world where black box methods reign supreme, what does learning mean?&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/42-Black-in-the-Box-e5i2p8&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h2 id=&quot;sources&quot;&gt;Sources&lt;/h2&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://en.wikipedia.org/wiki/Cooperative_Observer_Program&quot;&gt;Wikipedia: Cooperative Observer Program&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://foldingathome.org/&quot;&gt;Folding @ Home&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://deepmind.com/blog/article/alphafold&quot;&gt;DeepMind.com: Alpha Fold&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://onezero.medium.com/machine-learning-might-render-the-human-quest-for-knowledge-pointless-5425f8b00a45&quot;&gt;Medium.com: Machine Learning Widens the Gap Between Knowledge and Understanding&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 27 Sep 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/09/27/black-box.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/09/27/black-box.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 41: What to do with Outliers</title>
        <description>&lt;p&gt;Guest Dylan O’Connell joins us today to talk about a recent surprising, but legitimate Democratic primary poll result done by Monmouth University. We discuss different perspectives on how to approach a data point that doesn’t fit in with the others.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/41-What-to-do-with-Outliers-e5dk9k&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h2 id=&quot;sources&quot;&gt;Sources&lt;/h2&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.monmouth.edu/polling-institute/documents/monmouthpoll_us_082619.pdf/&quot;&gt;Monmouth University Poll&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.realclearpolitics.com/epolls/2020/president/us/2020_democratic_presidential_nomination-6730.html&quot;&gt;RealClearPolitics&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://twitter.com/johnanzo/status/1166729666268454912?s=21&quot;&gt;Anzalone tweet #1&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://twitter.com/johnanzo/status/1166171181931589632&quot;&gt;Anzalone tweet #2&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://twitter.com/MonmouthPoll/status/1166720853477924870&quot;&gt;Monmouth University Statement&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://projects.fivethirtyeight.com/pollster-ratings/&quot;&gt;FiveThirtyEight.com Pollster Ratings&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://twitter.com/NateSilver538/status/1166780637149388803&quot;&gt;Nate Silver’s tweet on the poll&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.math.upenn.edu/~deturck/m170/wk4/lecture/case2.html&quot;&gt;1948 Presidential Election polling&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 20 Sep 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/09/20/outliers-polling.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/09/20/outliers-polling.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 40: Making a DIY ML-Controlled Cat Door</title>
        <description>&lt;p&gt;Outdoor-cat owners know all too well the unpleasantries of dealing with what the cat dragged in. A self-proclaimed machine learning novice proves that you don’t need to be a pro to set up a smart cat door that prevents the cat from bringing prey into your home.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/40-Making-a-DIY-ML-Controlled-Cat-Door-e4toho&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h2 id=&quot;sources&quot;&gt;Sources&lt;/h2&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.bbc.com/news/technology-48825761&quot;&gt;bbc.com article: Cat flap uses AI to punish pet’s killer instincts&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.theverge.com/tldr/2019/6/30/19102430/amazon-engineer-ai-powered-catflap-prey-ben-hamm&quot;&gt;The Verge: An Amazon employee made an AI-powered cat flap to stop his cat from bringing home dead animals&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://igniteseattle.com/&quot;&gt;Ignite Seattle&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://docs.aws.amazon.com/deeplens/latest/dg/what-is-deeplens.html&quot;&gt;AWS DeepLens&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;

</description>
        <pubDate>Fri, 13 Sep 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/09/13/ml-cat-door.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/09/13/ml-cat-door.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 39: Rolling in the Deep Patient</title>
        <description>&lt;p&gt;We take a deep dive into the poster child for black-box machine learning methods, namely Deep Patient: an unsupervised learning method that uses denoising auto-encoders as the means for extracting salient features in electronic health records, which in turn can then be used to predict health outcomes. We do our best to explain what on earth the previous sentence meant.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/39-Rolling-in-the-Deep-Patient-e5802m&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h2 id=&quot;sources&quot;&gt;Sources&lt;/h2&gt;

&lt;ul&gt;
  &lt;li&gt;&lt;a href=&quot;https://www.nature.com/articles/srep26094&quot;&gt;Deep Patient article&lt;/a&gt;&lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 06 Sep 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/09/06/deep-patient.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/09/06/deep-patient.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 38: The Misuse of Statistics in Court</title>
        <description>&lt;p&gt;In this episode, we talk about how a statistical concept that you would learn about in an introductory course was misused in court.  The error led to dire consequences in the case of Sally Clark who was charged in the deaths of two of her children.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/38-The-Misuse-of-Statistics-in-Court-e4toep&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h2 id=&quot;sources&quot;&gt;Sources&lt;/h2&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://web.archive.org/web/20110824151124/http://www.rss.org.uk/uploadedfiles/documentlibrary/744.pdf&quot;&gt;Royal Statistical Society concerned by issues raised in Sally Clark case&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;http://www.statslab.cam.ac.uk/~apd/SallyClark_report.doc&quot;&gt;Sally Clark Appeal by Professor A. P. Dawid&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://rss.onlinelibrary.wiley.com/doi/full/10.1111/j.1740-9713.2005.00077.x&quot;&gt;Article: Reflections on the cot death cases&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://onlinelibrary.wiley.com/doi/pdf/10.5694/j.1326-5377.2004.tb06162.x&quot;&gt;MJA Article: Unexpected infant death: lessons from the Sally Clark case&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.ncbi.nlm.nih.gov/pmc/articles/PMC4934658/&quot;&gt;Prosecutor’s Fallacy Paper&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 30 Aug 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/08/30/misuse-stats-court.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/08/30/misuse-stats-court.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 37: Susan Starts a New Job</title>
        <description>&lt;p&gt;In this episode, we talk about Susan’s new job as a Data Scientist!  She recently transitioned from academia to industry and we discuss her experience with searching for positions, interviewing, and her first few weeks in her new role.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/37-Susan-Starts-a-New-Job-e4tojg&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;
</description>
        <pubDate>Fri, 23 Aug 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/08/23/susan-new-job.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/08/23/susan-new-job.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 36: What's New in Machine Learning Startups</title>
        <description>&lt;p&gt;In this episode, we talk about some machine learning startups to pay attention to this year.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/36-Whats-New-in-Machine-Learning-Startups-e4ekhj&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.forbes.com/sites/louiscolumbus/2019/05/27/25-machine-learning-startups-to-watch-in-2019/#538f835e3c0b&quot;&gt;25 Machine Learning Startups To Watch In 2019&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.prnewswire.com/news-releases/ablacon-inc-raises-21-5m-series-a-to-advance-ai-enabled-atrial-fibrillation-mapping-system-300840324.html&quot;&gt;Ablacon Raises $21.5M&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.startups.com/library/expert-advice/series-funding-a-b-c-d-e&quot;&gt;Startup funding, explained&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://techcrunch.com/2019/05/21/people-ai-the-predictive-sales-startup-raises-60m-at-around-500m-valuation/&quot;&gt;People.ai, the predictive sales startup, raises $60M&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 16 Aug 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/08/16/ml-startups.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/08/16/ml-startups.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 35: You Look How You Sound</title>
        <description>&lt;p&gt;Deep learning has been useful for lots of applications when it comes to prediction. Yet another is the use of a short sound clip of speech to predict the face of the speaker.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/35-Using-voice-to-predict-appearance-e4eksr&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.sciencealert.com/this-ai-tries-to-guess-what-you-look-like-based-on-your-voice&quot;&gt;This Creepy AI Predicts What You Look Like Based on Your Voice&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://arxiv.org/abs/1905.09773&quot;&gt;Speech2Face paper: Speech2Face: Learning the Face Behind a Voice&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://speech2face.github.io/&quot;&gt;Speech2Face website: Learning the Face Behind a Voice&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://looking-to-listen.github.io/&quot;&gt;AVSpeech paper website&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 09 Aug 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/08/09/voice-appearance.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/08/09/voice-appearance.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 34: Protecting Kids' Digital Privacy</title>
        <description>&lt;p&gt;In this episode, we talk about protecting kids’ digital privacy.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/34-Protecting-Kids-Digital-Privacy-e4apu7&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.nbcnews.com/tech/tech-news/kid-browsing-company-says-its-artificial-intelligence-can-tell-n1009021&quot;&gt;Is that a kid browsing? This company says its artificial intelligence can tell&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.superawesome.com/&quot;&gt;SuperAwesome.com: The technology powering the kids digital media ecosystem&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.businessnewsdaily.com/10625-businesses-collecting-data.html&quot;&gt;How Businesses Are Collecting Data (And What They’re Doing With It)&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://leginfo.legislature.ca.gov/faces/billTextClient.xhtml?bill_id=201720180AB375&quot;&gt;CA CCPA&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.ftc.gov/enforcement/rules/rulemaking-regulatory-reform-proceedings/childrens-online-privacy-protection-rule&quot;&gt;Children’s Online Privacy Protection Rule (“COPPA”)&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.unicef.org/media/media_102560.html&quot;&gt;UNICEF: More than 175,000 children go online for the first time every day, tapping into great opportunities, but facing grave risks&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 02 Aug 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/08/02/kids-digital-privacy.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/08/02/kids-digital-privacy.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 33: Statisticians Hate Post-Hoc Power</title>
        <description>&lt;p&gt;Statistics is key to demonstrating the effectiveness of new advancements in science and medicine, but when statistical significance is not achieved, is post-hoc power a valid justification?&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/33-Statisticians-Hate-Post-Hoc-Power-e4ekpn&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.journalofsurgicalresearch.com/article/S0022-4804(19)30185-4/fulltext&quot;&gt;Journal of Surgical Research article: Is the Power Threshold of 0.8 Applicable to Surgical Science?—Empowering the Underpowered Study&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://retractionwatch.com/2019/06/19/statisticians-clamor-for-retraction-of-paper-by-harvard-researchers-they-say-uses-a-nonsense-statistic/&quot;&gt;RetractionWatch: Statisticians Clamor for Retraction of Paper by Harvard Researchers&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;http://daniellakens.blogspot.com/2014/12/observed-power-and-what-to-do-if-your.html&quot;&gt;Blogpost: Observed power, and what to do if your editor asks for post-hoc power analyses&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://lesslikely.com/statistics/observed-power-magic/&quot;&gt;Blogpost: Calculating Observed Power Is Just Transforming Noise&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;

</description>
        <pubDate>Fri, 26 Jul 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/07/26/post-hoc-power.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/07/26/post-hoc-power.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 32: Amazon's 3D Body Scan Study</title>
        <description>&lt;p&gt;In this episode, we talk about Amazon’s 3D body scan study.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/32-Amazons-3D-Body-Scan-Study-e4dh1i&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://mashable.com/article/amazon-body-labs-image-scanning-study/&quot;&gt;Amazon is 3D-scanning people’s bodies in exchange for gift cards&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.theverge.com/2019/5/23/18637369/amazon-body-labs-3d-scanning-study-new-york-volunteer-fashion&quot;&gt;Amazon wants to 3D-scan volunteers’ bodies for a $25 gift card&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.businessinsider.com/amazon-3d-body-scanning-for-clothes-2018-5&quot;&gt;Amazon is reportedly scanning people’s bodies so it can sell you clothes&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.wsj.com/articles/amazon-studies-body-sizes-to-get-that-perfect-clothing-fit-1525355115?tesla=y&quot;&gt;Amazon Wants to Know Your Waistline&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.economist.com/science-and-technology/2019/05/23/online-identification-is-getting-more-and-more-intrusive&quot;&gt;Online identification is getting more and more intrusive&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.theverge.com/2019/6/11/18661595/facebook-study-app-monitor-phone-usage-pay&quot;&gt;Facebook will pay you to let it track what you do on your phone&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;

</description>
        <pubDate>Fri, 19 Jul 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/07/19/amazon-3d.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/07/19/amazon-3d.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 31: What Data Visualizations Do You Care About? It's Personal</title>
        <description>&lt;p&gt;In this episode, we talk about how data are personal for those in a rural Pennsylvania community.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/31-What-Data-Visualizations-Do-You-Care-About--Its-Personal-e4ap0f&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://medium.com/multiple-views-visualization-research-explained/data-is-personal-what-we-learned-from-42-interviews-in-rural-america-93539f25836d&quot;&gt;Data is Personal. What We Learned from 42 Interviews in Rural America.&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://arxiv.org/pdf/1901.01920.pdf&quot;&gt;Research article: Data is Personal: Attitudes and Perceptions of Data Visualization in Rural Pennsylvania&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 12 Jul 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/07/12/data-personal.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/07/12/data-personal.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 30: Some Like It Hot -- What Gender Reveals About Our Temperature Preferences</title>
        <description>&lt;p&gt;Word on the street is that women prefer warmer temperatures than men do. Researchers designed an experiment to investigate whether this is actually true, specifically, considering how men and women perform on various cognitive tasks under different temperature scenarios. In this episode, we dissect the study so you can judge whether you believe the results.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;&lt;a href=&quot;https://journals.plos.org/plosone/article?id=10.1371/journal.pone.0216362&quot;&gt;Plos One article: Battle for the thermostat: Gender and the effect of temperature on cognitive performance&lt;/a&gt;&lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 05 Jul 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/07/05/temperature-gender.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/07/05/temperature-gender.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 29: Jeopardy! Meets Statistics</title>
        <description>&lt;p&gt;Jeopardy! is a weeknightly televised trivia game show. In recent months, one player, James Holzhauer has taken the Jeopardy! fandom by storm with his unusual style of play and his long run of big wins. In this episode, we discuss how statistics can help explain his betting tactics, and we discuss how some other Jeopardy! players have used statistics to help up their game.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/29-Jeopardy--Meets-Statistics-e4ekv5&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.vox.com/culture/2019/6/3/18650485/jeopardy-james-holzhauer-loses-record-winnings&quot;&gt;James Holzhauer’s Jeopardy winning streak has come to an end&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.wired.com/story/jeopardy-record-james-holzhauer-strategy/&quot;&gt;Inside James Holzhauer’s Jeopardy!-dominating Strategy&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://cdr.lib.unc.edu/concern/parent/tb09j9193/file_sets/bz60d095h&quot;&gt;Emma Boettcher’s Master Thesis&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://futurism.com/jeopardy-emma-boettcher-ai-james-holzhauer&quot;&gt;We Found “Jeopardy!” Kingslayer Emma Boettcher’s Thesis on Data Mining&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://gawker.com/5860275/how-a-geek-cracked-the-jeopardy-code&quot;&gt;How a Geek Cracked the Jeopardy! Code&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 28 Jun 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/06/28/jeopardy.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/06/28/jeopardy.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 28: Facial Recognition Technology Update and Rating Trustworthiness of AI-Generated Airbnb Profiles</title>
        <description>&lt;p&gt;In this episode, we discuss a number of miscellaneous news updates regarding facial recognition technology (concerning San Francisco, Amazon, and pandas!).  And then, we talk about how much we trust AI-generated profiles for Airbnb.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/28-Facial-Recognition-Technology-Update-and-Rating-Trustworthiness-of-AI-Generated-Airbnb-Profiles-e46bp8&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.salon.com/2019/05/21/san-franciscos-facial-recognition-ban-still-lets-corporations-spy-on-you/&quot;&gt;San Francisco’s facial recognition ban still lets corporations spy on you&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.cnbc.com/2018/12/06/how-amazon-rekognition-works-and-what-its-used-for.html&quot;&gt;Amazon’s facial recognition service is being used to scan mugshots, but it’s also used to track innocuous things like soccer balls&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.nytimes.com/2019/05/22/technology/amazon-climate-change-facial-recognition.html&quot;&gt;Amazon Investors Reject Proposals on Climate Change and Facial Recognition&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.cnbc.com/2019/05/25/amazon-facial-recognition-ban-won-just-2percent-of-shareholder-vote.html&quot;&gt;Amazon facial recognition ban won just 2% of shareholder vote&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.theverge.com/2019/5/22/18635632/amazon-shareholders-vote-facial-recognition-climate-change-investors-employees&quot;&gt;Amazon shareholders vote down proposals on facial recognition and climate change&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://tech.cornell.edu/news/ai-generated-profiles-airbnb-users-prefer-a-human-touch/&quot;&gt;AI-generated profiles? Airbnb users prefer a human touch&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;http://www.mauricejakesch.com/pub/chi2019__ai_mc_camera_ready.pdf&quot;&gt;CHI 2019 Paper: AI-Mediated Communication: How the Perception that Profile Text was Written by AI Affects Trustworthiness&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 21 Jun 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/06/21/facial-recog-trustworthiness-airbnb.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/06/21/facial-recog-trustworthiness-airbnb.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 27: Does Uber/Lyft Help Or Hurt Traffic Congestion and Machine Learning Interpretability</title>
        <description>&lt;p&gt;In this episode, we look at a study about whether ride-sharing services contribute to increased or decreased traffic congestion in San Francisco. We then discuss some strategies to build interpretable machine learning models.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/27-Does-UberLyft-Help-Or-Hurt-Traffic-Congestion-and-Machine-Learning-Interpretability-e4af56&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://advances.sciencemag.org/content/5/5/eaau2670/tab-pdf&quot;&gt;Science Advances article: Do transportation network companies decrease or increase congestion?&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.sfcta.org/sf-champ-modeling&quot;&gt;SF-CHAMP Modeling&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.kdnuggets.com/2018/03/gdpr-machine-learning-illegal.html&quot;&gt;KDNuggets.com: Will GDPR Make Machine Learning Illegal?&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://christophm.github.io/interpretable-ml-book/&quot;&gt;Interpretable Machine Learning free online textbook&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.reddit.com/r/MachineLearning/comments/7w46zv/p_lime_explaining_the_predictions_of_any_machine/&quot;&gt;Reddit.com: [P] Lime: Explaining the predictions of any machine learning classifier&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://uc-r.github.io/lime&quot;&gt;UC Business Analytics R Programming Guide: Visualizing ML Models with LIME&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://arxiv.org/abs/1602.04938&quot;&gt;arXiv.org: “Why Should I Trust You?”: Explaining the Predictions of Any Classifier&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://arxiv.org/abs/1705.07874&quot;&gt;arXiv.org: A Unified Approach to Interpreting Model Predictions&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 14 Jun 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/06/14/ride-sharing-ml-interpretability.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/06/14/ride-sharing-ml-interpretability.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 26: Household Electronics That See and Google's Reservation AI</title>
        <description>&lt;p&gt;In this episode, we talk about a new innovation that enables household electronics to see what’s around them. We then discuss Google Duplex, an AI designed to happily make reservations and appointments for you.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/26-Household-Electronics-That-See-and-Googles-Reservation-AI-e43ph9&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.economist.com/science-and-technology/2019/05/11/https://www.economist.com/science-and-technology/2019/05/11/household-electronics-are-undergoing-a-sensory-makeoverhousehold-electronics-are-undergoing-a-sensory-makeover&quot;&gt;The Economist: Household electronics are undergoing a sensory makeover&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.theverge.com/2019/1/4/18168565/amazon-alexa-devices-how-many-sold-number-100-million-dave-limp&quot;&gt;The Verge: Amazon Says 100 Million Alexa Devices Have Been Sold — What’s Next?&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://gizmodo.com/the-terrible-truth-about-alexa-1834075404&quot;&gt;Gizmodo: The Terrible Truth About Alexa&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.bloomberg.com/news/articles/2019-04-10/is-anyone-listening-to-you-on-alexa-a-global-team-reviews-audio&quot;&gt;Bloomberg: Amazon Workers Are Listening to What You Tell Alexa&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;http://www.gierad.com/projects/surfacesight/&quot;&gt;SurfaceSight&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.youtube.com/watch?v=znNe4pMCsD4&quot;&gt;Google Duplex Demo&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.theverge.com/2019/5/9/18538194/google-duplex-ai-restaurants-experiences-review-robocalls&quot;&gt;The Verge: One Year Later, Restaurants Are Still Confused By Google Duplex&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.theverge.com/2019/5/7/18531195/google-duplex-web-update-car-rentals-movie-tickets-io-2019&quot;&gt;The Verge: Google is bringing Duplex to the web to help book car rentals and movie tickets&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.forbes.com/sites/tomtaulli/2019/04/21/what-you-need-to-know-about-chatbots/#29c56d444844&quot;&gt;Forbes: What You Need To Know About Chatbots&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 07 Jun 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/06/07/household-elec-google-duplex.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/06/07/household-elec-google-duplex.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 25: DataFest 2019 and Measuring Migrations from Hurricane Maria</title>
        <description>&lt;p&gt;Susan recently served as a judge at a local DataFest competition (a weekend-long data competition for undergraduates). She shares her experiences and recommendations for future contestants. We then discuss how Facebook data might be helpful for counting the number of people how migrated from Puerto Rico to the mainland U.S. as a result of Hurricane Maria.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/25-DataFest-2019-and-Measuring-Migrations-from-Hurricane-Maria-e43pen&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://ww2.amstat.org/education/datafest/index.cfm&quot;&gt;ASA Datafest Website&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.sciencenews.org/article/facebook-data-show-how-many-people-left-puerto-rico-after-hurricane-maria&quot;&gt;Science News: Facebook data show how many people left Puerto Rico after Hurricane Maria&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://osf.io/preprints/socarxiv/39s6c/&quot;&gt;Research article: The impact of Hurricane Maria on out-migration from Puerto Rico: Evidence from Facebook data&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://centropr.hunter.cuny.edu/sites/default/files/data_briefs/Hurricane_maria_1YR.pdf&quot;&gt;Puerto Rico One Year After Hurricane Maria&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 31 May 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/05/31/datafest-hurricane-maria.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/05/31/datafest-hurricane-maria.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 24: Predictive Power of Early Polling and Did a TV Show Result in Higher Teenage Suicides?</title>
        <description>&lt;p&gt;In this episode, we discuss FiveThirtyEight.com’s analysis of primary election polling over the past 40 years. In particular, we consider whether early polling is helpful for predicting election outcomes.  And then, we talk about a study that potentially blames Netflix for a surge in teenage suicides in 2017.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/24-Predictive-Power-of-Early-Polling-and-Did-a-TV-Show-Result-in-Higher-Teenage-Suicides-e43oic&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://fivethirtyeight.com/features/we-analyzed-40-years-of-primary-polls-even-early-on-theyre-fairly-predictive/&quot;&gt;We Analyzed 40 Years Of Primary Polls. Even Early On, They’re Fairly Predictive.&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.jaacap.org/article/S0890-8567(19)30288-6/fulltext&quot;&gt;Research Article: Association Between the Release of Netflix’s 13 Reasons Why and Suicide Rates in the United States: An Interrupted Times Series Analysis&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.npr.org/2019/04/30/718529255/teen-suicide-spiked-after-debut-of-netflixs-13-reasons-why-report-says&quot;&gt;NPR: Teen Suicide Spiked After Debut Of Netflix’s ‘13 Reasons Why,’ Study Says&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://tylervigen.com/spurious-correlations&quot;&gt;Spurious Correlations&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 24 May 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/05/24/538polling-suicides.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/05/24/538polling-suicides.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 23: Offline Song Identification and Perceptions about AI</title>
        <description>&lt;p&gt;In this episode, we discuss how Google’s Now Playing feature can identify songs that are playing around you, using embeddings. We then talk about a study that reports on America’s perceptions about artificial intelligence – who can we trust to develop AI responsibly?&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/23-Offline-Song-Identification-and-Perceptions-about-AI-e3rkht&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.pcmag.com/news/356833/googles-pixel-2-phones-recognize-17-300-songs-offline&quot;&gt;Google’s Pixel 2 Phones Recognize 17,300 Songs Offline&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://ai.googleblog.com/2018/09/googles-next-generation-music.html&quot;&gt;Google’s Next Generation Music Recognition&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;http://www.claudiobellei.com/2018/01/06/backprop-word2vec/&quot;&gt;Word2Vec tutorial&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://governanceai.github.io/US-Public-Opinion-Report-Jan-2019/&quot;&gt;Artificial Intelligence: American Attitudes and Trends&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.artificialintelligence-news.com/2019/01/10/report-public-ai-benefit-humanity/&quot;&gt;SOCIETY Report: The public is unconvinced AI will benefit humanity&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.vox.com/future-perfect/2019/1/9/18174081/fhi-govai-ai-safety-american-public-worried-ai-catastrophe&quot;&gt;Vox: The American public is already worried about AI catastrophe&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.bloomberg.com/news/articles/2019-01-10/u-s-military-trusted-more-than-google-facebook-to-develop-ai&quot;&gt;U.S. Military Trusted More Than Google, Facebook to Develop AI&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 17 May 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/05/17/now-playing-perceptions-ai.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/05/17/now-playing-perceptions-ai.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 22: Betting on the Game of Thrones and the Misfortune of Lefthandedness</title>
        <description>&lt;p&gt;In this episode, we discuss how bookmakers price/take bets on outcomes in the Game of Thrones. We then discuss a study that claimed that lefthanded people have shorter life expectancies than righthanded people. Spoiler alert: lefthanders have nothing to worry about!&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/22-Betting-on-the-Game-of-Thrones-and-the-Misfortune-of-Lefthandedness-e3rkh6&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.pinnacle.com/en/betting-articles/Betting-Strategy/how-bookmakers-work/SF72KYQE4FZAA4TZ&quot;&gt;Pinnacle.com: How Bookmakers Work&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://mybookie.ag/sportsbook/got/&quot;&gt;Mybookie.ag: Game of Thrones Bets&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.onlinegambling.com/news/2018/03/game-of-thrones-betting-halted-after-suspicious-wagers-on-iron-throne/&quot;&gt;‘Game of Thrones’ Betting Halted After Suspicious Rash of Wagers on Long Shot to Win Iron Throne&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.oddsshark.com/entertainment/game-thrones-prop-odds-bet-who-will-be-ruling-westeros&quot;&gt;OddsShark: Bet on Who Will be Ruling Westeros&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.nature.com/news/the-power-of-prediction-markets-1.20820&quot;&gt;Nature.com: The power of prediction markets&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.ncbi.nlm.nih.gov/pubmed/2006231&quot;&gt;Psychology Bulletin: Left-handedness: a marker for decreased survival fitness.&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 10 May 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/05/10/got-lefthanded.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/05/10/got-lefthanded.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 21: Pitch Call Accuracy and Predicting the Outcome of the Champions League</title>
        <description>&lt;p&gt;Buckle up for a sports-filled episode! We discuss a study that analyzes the accuracy of umpire calls about strikes vs. balls and take a deep dive into FiveThirtyEight.com’s statistical methods for predicting the winner of the Champions League.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/21-Pitch-Call-Accuracy-and-Predicting-the-Outcome-of-the-Champions-League-e3rkfh&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.bu.edu/today/2019/mlb-umpires-strike-zone-accuracy/&quot;&gt;MLB Umpires Missed 34,294 Ball-Strike Calls in 2018. Bring on Robo-umps?&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;http://mlb.mlb.com/documents/0/8/0/268272080/2018_Official_Baseball_Rules.pdf&quot;&gt;Official Baseball Rules 2018&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://projects.fivethirtyeight.com/soccer-predictions/champions-league/&quot;&gt;FiveThirtyEight: Champions League Predictions&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://fivethirtyeight.com/methodology/how-our-club-soccer-predictions-work/&quot;&gt;FiveThirtyEight: How Our Club Soccer Predictions Work&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 03 May 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/05/03/umpiring-accuracy-soccer-predictions.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/05/03/umpiring-accuracy-soccer-predictions.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 20: Thinking Like Computers and Text Mining the Mueller Report</title>
        <description>&lt;p&gt;In this episode, we discuss a study that recruits human researchers to try to predict how computers classify images. We then highlight a number of examples of natural language processing techniques applied to the Mueller Report.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/20-Thinking-Like-Computers-and-Text-Mining-the-Mueller-Report-e3o0tg&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.sciencedaily.com/releases/2019/03/190322090239.htm&quot;&gt;Researchers get humans to think like computers&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.nature.com/articles/s41467-019-08931-6.pdf&quot;&gt;Nature Communications: Humans can decipher adversarial images&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://spdustin.gitlab.io/the-mueller-report/Part%201.html&quot;&gt;Mueller Report and “Data Science” (part 1 in a series)&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.jlukito.com/blog/2019/4/20/using-r-to-analyze-the-redacted-mueller-report&quot;&gt;Using R To Analyze The Redacted Mueller Report&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 26 Apr 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/04/26/computer-thinking-mueller-report.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/04/26/computer-thinking-mueller-report.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 19: Seeing with AI and Detecting Exoplanets</title>
        <description>&lt;p&gt;In this episode, we discuss Microsoft’s handy phone application for scanning and reporting on our surroundings, as a way of helping vision impaired individuals better interact with the world around them. We then talk about how AI can be useful in detecting exoplanets (or extrasolar planets).&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/19-Seeing-with-AI-and-Detecting-Exoplanets-e3o0sv&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.microsoft.com/en-us/seeing-ai&quot;&gt;Microsoft’s Seeing AI app&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.npr.org/2019/04/01/707967899/young-astronomer-uses-artificial-intelligence-to-discover-2-exoplanets&quot;&gt;NPR: Young Astronomer Uses Artificial Intelligence To Discover 2 Exoplanets&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.cfa.harvard.edu/~avanderb/Deep_Learning_2.pdf&quot;&gt;“Identifying Exoplanets With Deep Learning II” paper&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://iopscience.iop.org/article/10.3847/1538-3881/aa9e09/pdf&quot;&gt;“Identifying Exoplanets with Deep Learning” paper&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 19 Apr 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/04/19/seeing-exoplanets.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/04/19/seeing-exoplanets.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 18: Statistical Anxiety and the Fight Against Statistical Significance</title>
        <description>&lt;p&gt;We discuss a survey designed to analyze the extent and root cause of statistical anxiety in the classroom, discussing the methods/limitations of the study. We then talk about yet another crusade against hypothesis testing, this time around the concept of “statistical significance”.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/18-Statistical-Anxiety-and-the-Fight-Against-Statistical-Significance-e3luq7&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://psycnet.apa.org/record/2019-01035-001&quot;&gt;Using network science to understand statistics anxiety among college students&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.sciencedaily.com/releases/2019/01/190116111131.htm&quot;&gt;‘Statistics anxiety’ is real, and new research suggests targeted ways to handle it&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.nature.com/articles/d41586-019-00857-9&quot;&gt;Scientists rise up against statistical significance&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.amstat.org/asa/files/pdfs/P-ValueStatement.pdf&quot;&gt;American Statistical Association Releases Statement On Statistical Significance And p-Values&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 12 Apr 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/04/12/statistical-anxiety-significance.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/04/12/statistical-anxiety-significance.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 17: How Theranos Sinned Statistically</title>
        <description>&lt;p&gt;In this episode, Susan Wang is joined by guest Natalie Doss to consider the statistical sins committed by Theranos, the former blood testing unicorn. From arbitrary data manipulation to inappropriate data aggregation, we discuss what they did and why these practices were particularly bad. Then, we weigh in on how Theranos could have done worse, making it harder for the public to find out about their faulty tests.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/17-How-Theranos-Sinned-Statistically-e3jfgt&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;&lt;a href=&quot;https://www.amazon.com/Bad-Blood-Secrets-Silicon-Startup/dp/152473165X&quot;&gt;Bad Blood&lt;/a&gt;&lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 05 Apr 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/04/05/Theranos.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/04/05/Theranos.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 16: Machine-Generated Faces/Text, and Relating Health Outcomes to Skin Tone</title>
        <description>&lt;p&gt;We discuss NVIDIA’s AI-generated faces that look incredibly authentic, and relatedly, OpenAI’s text generator that is so capable that it has to be kept under wraps. We then assess the study design of a recent research article that considered how health outcomes vary amongst African Americans of different skin tones.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/16-Machine-Generated-Faces--Text--and-Relating-Health-Outcomes-to-Skin-Color-e3bu1g&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.cnn.com/2019/02/28/tech/ai-fake-faces/index.html&quot;&gt;CNN Article on AI-generated Faces&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://thispersondoesnotexist.com&quot;&gt;thispersondoesnotexist.com&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://skymind.ai/wiki/generative-adversarial-network-gan&quot;&gt;Beginner’s Guide to GANs&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://github.com/NVlabs/stylegan&quot;&gt;StyleGAN on Github&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://arxiv.org/pdf/1812.04948.pdf&quot;&gt;StyleGAN paper on Arxiv&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.sciencealert.com/scientists-developed-an-ai-so-advanced-they-say-it-s-too-dangerous-to-release&quot;&gt;Article about OpenAI&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://statmodeling.stat.columbia.edu/2019/02/27/light-privilege-skin-tone-stratification-in-health-among-african-americans/&quot;&gt;Andrew Gelman article on Skin Tone paper&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://journals.sagepub.com/doi/pdf/10.1177/2332649218793670&quot;&gt;Light Privilege? Skin Tone Stratification in Health among African Americans&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.ncbi.nlm.nih.gov/projects/gap/cgi-bin/document.cgi?study_id=phs000309.v2.p2&amp;amp;phd=3472&quot;&gt;CARDIA Y20 Follow-up Exam VII Protocol&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 15 Mar 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/03/15/AI-faces-skin-tone.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/03/15/AI-faces-skin-tone.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 15: Deep Learning to Fold Proteins and Automated Journalism</title>
        <description>&lt;p&gt;We discuss opportunities for machines and humans in the prediction of protein structures, a necessary task in new drug discovery. Google’s DeepMind has taken the prize in the recent iteration of CASP, a protein folding prediction challenge. We also discuss how AI has begun to revolutionize journalism.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/15-Deep-Learning-to-Fold-Proteins-and-Automated-Journalism-e37ms3&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.nytimes.com/2019/02/05/technology/artificial-intelligence-drug-research-deepmind.html?partner=rss&amp;amp;emc=rss&quot;&gt;Making New Drugs With a Dose of Artificial Intelligence&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://moalquraishi.wordpress.com/2018/12/09/alphafold-casp13-what-just-happened/&quot;&gt;Mohammed AlQuraishi Blogpost on CASP13&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://fold.it/portal/info/faq&quot;&gt;FoldIt FAQs&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://endlessmedia.news/media-deepdive/the-power-of-subjectivity-in-the-age-of-robot-journalism-118/&quot;&gt;The power of subjectivity in the age of robot journalism&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.nytimes.com/2019/02/05/business/media/artificial-intelligence-journalism-robots.html&quot;&gt;The Rise of the Robot Reporter&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://medium.com/@orge/this-is-the-future-of-journalism-will-a-machine-get-it-right-d3e747f16751&quot;&gt;Medium.com Article: The Future of Journalism: Will Robots Get it Right?&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.forbes.com/sites/nicolemartin1/2019/02/08/did-a-robot-write-this-how-ai-is-impacting-journalism/#1721e7fb7795&quot;&gt;Forbes.com: Did A Robot Write This? How AI Is Impacting Journalism&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.institutionalinvestor.com/article/b15130p2nnv8dr/why-listen-to-earnings-calls-when-artificial-intelligence-can-do-it-better&quot;&gt;Why Listen to Earnings Calls When Artificial Intelligence Can Do It Better?&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://insight.factset.com/interpreting-earnings-calls-with-natural-language-processing&quot;&gt;Interpreting Earnings Calls with Natural Language Processing&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 08 Mar 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/03/08/protein-folding-auto-journalism.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/03/08/protein-folding-auto-journalism.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 14: A Personality Test that Makes Sense and What Does Spotify Know?</title>
        <description>&lt;p&gt;FiveThirtyEight.com has provided a free, online personality test that might make more sense than your typical online clickbaity quiz. We talk about why it calls itself the only personality test that isn’t junk science. We then discuss the results of a recent study on Spotify data. Does it know too much about us (and you)? We’ll let you know.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/Episode-14-A-Personality-Test-that-Makes-Sense-and-What-Does-Spotify-Know-e33j9j&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://projects.fivethirtyeight.com/personality-quiz/&quot;&gt;FiveThirtyEight personality test&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://arstechnica.com/science/2019/01/spotify-data-shows-how-music-preferences-change-with-latitude/#p3&quot;&gt;Spotify data shows how music preferences change with latitude&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.nature.com/articles/s41562-018-0508-z&quot;&gt;Original research article: Global music streaming data reveal diurnal and seasonal patterns of affective preference&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 01 Mar 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/03/01/personality-test-spotify.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/03/01/personality-test-spotify.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 13: IBM's Debate Machine and Adopting a 'Data Culture' in Companies</title>
        <description>&lt;p&gt;On February 11, IBM showcased its Project Debater in a face-off against debate champion Harish Natarajan. We talk about how this machine vs. human competition went. Then, we discuss a Harvard Business Review article citing a survey that discovered companies are not becoming data-oriented quickly enough.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/Episode-13-IBMs-Debate-Machine-and-Adopting-a-Data-Culture-in-Companies-e37mq1&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;http://fortune.com/2019/02/12/man-versus-machine-ai-artificial-intelligence-ibm-project-debater/&quot;&gt;Fortune.com article on Project Debater&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.youtube.com/watch?v=m3u-1yttrVw&quot;&gt;Youtube video of Project Debater vs. Harish Natarajan&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://hbr.org/2019/02/companies-are-failing-in-their-efforts-to-become-data-driven&quot;&gt;HBR Article: Companies Are Failing in Their Efforts to Become Data-Driven&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;http://newvantage.com/wp-content/uploads/2018/12/Big-Data-Executive-Survey-2019-Findings-Updated-010219-1.pdf&quot;&gt;NVP Big Data and AI Executive Survey 2019 Findings&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 22 Feb 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/02/22/debate-ibm-nvp.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/02/22/debate-ibm-nvp.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 12: Super Bowl Stats, Confidence Intervals, and Data Sources</title>
        <description>&lt;p&gt;Three topics are featured in this episode: first, statistics about Super Bowl LIII, including what was in the bowls as the game happened; second, a fun activity for teaching confidence intervals; finally, we present some online sources for data.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/Episode-12-Super-Bowl-Stats--Confidence-Intervals--and-Data-Sources-e35h2v&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.drovers.com/article/super-bowl-food-statistics-2019&quot;&gt;Super Bowl Food Statistics for 2019&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.wusa9.com/article/sports/nfl/superbowl/all-the-records-set-during-super-bowl-53/507-c1b28a03-cb4a-4146-9240-5eecc78573ae&quot;&gt;All the records set during Super Bowl 53&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.nationalchickencouncil.org/americans-to-eat-more-than-1-3-billion-chicken-wings-for-super-bowl/&quot;&gt;Americans to Eat More than 1.3 Billion Chicken Wings for Super Bowl&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://nrf.com/media-center/press-releases/fewer-consumers-celebrating-valentines-day-those-who-do-are-spending&quot;&gt;Fewer consumers celebrating Valentine’s Day but those who do are spending more&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://amstat.tandfonline.com/doi/abs/10.1080/00031305.2012.752408&quot;&gt;Twenty-Five Analogies for Explaining Statistical Concepts&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://amstat.tandfonline.com/doi/abs/10.1080/00031305.2017.1305294#.XF8aqc9KjOQ&quot;&gt;Enriching Students’ Conceptual Understanding of Confidence Intervals: An Interactive Trivia-Based Classroom Activity&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;

&lt;h3 id=&quot;questions-for-confidence-interval-activity&quot;&gt;Questions for Confidence Interval Activity&lt;/h3&gt;

&lt;p&gt;The questions below were asked in the podcast. The answers are provided in line. Answers that are not immediately obvious through a Google search are linked to their sources.&lt;/p&gt;

&lt;ol&gt;
  &lt;li&gt;
    &lt;p&gt;What’s the average distance from the Earth to Mars in kilometers?” &lt;a href=&quot;https://www.space.com/14729-spacekids-distance-earth-mars.html&quot;&gt;225 mil km&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;What’s the height of Denali (formerly Mt. McKinley) in feet? 20,310ft to 20,320 ft&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;What’s the minimum number of moves required to solve any Rubik’s cube? 20.&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;What year was the first toothpaste tube invented? 1873&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;How many men signed the Declaration of Independence? 56&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;How many milligrams of caffeine on average are in a shot of Starbucks espresso? 89 mg&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;What percentage of American adults is estimated to own a smartphone , as of 2018? &lt;a href=&quot;http://www.pewglobal.org/2019/02/05/smartphone-ownership-is-growing-rapidly-around-the-world-but-not-always-equally/&quot;&gt;81%&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;What is the greatest amount of snow to fall in a single US location over 24 hour period, in inches? 75.8”&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;In 2017, how much beef did Americans consume per person on average (in lbs)? &lt;a href=&quot;https://www.nationalchickencouncil.org/about-the-industry/statistics/per-capita-consumption-of-poultry-and-livestock-1965-to-estimated-2012-in-pounds/&quot;&gt;56.9 lbs&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;As of Feb 1, 2019, how many bitcoins are there in circulation? &lt;a href=&quot;https://www.blockchain.com/en/charts/total-bitcoins&quot;&gt;17,516,000&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ol&gt;
</description>
        <pubDate>Fri, 15 Feb 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/02/15/superbowl53-CI-datasources.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/02/15/superbowl53-CI-datasources.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 11: How Machines Might be Biased and the Job Market for Data Scientists</title>
        <description>&lt;p&gt;AI and ML algorithms are growing popular – but they can actually perpetuate cognitive biases in our daily lives. We discuss the state of the problem and possible solutions. We also present a favorable job outlook for aspiring (or continuing!) data scientists.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/Episode-11-How-Machines-Might-be-Biased-and-the-Job-Market-for-Data-Scientists-e33ddj&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://arstechnica.com/tech-policy/2019/01/yes-algorithms-can-be-biased-heres-why/#p3&quot;&gt;Yes, algorithms can be biased&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://developers.google.com/machine-learning/fairness-overview/&quot;&gt;Google: Machine Learning Fairness&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://qz.com/958666/the-reason-why-most-of-the-images-are-men-when-you-search-for-doctor/&quot;&gt;The reason why most of the images that show up when you search for doctor are white men&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.propublica.org/article/how-we-analyzed-the-compas-recidivism-algorithm&quot;&gt;ProPublica COMPAS Study&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://medium.com/ibm-watson-data-lab/cognitive-bias-in-machine-learning-d287838eeb4b&quot;&gt;Cognitive Bias in Machine Learning&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://stanford.edu/~cpiech/bio/papers/fairnessAdversary.pdf&quot;&gt;Achieving Fairness through Adversarial Learning: an Application to Recidivism Prediction paper&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://spectrum.ieee.org/view-from-the-valley/at-work/tech-careers/demand-and-salaries-for-data-scientists-continue-to-climb&quot;&gt;Demand and Salaries for Data Scientists Continue to Climb&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 08 Feb 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/02/08/ML-bias-jobs-data-science.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/02/08/ML-bias-jobs-data-science.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 10: AI in Medicine and Racial Bias in College Admissions</title>
        <description>&lt;p&gt;Artificial intelligence is starting to make waves in medicine; we look at how technology might potentially change how medical testing works. We also bring in some statistical reasoning in the debate of whether or not there is racial discrimination in Harvard’s college admissions process.&lt;/p&gt;

&lt;iframe src=&quot;https://anchor.fm/databytes/embed/episodes/Episode-10-AI-in-Medicine-and-Racial-Bias-in-College-Admissions-e3385t&quot; height=&quot;102px&quot; width=&quot;400px&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.nature.com/articles/s41591-018-0300-7&quot;&gt;High-performance medicine: the convergence of human and artificial intelligence&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;http://bostonreview.net/law-justice/andrew-gelman-sharad-goel-daniel-e-ho-what-statistics-cant-tell-us-fight-over&quot;&gt;What Statistics Can’t Tell Us in the Fight over Affirmative Action at Harvard&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.nytimes.com/2018/12/20/us/harvard-asian-american-students-discrimination.html&quot;&gt;The Harvard Bias Suit by Asian-Americans: 5 Key Issues&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;http://samv91khoyt2i553a2t1s05i-wpengine.netdna-ssl.com/wp-content/uploads/2018/06/Doc-415-1-Arcidiacono-Expert-Report.pdf&quot;&gt;Harvard Case Expert Report&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.thecrimson.com/article/2018/6/16/harvard-admissions-behind-the-scenes/&quot;&gt;Harvard Ranks Applicants on ‘Humor’ and ‘Grit,’ Court Filings Show&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 01 Feb 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/02/01/episode-10-AI-med-harvard.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/02/01/episode-10-AI-med-harvard.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 9: Lessons Learned from Making a Fitbit Data Visualization Shiny App</title>
        <description>&lt;p&gt;Dynamic data visualization widgets can be pretty cool, but it takes more than just statistical chops to build an online visualization app that supports input data from users. In this episode, we describe the journey that Susan took to build a visualization app for Fitbit data. The app can be found at http://fitbitvizwiz.ddns.net.&lt;/p&gt;

&lt;iframe src=&quot;https://www.podbean.com/media/player/435y9-a5b04c?from=yiiadmin&amp;amp;download=1&amp;amp;version=1&quot; data-link=&quot;https://www.podbean.com/media/player/435y9-a5b04c?from=yiiadmin&amp;amp;download=1&amp;amp;version=1&quot; height=&quot;122&quot; width=&quot;100%&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot; data-name=&quot;pb-iframe-player&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;&lt;a href=&quot;http://fitbitvizwiz.ddns.net&quot;&gt;Fitbit Viz Wiz Shiny App&lt;/a&gt;&lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 25 Jan 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/01/25/episode-9-fitbit-viz.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/01/25/episode-9-fitbit-viz.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 8: The French Revolution and the Challenge of Reproducibility</title>
        <description>&lt;p&gt;What can machine learning tell us about the French Revolution? This episode describes a brief history lesson of the digital humanities. Then, why do we constantly hear about the word “reproducibility” in the context of scientific research? We’ll explore what this means and why it seems to keep happening.&lt;/p&gt;

&lt;iframe src=&quot;https://www.podbean.com/media/player/qvevx-a4ea2d?from=yiiadmin&amp;amp;download=1&amp;amp;version=1&quot; data-link=&quot;https://www.podbean.com/media/player/qvevx-a4ea2d?from=yiiadmin&amp;amp;download=1&amp;amp;version=1&quot; height=&quot;122&quot; width=&quot;100%&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot; data-name=&quot;pb-iframe-player&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://arstechnica.com/science/2019/01/machine-learning-can-offer-new-tools-fresh-insights-for-the-humanities/&quot;&gt;Machine learning can offer new tools, fresh insights for the humanities&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.pnas.org/content/115/18/4607#sec-7&quot;&gt;PNAS article: Individuals, institutions, and innovation in the debates of the French Revolution&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://modernismmodernity.org/forums/posts/search-and-replace&quot;&gt;Search and Replace: Josephine Miles and the Origins of Distant Reading&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://babel.hathitrust.org/cgi/pt?id=inu.39000003574840;view=1up;seq=25&quot;&gt;Concordance of the Poetical Works of John Dryden&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;http://www.corpusthomisticum.org/it/index.age&quot;&gt;Index Thomisticus&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://digitalcommons.unl.edu/cgi/viewcontent.cgi?article=1069&amp;amp;context=classicsfacpub&quot;&gt;Roberto Busa, S.J., and the Invention of the Machine-Generated Concordance&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://theconversation.com/how-big-data-has-created-a-big-crisis-in-science-102835&quot;&gt;How big data has created a big crisis in science&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://journals.sagepub.com/doi/abs/10.1177/2515245918810225?casa_token=o3G_KxAOhRYAAAAA%3AQs38Zw0okdinmAfKfJZNxTX_Lfn9VYf4A9TJeX9QQDbEOIua2TQbM-UBwfOQl9jz_z3cVvjLhsDz_w&amp;amp;&quot;&gt;Many Labs 2: Investigating Variation in Replicability Across Samples and Settings&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 18 Jan 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/01/18/episode-8-digital-humanities-reproducibility.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/01/18/episode-8-digital-humanities-reproducibility.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 7: The Virtual Maestro and the Most Influential Movie</title>
        <description>&lt;p&gt;Have you ever wanted to try your hand at conducting an orchestra? Now you can, with Google’s Semi-Conductor online app. We’ll talk about how this browser-based app analyzes your body positions in real time to translate your actions into Mozart music. We also talk about a way to use network analysis to determine the most influential movie ever made to date. Be sure to tune in to find out which movie takes the prize.&lt;/p&gt;

&lt;iframe src=&quot;https://www.podbean.com/media/player/kbywj-a41fbb?from=yiiadmin&amp;amp;download=1&amp;amp;version=1&quot; data-link=&quot;https://www.podbean.com/media/player/kbywj-a41fbb?from=yiiadmin&amp;amp;download=1&amp;amp;version=1&quot; height=&quot;122&quot; width=&quot;100%&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot; data-name=&quot;pb-iframe-player&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://experiments.withgoogle.com/semi-conductor&quot;&gt;Semi-Conductor with Google&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://youtu.be/L7lxRjJvAns&quot;&gt;Video of Google Semi-Conductor in Action&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://medium.com/tensorflow/real-time-human-pose-estimation-in-the-browser-with-tensorflow-js-7dd0bc881cd5&quot;&gt;Pose Estimation with TensorFlow&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://arxiv.org/abs/1505.07427&quot;&gt;PoseNet Paper&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.sciencedaily.com/releases/2018/11/181129223426.htm&quot;&gt;Most Influential Movie of All Time&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://appliednetsci.springeropen.com/articles/10.1007/s41109-018-0105-0&quot;&gt;Identification of key films and personalities in the history of cinema from a Western perspective&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Fri, 11 Jan 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/01/11/episode-7-semiconductor-influential-movie.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/01/11/episode-7-semiconductor-influential-movie.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 6: Probability Games and Amazon's Own Self-Driving Car</title>
        <description>&lt;p&gt;What are the odds that a toss of a 10-sided die, followed by a toss of a 20-sided die, and then a toss of a 30-sided die land in increasing order? If you know the answer within a few seconds, you might have an edge in Borel, a game that is all about probability. We’ll also talk about DeepRacer, Amazon’s soon-to-come programmable self-driving car.&lt;/p&gt;

&lt;iframe src=&quot;https://www.podbean.com/media/player/fqy6s-a378d2?from=yiiadmin&amp;amp;download=1&amp;amp;version=1&quot; data-link=&quot;https://www.podbean.com/media/player/fqy6s-a378d2?from=yiiadmin&amp;amp;download=1&amp;amp;version=1&quot; height=&quot;122&quot; width=&quot;100%&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot; data-name=&quot;pb-iframe-player&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.playborel.com&quot;&gt;Borel Boardgame&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://aws.amazon.com/deepracer/&quot;&gt;AWS DeepRacer Site&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.inverse.com/article/51331-amazon-self-driving-cars&quot;&gt;Amazon Enters Self-Driving Car World With an Old, Successful Strategy&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;

</description>
        <pubDate>Fri, 04 Jan 2019 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2019/01/04/episode-6-borel-deepracer.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2019/01/04/episode-6-borel-deepracer.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 5: The Do's and Don'ts of Data Visualization</title>
        <description>&lt;p&gt;Data visualization is an integral pre-cursor to data analysis, providing a way to visually inspect the data for surprising trends and uncover potential errors in variable coding. In this episode, we cover some guiding principles of data visualization. A brief summary (including promised links to examples) is included below.&lt;/p&gt;

&lt;iframe src=&quot;https://www.podbean.com/media/player/u2ubt-a2e00d?from=site&amp;amp;skin=1&amp;amp;share=1&amp;amp;fonts=Helvetica&amp;amp;auto=0&amp;amp;download=1&amp;amp;version=1&quot; height=&quot;122&quot; width=&quot;100%&quot; frameborder=&quot;0&quot; scrolling=&quot;no&quot; data-name=&quot;pb-iframe-player&quot;&gt;&lt;/iframe&gt;

&lt;h4&gt;A summary of do's and don'ts:&lt;/h4&gt;
&lt;ul&gt;
&lt;li&gt;&lt;b&gt;Do:&lt;/b&gt; Label everything, concisely. (This includes specifying the units!)&lt;/li&gt;
&lt;li&gt;&lt;b&gt;Do:&lt;/b&gt; Make sure the plot suits the kind of variable(s). Univariate plots –- histograms or barplots. Bivariate plots -– boxplots, scatterplots, stacked barplots, etc.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;Do:&lt;/b&gt; Report/show plots that tell you something interesting -- and then say why it is interesting in words. Maybe it uncovers an unusual feature of the data, or outliers, or it suggests some kind of underlying associations that warrant further investigation.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;Do:&lt;/b&gt; Carefully choose how many bins to use in your histograms. Or use density plots. (&lt;a href=&quot;https://statistics.laerd.com/statistical-guides/understanding-histograms.php&quot;&gt;Example of how bin width choice matters&lt;/a&gt;)&lt;/li&gt;
&lt;li&gt;&lt;b&gt;Don't:&lt;/b&gt; Use too many colors (see bad pie chart below).&lt;/li&gt;
&lt;li&gt;&lt;b&gt;Don't:&lt;/b&gt; Use smoothing procedures with more flexibility than you can accommodate with the number of observations that you have.
&lt;div class=&quot;row&quot;&gt;
  &lt;div class=&quot;col-sm-8&quot;&gt;
  &lt;p&gt;&lt;a href=&quot;http://htmlpreview.github.io/?https://gist.githubusercontent.com/swang87/fe16a765308c101216f7614cbd4d38b0/raw/2d000ea1c803b7f70fea10a848af10ce83657090/databytes_smoothing.html&quot;&gt;Example mentioned&lt;/a&gt; in the podcast.&lt;/p&gt;
  &lt;p&gt;To the right, we show another example taken from a Fitbit app screenshot (from one of our co-hosts). Note how despite an absence of data points between 2016 and 2018 (shown in the white line) does not prevent the app from interpolating with some parabolic spline in the region (blue curve). The blue curve fabricates an upward trend from 2016 to 2017 and then a downward trend from 2017 to 2018. &lt;/p&gt;
  &lt;/div&gt;
  &lt;div class=&quot;col-sm-4&quot;&gt;&lt;img src=&quot;/static/img/ep5_fitbit.png&quot; width=&quot;200&quot; /&gt;&lt;/div&gt;
&lt;/div&gt;&lt;/li&gt;
&lt;li&gt;&lt;b&gt;Do:&lt;/b&gt; Jitter scatterplots to minimize overplotting. Or use translucency features of your plotting tool. (&lt;a href=&quot;https://python-graph-gallery.com/134-how-to-avoid-overplotting-with-python/&quot;&gt;Fixing overplotting in Python&lt;/a&gt; | &lt;a href=&quot;https://towardsdatascience.com/overshadowing-the-other-points-the-overplotting-issue-e6d1ebbdef20&quot;&gt;Fixing overplotting in R&lt;/a&gt;)&lt;/li&gt;
&lt;li&gt;&lt;b&gt;Do: &lt;/b&gt;Sort your categorical variables (barplot categories based on heights or boxplot categories based on medians). (&lt;a href=&quot;https://moderndive.com/C-appendixC.html&quot;&gt;Example&lt;/a&gt;)&lt;/li&gt;
&lt;li&gt;&lt;b&gt;Don't:&lt;/b&gt; Use pie charts. More on that below!&lt;/li&gt;
&lt;/ul&gt;
&lt;hr /&gt;

&lt;h3&gt;The Issue with Pie Charts&lt;/h3&gt;

&lt;figure&gt;
&lt;img src=&quot;https://66.media.tumblr.com/698249f0a55f9186d52d252759242532/tumblr_p3utcdJEdu1sgh0voo1_1280.jpg&quot; /&gt;
&lt;figcaption&gt;
Source: &lt;a href=&quot;http://viz.wtf/image/171134950336&quot;&gt;WTF Visualizations&lt;/a&gt;.
&lt;/figcaption&gt;
  &lt;/figure&gt;
&lt;p&gt;&lt;br /&gt;
This image just about encapsulates everything that is wrong with pie charts.&lt;/p&gt;
&lt;ul&gt;
&lt;li&gt;There are too many categories, making it difficult to discern which category is associated with which slice.&lt;/li&gt;
&lt;li&gt;The angling of the pie makes it hard to visually process the relative sizes of each slice.&lt;/li&gt;
&lt;li&gt;The pie chart occupies a lot of space for the information it is trying to convey.&lt;/li&gt;
&lt;/ul&gt;
&lt;p&gt;You can find multiple posts online that expand on why pie charts are often bad ways of visualizing data -- yes, there are longer rants on pie charts than the one we've given, such as the one &lt;a href=&quot;https://www.businessinsider.com/pie-charts-are-the-worst-2013-6&quot;&gt; here&lt;/a&gt;. We particularly like an example of why even simple pie charts (with few categories displayed) can fail:&lt;/p&gt;
&lt;p&gt;&lt;img src=&quot;https://amp.businessinsider.com/images/51bf1e9becad048c0a000002-960-326.jpg&quot; width=&quot;500&quot; /&gt;&lt;br /&gt;&lt;/p&gt;
&lt;p&gt;The example provided suggests that A, B, and C are pie charts that represent polling results for a 5-candidate race in a local election, done at 3 different time points. Can you tell who's in the lead at each time point?  &lt;/p&gt;
&lt;p&gt;&lt;img src=&quot;https://amp.businessinsider.com/images/51bf0aa8ecad04a05d00004a-960-369.jpg&quot; width=&quot;500&quot; /&gt;&lt;br /&gt;&lt;/p&gt;
&lt;p&gt;The bar charts here represent the same data. Not only can you tell who's in the lead at any of the 3 time points, but you can also easily tell the trajectory of how each candidate fared as time progressed. &lt;/p&gt;
&lt;p&gt;This leads us to our favorite pie chart:&lt;/p&gt;
&lt;figure&gt;&lt;img src=&quot;https://i.imgur.com/aRLRqwj.png&quot; /&gt;&lt;figcaption&gt;
  Source: &lt;a href=&quot;https://imgur.com/gallery/aRLRqwj&quot;&gt;imgur&lt;/a&gt;.
&lt;/figcaption&gt;&lt;/figure&gt;
&lt;h3&gt;The Naughty List&lt;/h3&gt;
&lt;p&gt;Now we present a list of some other truly horrific charts (that are not pie charts).&lt;/p&gt;
&lt;ol&gt;&lt;li&gt;
  &lt;figure&gt;
  &lt;img src=&quot;http://livingqlikview.com/wp-content/uploads/2017/04/Worst-Data-Visualizations-05.jpg&quot; /&gt;
    &lt;figcaption&gt;
      Source: &lt;a href=&quot;http://livingqlikview.com/the-9-worst-data-visualizations-ever-created/&quot;&gt;The 9 Worst Data Visualizations Ever Created&lt;/a&gt;
    &lt;/figcaption&gt;
  &lt;/figure&gt;
  &lt;p&gt;Pie charts aren't the only culprits. Here, the y-axis scale is deceiving.&lt;/p&gt;
&lt;/li&gt;
&lt;li&gt;
&lt;div class=&quot;row&quot;&gt;
  &lt;div class=&quot;col-sm-4&quot;&gt;&lt;figure&gt;&lt;img src=&quot;https://junkcharts.typepad.com/.a/6a00d8341e992c53ef01b8d2464d49970c-200wi&quot; /&gt;
&lt;figcaption&gt;Source: &lt;a href=&quot;https://junkcharts.typepad.com/junk_charts/wsj/&quot;&gt;Junk Charts&lt;/a&gt;&lt;/figcaption&gt;
&lt;/figure&gt;&lt;/div&gt;
  &lt;div class=&quot;col-sm-8&quot;&gt;&lt;p&gt;This plot, cut out of the Wall Street Journal, requires prolonged staring to realize how the bar lengths might possibly reflect any of the proportions provided. There's conditioning involved, in which case, a mosaicplot will probably do the data better justice, as suggested at the source website.&lt;/p&gt;
&lt;/div&gt;
&lt;/div&gt;


&lt;/li&gt;
&lt;li&gt;
&lt;figure&gt;&lt;img src=&quot;https://visme.co/blog/wp-content/uploads/2016/02/Percent-of-Job-Loses-Relative-to-Peak-Employment-Month.jpg&quot; width=&quot;700&quot; /&gt;
&lt;figcaption&gt;Source: &lt;a href=&quot;https://visme.co/blog/bad-infographics/&quot;&gt;Bad Infographics: 11 Mistakes You Never Want to Make&lt;/a&gt;&lt;/figcaption&gt;&lt;/figure&gt;
&lt;p&gt;Too many colors can make it challenging to differentiate various categories.&lt;/p&gt;
&lt;/li&gt;
&lt;/ol&gt;
&lt;h3&gt;The Nice List&lt;/h3&gt;
&lt;p&gt;Finally, this discussion wouldn’t be complete with some stellar examples of thoughtful graphics.&lt;/p&gt;
&lt;ol&gt;
&lt;li&gt;&lt;figure&gt;&lt;img src=&quot;https://raw.githubusercontent.com/halhen/viz-pub/master/pastime-income/pastime.png&quot; width=&quot;500&quot; /&gt;&lt;figcaption&gt;Source: &lt;a href=&quot;https://www.reddit.com/r/dataisbeautiful/comments/6heb75/income_distributions_in_americans_pastimes_oc/&quot;&gt;Reddit post&lt;/a&gt;&lt;/figcaption&gt;&lt;/figure&gt;
&lt;p&gt;This plot showcases how American pastimes differ by household income, using the American Time Use Survey dataset.&lt;/p&gt;&lt;/li&gt;
&lt;li&gt;&lt;figure&gt;&lt;img src=&quot;https://fivethirtyeight.com/wp-content/uploads/2016/11/morris-durant-1b.png?w=575&quot; /&gt;
&lt;figcaption&gt;Source: &lt;a href=&quot;https://fivethirtyeight.com/features/the-52-best-and-weirdest-charts-we-made-in-2016/&quot;&gt;Fivethirtyeight.com&lt;/a&gt;&lt;/figcaption&gt;&lt;/figure&gt;
&lt;p&gt;Ah, a plot of residuals (points per shot against expectations) to showcase the superiority of basketball players. Minor quibble: Not too sure why Curry, Thompson, Barnes, and Green have the same colors whereas other highlighted players are in different colors.&lt;/p&gt;
&lt;/li&gt;
&lt;li&gt;&lt;figure&gt;&lt;img src=&quot;/static/img/ep5_gapminder.png&quot; /&gt;
&lt;figcaption&gt;Source: &lt;a href=&quot;https://s3-eu-west-1.amazonaws.com/static.gapminder.org/GapminderMedia/wp-uploads/20161215212516/countries_health_wealth_2016_v151.pdf&quot;&gt;Gapminder&lt;/a&gt;
&lt;/figcaption&gt;&lt;/figure&gt;&lt;p&gt;Indeed, this example, from the late great Hans Rosling's organization, Gapminder, is an example of where arguably a lot of information is fit into a small space. However, this is one of those plots that is actually meant to encourage zooming in and taking a good look (the source link above will lead you to the full pdf image). Even in this shrunken view, the color-coding by region helps provide a big-picture look at the relationship between health and wealth of nations around the world. The sizes of the circles additionally showcase the population size of each nation.&lt;/p&gt;&lt;/li&gt;
&lt;/ol&gt;
&lt;h3&gt;Looking for more?&lt;/h3&gt;
&lt;p&gt;There’s a whole &lt;a href=&quot;reddit.com/r/dataisbeautiful/&quot;&gt;subreddit&lt;/a&gt; (/r/dataisbeautiful) full of them. We use these sometimes as inspiration – but of course, because Reddit is a free-for-all platform, not every post will be golden.&lt;/p&gt;
</description>
        <pubDate>Fri, 28 Dec 2018 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2018/12/28/episode-5-data-viz-guidelines.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2018/12/28/episode-5-data-viz-guidelines.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 4: Meet the Co-hosts (Part 2)</title>
        <description>&lt;p&gt;This week, we learn about Jessi Cisewski-Kehe’s background to find out how she went from a Math major to an actuarial analyst, then to grad school in statistics, followed by a three-year visiting assistant professor position at Carnegie Mellon where she got into Astrostatistics, and finally to her current position as an assistant professor at Yale.&lt;/p&gt;

&lt;iframe width=&quot;100%&quot; height=&quot;166&quot; scrolling=&quot;no&quot; frameborder=&quot;no&quot; allow=&quot;autoplay&quot; src=&quot;https://w.soundcloud.com/player/?url=https%3A//api.soundcloud.com/tracks/547041969&amp;amp;color=%2327a79c&amp;amp;auto_play=false&amp;amp;hide_related=false&amp;amp;show_comments=true&amp;amp;show_user=true&amp;amp;show_reposts=false&amp;amp;show_teaser=true&quot;&gt;&lt;/iframe&gt;

</description>
        <pubDate>Fri, 21 Dec 2018 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2018/12/21/episode-4-meet-the-cohosts-part2.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2018/12/21/episode-4-meet-the-cohosts-part2.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 3: Meet the Co-hosts (Part 1)</title>
        <description>&lt;p&gt;This week, we learn about Susan Wang’s background to find out how she went from an Applied Math major to actuarial consulting, then to a weather derivatives start-up firm, then to grad school in statistics, finally landing at Yale as a lecturer.&lt;/p&gt;

&lt;iframe width=&quot;100%&quot; height=&quot;300&quot; scrolling=&quot;no&quot; frameborder=&quot;no&quot; allow=&quot;autoplay&quot; src=&quot;https://w.soundcloud.com/player/?url=https%3A//api.soundcloud.com/tracks/543732027&amp;amp;color=%23ff5500&amp;amp;auto_play=false&amp;amp;hide_related=false&amp;amp;show_comments=true&amp;amp;show_user=true&amp;amp;show_reposts=false&amp;amp;show_teaser=true&amp;amp;visual=true&quot;&gt;&lt;/iframe&gt;

</description>
        <pubDate>Wed, 12 Dec 2018 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2018/12/12/episode-3-meet-the-cohosts-part1.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2018/12/12/episode-3-meet-the-cohosts-part1.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 2: Biometric Technology at Airports, Google Smart Replies, Bestselling Books</title>
        <description>&lt;p&gt;In this episode, we discuss biometric technology used at airports, Google Smart Replies (and letting AI compose our emails/texts for us), and an analysis of New York Times Bestsellers list data.&lt;/p&gt;

&lt;iframe width=&quot;100%&quot; height=&quot;300&quot; scrolling=&quot;no&quot; frameborder=&quot;no&quot; allow=&quot;autoplay&quot; src=&quot;https://w.soundcloud.com/player/?url=https%3A//api.soundcloud.com/tracks/539954403&amp;amp;color=%23ff5500&amp;amp;auto_play=false&amp;amp;hide_related=false&amp;amp;show_comments=true&amp;amp;show_user=true&amp;amp;show_reposts=false&amp;amp;show_teaser=true&amp;amp;visual=true&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.mediapost.com/publications/article/328124/jetblue-partners-with-us-customs-for-biometric-b.html&quot;&gt;JetBlue Partners With U.S. Customs For Biometric Boarding&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.cnn.com/travel/article/atlanta-airport-first-us-biometric-terminal-facial-recognition/index.html&quot;&gt;US airport opens first fully biometric terminal&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.npr.org/sections/alltechconsidered/2017/06/26/534131967/facial-recognition-may-boost-airport-security-but-raises-privacy-worries&quot;&gt;Facial Recognition May Boost Airport Security But Raises Privacy Worries&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.androidpolice.com/2018/06/05/smart-replies-android-messages-now-rolling-users/&quot;&gt;Smart Replies in Android Messages are now rolling out to more users&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://towardsdatascience.com/artistic-style-transfer-b7566a216431&quot;&gt;Artistic Style Transfer Tutorial&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://deepart.io/hire/&quot;&gt;Upload Your Own Images for Artistic Style Transfer&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://theconversation.com/what-big-data-can-tell-us-about-how-a-book-becomes-a-best-seller-106427&quot;&gt;What big data can tell us about how a book becomes a best-seller&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Tue, 04 Dec 2018 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2018/12/04/episode-2-biometric-tech.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2018/12/04/episode-2-biometric-tech.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
      <item>
        <title>Episode 1: Thanksgiving, College Football, International Prize in Statistics</title>
        <description>&lt;p&gt;The first episode of the DataBytes Podcast where we discuss popular topics related to data, statistics, data science, machine learning, artificial intelligence.  In this episode, we discuss Thanksgiving food, the College Football Playoff selection, and the winner of the International Prize in Statistics.&lt;/p&gt;

&lt;iframe width=&quot;100%&quot; height=&quot;166&quot; scrolling=&quot;no&quot; frameborder=&quot;no&quot; allow=&quot;autoplay&quot; src=&quot;https://w.soundcloud.com/player/?url=https%3A//api.soundcloud.com/tracks/537519510&amp;amp;color=%2327a79c&amp;amp;auto_play=false&amp;amp;hide_related=false&amp;amp;show_comments=true&amp;amp;show_user=true&amp;amp;show_reposts=false&amp;amp;show_teaser=true&quot;&gt;&lt;/iframe&gt;

&lt;h3 id=&quot;sources&quot;&gt;Sources&lt;/h3&gt;

&lt;ul&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://fivethirtyeight.com/features/the-ultimate-thanksgiving-dinner-menu/&quot;&gt;FiveThirtyEight’s Thanksgiving Survey Results&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://thepowerrank.com/guide-cfb-rankings/&quot;&gt;ThePowerRank.com’s College Football Rankings&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://collegefootballplayoff.com/sports/2016/9/30/_131504729609884945.aspx&quot;&gt;College Football Playoff Selection Methods&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://massey-peabody.com/methodology/&quot;&gt;Massey-Peabody Ranking Methodology&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
  &lt;li&gt;
    &lt;p&gt;&lt;a href=&quot;https://www.statslife.org.uk/news/3982-2018-international-prize-in-statistics-awarded-to-bradley-efron&quot;&gt;Announcement of International Prize in Statistics 2018&lt;/a&gt;&lt;/p&gt;
  &lt;/li&gt;
&lt;/ul&gt;
</description>
        <pubDate>Thu, 29 Nov 2018 00:00:00 +0000</pubDate>
        <link>https://databytespodcast.github.io/episode/2018/11/29/episode-1-thanksgiving-football-prize.html</link>
        <guid isPermaLink="true">https://databytespodcast.github.io/episode/2018/11/29/episode-1-thanksgiving-football-prize.html</guid>
        
        
        <category>episode</category>
        
      </item>
    
    
      <item>
        <title>Cool project 1</title>
        <description>Cool project 1</description>
        <link>https://databytespodcast.github.io#</link>
        <pubDate>Wed, 01 Jan 2014 00:00:00 +0000</pubDate>
        
        <category>Angular JS</category>
        
        <category>API</category>
        
      </item>
    
      <item>
        <title>Cool project 2</title>
        <description>Cool project 2</description>
        <link>https://databytespodcast.github.io#</link>
        <pubDate>Thu, 01 May 2014 00:00:00 +0000</pubDate>
        
        <category>Android</category>
        
        <category>PHP</category>
        
      </item>
    
      <item>
        <title>Cool project 3</title>
        <description>Cool project 3</description>
        <link>https://databytespodcast.github.io#</link>
        <pubDate>Sun, 01 Jun 2014 00:00:00 +0000</pubDate>
        
        <category>HTML</category>
        
        <category>JQuery</category>
        
        <category>PHP</category>
        
      </item>
    
      <item>
        <title>Cool project 4</title>
        <description>Cool project 4</description>
        <link>https://databytespodcast.github.io</link>
        <pubDate>Sat, 01 Oct 2016 00:00:00 +0000</pubDate>
        
        <category>Android</category>
        
        <category>nodejs</category>
        
      </item>
    
  </channel>
</rss>
