<!doctype html>
<html xmlns="http://www.w3.org/1999/xhtml" xmlns:v="urn:schemas-microsoft-com:vml" xmlns:o="urn:schemas-microsoft-com:office:office" lang="en-US" xml:lang="en-US">
  <head>
    <!-- Charset is declared before the title so the title's non-ASCII characters are decoded as UTF-8. -->
    <meta http-equiv="content-type" content="text/html; charset=utf-8">
    <!-- The ampersand is escaped exactly once; a second escape would display a literal "&amp;" in the title. -->
    <title data-ignore-plain-text>Generative AI - Short &amp; Sweet 09 - 🐠 OpenAI&rsquo;s Whisper</title>
    <!-- No maximum-scale here: readers must remain able to pinch-zoom the message. -->
    <meta name="viewport" content="width=device-width, initial-scale=1">
    <meta name="format-detection" content="address=no">
    <!--[if (gte mso 9)|(IE)]>
    <style type="text/css" media="screen">
      /* Only read where the conditional comment matches (mso 9 or later, or IE): pulls the first line of each list item back by 1em. */
      li {
        text-indent: -1em;
      }
    </style>
    <![endif]-->
    <style type="text/css" media="all">
      /* Text containers: let long words and URLs break instead of overflowing the layout. */
      body,
      .section-text-area,
      .section-text-area-wrapper,
      .section-text-cell {
        overflow-wrap: break-word;
        word-wrap: break-word;
        -ms-word-break: break-all;
        word-break: break-word;
      }

      /* Full-width body; vendor-prefixed text-size adjustment is switched off and the mso line-height rule is set to "exactly". */
      body {
        width: 100% !important;
        min-width: 100% !important;
        -ms-text-size-adjust: none;
        -webkit-text-size-adjust: none;
        mso-line-height-rule: exactly;
      }

      /* Paragraph block margins are reset here; spacing comes from the inline styles on each paragraph. */
      p {
        margin-block: 0;
      }
/* Narrow-viewport overrides. 593px is one pixel below the 594px width attribute on table#newsletter-email. */
@media only screen and (max-width: 593px) {
    /* Outer frame: drop the border and let the email table fill the viewport. */
    table#newsletter-table {
        border: 0 !important;
    }
    table#newsletter-email {
        width: 100% !important;
    }

    /* Images scale down with their container and keep their aspect ratio. */
    img.section-scaleable-image,
    img.section-empty-img {
        max-width: 100% !important;
        height: auto !important;
    }

    /* Small utility classes. */
    .bg-none {
        background: none !important;
    }
    .hauto {
        height: auto !important;
    }

    /* Visibility toggles between desktop and mobile variants. */
    .show-desktop-only {
        display: none !important;
    }
    .show-mobile-only {
        display: block !important;
        float: none !important;
        /* "normal" is the valid reset keyword; "auto" is not a line-height value, so that declaration was discarded and the reset never took effect. */
        line-height: normal !important;
        max-height: inherit !important;
        max-width: inherit !important;
        margin-top: 0px !important;
        overflow: visible !important;
        visibility: inherit !important;
        width: auto !important;
    }

    /* Column stacking: cells become blocks; the table-header-group / table-footer-group displays move a cell to the top or bottom of the stack. */
    .stack-cell-wrap {
        display: block !important;
    }
    .stack-cell-up {
        display: table-header-group !important;
    }
    .stack-cell-down {
        display: table-footer-group !important;
    }
    .mw100p {
        max-width: 100% !important;
    }

    /* Horizontal padding is set to 22px on small screens. */
    .section-horizontal-padding,
    .padding-mobile-both {
        padding-left: 22px !important;
        padding-right: 22px !important;
    }
    .padding-mobile-left {
        padding-left: 22px !important;
    }
    .padding-mobile-right {
        padding-right: 22px !important;
    }

    /* Alignment and width helpers. */
    .text-left {
        text-align: left !important;
    }
    .text-right {
        text-align: right !important;
    }
    .w100p {
        width: 100% !important;
    }
}
/* Hover feedback: buttons fade slightly, links lose their underline. */
.button-style-solid:hover,
.button-style-rounded:hover {
  opacity: .8 !important;
}

a:hover {
  text-decoration: none !important;
}

/* Mail-merge placeholders are marked with a dotted underline in the text colour. */
span.mail-merge-preview {
  border-bottom: 2px dotted currentColor;
  display: inline-block;
  line-height: 1em !important;
  margin-bottom: .125em !important;
}

/* Site-title links: accent colour in the body, plain black brand name in header and footer. */
table#newsletter-section-body .linked-site-title-link {
  color: #1d8fb4 !important;
}

#header-header-section-split-left-0 .brand-name .linked-site-title-link,
#footer-footer-section-split-right-0 .brand-name .linked-site-title-link {
  color: #000;
  text-decoration: none;
}

#footer-footer-section-split-right-0 .footer-text .linked-site-title-link {
  color: #1d8fb4;
}

/* Dashed divider thickness, applied only under body.renderedPreview. */
body.renderedPreview #line-line-section-14 div.basic-line[data-line="dashed"] {
  border-width: .5px 0 !important;
}

body.renderedPreview #line-line-section-16 div.basic-line[data-line="dashed"] {
  border-width: 1px 0 !important;
}

    </style>
    
    
    <!-- Office document settings, read only where the mso conditional matches: allow PNG and declare 96 pixels per inch. -->
    <!--[if mso]>
    <noscript>
      <xml>
        <o:OfficeDocumentSettings>
          <o:AllowPNG/>
          <o:PixelsPerInch>96</o:PixelsPerInch>
        </o:OfficeDocumentSettings>
      </xml>
    </noscript>
    <![endif]-->
    
    <!--[if (mso)|(mso 16)]>
      <style type="text/css">
        /* Read only where the mso conditional matches: removes the underline from every link. */
        a {text-decoration: none;}
      </style>
    <![endif]-->
  </head>
  <body style="padding:0;margin:0;text-align:center;background-color:#fff;">
    <table role="article" aria-label="Generative AI - Short &amp; Sweet 09 - 🐠 OpenAI&rsquo;s Whisper" lang="en-US" cellpadding="0" cellspacing="0" border="0" align="center" id="newsletter-table" style="font-size:16px;font-weight:normal;width:100%;padding:0px;background-color:#fff;border-top:44px solid #fff;border-bottom:44px solid #fff;margin:0 auto;text-align:center;table-layout:fixed;">
  <tbody><tr>
    <td align="center" valign="top" bgcolor="#FFFFFF" id="newsletter-cell" style="font-size:.9375em;">
      <div data-ignore-plain-text class="newsletter-preview-text" style="color:transparent;display:none !important;height:0;max-height:0;max-width:0;opacity:0;overflow:hidden;mso-hide:all;visibility:hidden;width:0;">
        
            
            OpenAI’s Whisper. It is an Automatic Speech Recognition (ASR) system that aims to recognize what has been said and transcribes it to text.&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&n
bsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;͏‌&nbsp;
        
      </div>
      <table border="0" cellpadding="0" cellspacing="0" width="594" bgcolor="transparent" id="newsletter-email">
        <tbody><tr>
          <td align="center" valign="top" id="newsletter-email-wrapper" class="fixed-contrast-1">
            <table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" id="newsletter-section-header">
              <tbody><tr>
                <td align="center" valign="middle" id="newsletter-section-header-cell">
                  
<div id="header-header-section-split-left-0">





<table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" bgcolor="transparent" class="header-section header-section-split section-content" style="background-color:transparent;">
  <tbody><tr>
    <td class="section-content-cell" style="padding-top:22px;padding-right:22px;padding-bottom:22px;padding-left:22px;">
      <table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0">
        <tbody><tr>
          <td align="left" valign="middle" width="50%" class="section-text-area">
            
  
  
  
    
    <a class="brand-logo-link" href="https://generativeai.net/" style="color:#1d8fb4 !important;"><img class="brand-logo" src="https://images.squarespace-cdn.com/content/5bfd6f322487fdb33ce53474/0d4a27f0-be01-492c-8844-fc39234a717d/Screen+Shot+2018-12-18+at+15.01.15.png?content-type=image%2Fpng&amp;format=750w" height="61" alt="Generative AI" style="font-size:.6630127298444131em;display:block;border:0;text-decoration:none;line-height:0;font-weight:normal;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;color:#000;height:auto;max-height:61px;max-width:100%;width:auto;margin-left:0px;"></a>
    
  

          </td>
          <td align="right" valign="middle" width="50%" class="section-text-area">
            
          </td>
        </tr>
      </tbody></table>
    </td>
  </tr>
</tbody></table>

</div>
                </td>
              </tr>
            </tbody></table>
            <table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" id="newsletter-section-body">
              <tbody><tr>
                <td align="center" valign="top" width="100%" id="newsletter-section-body-cell">
                  
<div id="text-text-section-0">



<table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" bgcolor="transparent" class="text-section section-content">
  <tbody><tr>
    <td valign="top" class="section-text-area section-content-cell padding-mobile-both" style="padding-top:11px;padding-right:44px;padding-bottom:11px;padding-left:44px;color:#313131;background-color:transparent;">
      <p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><a href="https://generativeai.net/newsletter" rel="nofollow" style="color:#1d8fb4 !important;">Sign Up</a> | <a href="https://www.udemy.com/course/generative-ai/?referralCode=6A16021D86142A4EAB93" rel="nofollow" style="color:#1d8fb4 !important;">GAI Course</a> | <a href="https://generativeai.net/contact-us" rel="nofollow" style="color:#1d8fb4 !important;">Sponsor</a></p>
    </td>
  </tr>
</tbody></table>

</div>
<div id="text-text-section-1">



<table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" bgcolor="#FFFFFF" class="text-section section-content">
  <tbody><tr>
    <td valign="top" class="section-text-area section-content-cell" style="padding-top:0px;padding-right:22px;padding-bottom:0px;padding-left:22px;color:#000;background-color:#fff;">
      <h3 style="color:inherit;margin:1.414em 0 .5em;font-weight:400;line-height:1.25em;font-size:1.8744337499999997em;mso-line-height-alt:1.8744337499999997em;margin-top:0;margin-bottom:0;font-family:'Andale Mono', 'Lucida Console', 'DejaVu Sans Mono', 'Bitstream Vera Sans Mono', 'Liberation Mono', Courier, monospace;letter-spacing:-.02em;"><strong>Generative AI - Short &amp; Sweet 09</strong></h3>
    </td>
  </tr>
</tbody></table>

</div>
<div id="text-text-section-2">



<table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" bgcolor="transparent" class="text-section section-content">
  <tbody><tr>
    <td valign="top" class="section-text-area section-content-cell" style="padding-top:44px;padding-right:22px;padding-bottom:44px;padding-left:22px;color:#545353;background-color:transparent;">
      <p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">First of all, apologies for skipping last week’s episode. I went on vacation and couldn’t write a post with the quality that I expect from myself. This week I am back in the right headspace and went wild on the keyboard. Happy reading.</p>
    </td>
  </tr>
</tbody></table>

</div>
<div id="text-text-section-3">



<table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" bgcolor="transparent" class="text-section section-content">
  <tbody><tr>
    <td valign="top" class="section-text-area section-content-cell" style="padding-top:11px;padding-right:22px;padding-bottom:11px;padding-left:22px;color:#000;background-color:transparent;">
      <h4 style="color:inherit;margin:1.414em 0 .5em;font-weight:400;line-height:1.25em;font-size:1.3256249999999998em;mso-line-height-alt:1.3256249999999998em;margin-top:0;font-family:'Andale Mono', 'Lucida Console', 'DejaVu Sans Mono', 'Bitstream Vera Sans Mono', 'Liberation Mono', Courier, monospace;letter-spacing:.04em;">🔮 <strong>The GAI topic of the week is ..</strong></h4><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><strong>OpenAI’s Whisper.</strong> It is an Automatic Speech Recognition (ASR) system that aims to recognize what has been said and transcribes it to text.&nbsp;</p><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><span style="font-size:inherit;font-weight:inherit;line-height:inherit;margin:0;text-decoration:underline;">Tech terms to know</span> 📙<span style="font-size:inherit;font-weight:inherit;line-height:inherit;margin:0;text-decoration:underline;"><br></span>LLM = Large Language Model<br>GPT = Generative Pre-trained Transformer [1]<br>PaLM = Pathways Language Model [2]<br>Token = smaller text units like words, characters, or subwords.</p>
    </td>
  </tr>
</tbody></table>

</div>
<div id="text-text-section-4">



<table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" bgcolor="transparent" class="text-section section-content">
  <tbody><tr>
    <td valign="top" class="section-text-area section-content-cell" style="padding-top:11px;padding-right:22px;padding-bottom:11px;padding-left:22px;color:#000;background-color:transparent;">
      <p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><span style="font-size:inherit;font-weight:inherit;line-height:inherit;margin:0;text-decoration:underline;">Whisper’s power</span> 🔥<br><strong>Its high accuracy and robustness.</strong> Compared to Siri, Alexa, and Google Assistant, Whisper understands fast-spoken, mumbling, or jargon-filled voice recordings very accurately. Andrej Karpathy, former director of AI at Tesla and OpenAI, now an independent researcher (that’s cool), has tested it and the results are striking. See his results [3].</p>
    </td>
  </tr>
</tbody></table>

</div>
<div id="image-image-section-below-5">
<table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" bgcolor="transparent" class="image-section below-layout section-content">

  

  
    <tbody><tr>
      <td>
        <table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0">
          <tbody><tr>
              

            <td align="left" valign="middle" class="section-image-cell section-content-cell section-hoverable-image" data-aspect="ORIGINAL" style="padding:0;">
              
  <img class="section-scaleable-image" src="https://images.squarespace-cdn.com/content/5bfd6f322487fdb33ce53474/91e5d352-d3c8-497f-9c3a-31f4ff1cb214/Screenshot+2022-10-07+at+07.50.42.png?content-type=image%2Fpng&amp;format=750w" width="594" alt="" style="font-size:.6630127298444131em;display:block;border:0;text-decoration:none;line-height:0;background-color:transparent;font-weight:normal;height:auto;width:100%;max-width:100%;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">


            </td>
              

          </tr>
        </tbody></table>
      </td>
    </tr>
    
  
  


</tbody></table>

</div>
<div id="text-text-section-6">



<table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" bgcolor="transparent" class="text-section section-content">
  <tbody><tr>
    <td valign="top" class="section-text-area section-content-cell" style="padding-top:11px;padding-right:22px;padding-bottom:11px;padding-left:22px;color:#000;background-color:transparent;">
      <p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">In the following figure, one can see that Whisper’s performance (left) is close to the performance of a professional human transcriber. It is best in class of LLMs (A-D in figure), but can’t beat computer-assisted (E in figure) transcription [6].</p>
    </td>
  </tr>
</tbody></table>

</div>
<div id="image-image-section-below-7">
<table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" bgcolor="transparent" class="image-section below-layout section-content">

  
  <tbody><tr>
    <td class="spacing-above" height="44"></td>
  </tr>


  
    <tr>
      <td>
        <table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0">
          <tbody><tr>
              

            <td align="left" valign="middle" class="section-image-cell section-content-cell section-hoverable-image" data-aspect="ORIGINAL" style="padding:0;">
              
  <img class="section-scaleable-image" src="https://images.squarespace-cdn.com/content/5bfd6f322487fdb33ce53474/81cc0692-d260-4e97-86f2-5a8de852b98d/Screenshot+2022-10-06+at+09.33.49.png?content-type=image%2Fpng&amp;format=750w" width="594" alt="" style="font-size:.6630127298444131em;display:block;border:0;text-decoration:none;line-height:0;background-color:transparent;font-weight:normal;height:auto;width:100%;max-width:100%;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">


            </td>
              

          </tr>
        </tbody></table>
      </td>
    </tr>
    
  
  
  <tr>
    <td bgcolor="transparent" class="spacing-below" height="44"></td>
  </tr>



</tbody></table>

</div>
<div id="text-text-section-8">



<table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" bgcolor="transparent" class="text-section section-content">
  <tbody><tr>
    <td valign="top" class="section-text-area section-content-cell" style="padding-top:11px;padding-right:22px;padding-bottom:11px;padding-left:22px;color:#000;background-color:transparent;">
      <p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><strong>It is easy to use.</strong> For example, go to the Hugging Face space that hosts Whisper [4], enable your mic, speak in whatever language you want to, and click transcribe. <br>I tested it in the following languages: German (my mother tongue), Polish (I was raised bilingual), English (my working language), and Italian (I am learning it right now). It worked like a charm. Whisper could even transcribe the Polish dialect, Silesian, correctly.</p><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><strong>Also, it is multilingual and multitasking,</strong> meaning an AI that performs multiple tasks at the same time. With regard to this, Whisper for example detects the language it is being presented with AND transcribes it to text. <br>There is a limit to this though. Whenever I switched the language within a sentence, e.g. starting the sentence in German and ending in Polish, it would result in an error message.</p><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><strong>OpenAI open-sourced Whisper. </strong>They open-sourced the code [5] and the respective paper [6]. It helps tremendously when companies disclose the code of their models. Implementing and tweaking the models is easier, utilizing as well as customizing their capabilities best. <br>However, OpenAI didn’t disclose the dataset that Whisper was trained on. 
🤔</p><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><span style="font-size:inherit;font-weight:inherit;line-height:inherit;margin:0;text-decoration:underline;">Rumors about OpenAI’s data strategy</span> 🤐<strong><br></strong>Why wouldn’t they? Some say it is because of legal issues (web scraping can be tricky at times) and some say it’s because they want to monetize it later. There might be another reason though: the performance of upcoming LLMs with next-in-line GPT-4. Let me unpack.<br><br><strong>The 3 key aspects of improving an LLM.</strong> Generally speaking, there are 3 levers to get the most out of an LLM like GPT-3 [1] and PaLM [2], etc. For all 3 levers, the rule of thumb is the more, the better the performance. </p><ul data-rte-list="default" style="padding-left:25px;"><li style="font-weight:normal;margin-top:0px;margin-bottom:0px;margin-left:15px;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">Computing power.</p><ul data-rte-list="default" style="padding-left:25px;"><li style="font-weight:normal;margin-top:0px;margin-bottom:0px;margin-left:15px;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">Regarding OpenAI: they partnered up with Microsoft. 
So, there are virtually no computing limits.</p></li></ul></li><li style="font-weight:normal;margin-top:0px;margin-bottom:0px;margin-left:15px;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">Number of trainable parameters aka the size of a model.</p><ul data-rte-list="default" style="padding-left:25px;"><li style="font-weight:normal;margin-top:0px;margin-bottom:0px;margin-left:15px;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">Looking back at the LLMs developed, one can clearly recognize an upward trend in this field. It’s not a technical problem to further increase the model size, but it’s currently not helpful. 
I’m going to explain the Chinchilla scaling laws in just a second.</p></li></ul></li><li style="font-weight:normal;margin-top:0px;margin-bottom:0px;margin-left:15px;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">Data.</p><ul data-rte-list="default" style="padding-left:25px;"><li style="font-weight:normal;margin-top:0px;margin-bottom:0px;margin-left:15px;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">For all LLMs, this is currently the limiting factor.</p></li></ul></li></ul><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><br><strong>An important insight from DeepMind.</strong> The London-based Google company DeepMind has investigated what the compute-optimal number of tokens for training a certain LLM size is. In simpler tokens 🫠, I have a model with X trainable parameters, how much training data do I need in order to have an optimally trained language model? These are the so-called Chinchilla scaling laws [7]. <br>In the table below it’s quite interesting to see that, for example, OpenAI’s GPT-3 model with 175B parameters would be compute-optimally trained if the training set had 3.7T tokens. In fact, it was trained on just 300B tokens [8]. Is it now undertrained? 
Most likely, yes, but keep in mind that DeepMind published their work [7] after GPT-3’s release. Now, the world looks different.<br></p>
    </td>
  </tr>
</tbody></table>

</div>
<div id="image-image-section-below-9">
<table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" bgcolor="transparent" class="image-section below-layout section-content">

  
  <tbody><tr>
    <td class="spacing-above" height="44"></td>
  </tr>


  
    <tr>
      <td>
        <table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0">
          <tbody><tr>
              

            <td align="left" valign="middle" class="section-image-cell section-content-cell section-hoverable-image" data-aspect="ORIGINAL" style="padding:0;">
              
  <img class="section-scaleable-image" src="https://images.squarespace-cdn.com/content/5bfd6f322487fdb33ce53474/5e389876-7753-4bfa-a1e6-ebf8992bc9cb/Screenshot+2022-10-05+at+22.00.10.png?content-type=image%2Fpng&amp;format=750w" width="594" alt="" style="font-size:.6630127298444131em;display:block;border:0;text-decoration:none;line-height:0;background-color:transparent;font-weight:normal;height:auto;width:100%;max-width:100%;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">


            </td>
              

          </tr>
        </tbody></table>
      </td>
    </tr>
    
  
  
  <tr>
    <td bgcolor="transparent" class="spacing-below" height="44"></td>
  </tr>



</tbody></table>

</div>
<div id="text-text-section-10">



<table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" bgcolor="transparent" class="text-section section-content">
  <tbody><tr>
    <td valign="top" class="section-text-area section-content-cell" style="padding-top:11px;padding-right:22px;padding-bottom:11px;padding-left:22px;color:#000;background-color:transparent;">
      <p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><strong>OpenAI’s GPTs.</strong> OpenAI is known for its strong language models. When released, they outperform current state-of-the-art LLMs significantly. I.e. OpenAI released GPT in 2018, GPT-2 in 2019, and GPT-3 in 2020. GPT-4 has been announced, but is quite delayed, presumably due to the attention that DALL-E and CLIP have drawn in the last 18 months or so. Earlier I wrote about AI image generation [9] to provide a big-picture perspective.<br>Assuming GPT-4 has at least the size of GPT-3 and taking the Chinchilla scaling laws into account, they would need 3.7T tokens for training. That is 12 times as much training data as OpenAI had available for GPT-3, and probably more.<br><br><strong>Training data is needed. </strong>OpenAI is missing training data. Moreover, I think it is a fair assumption that all other companies building next-gen LLMs are missing training data. <br>How to bridge the data gap? According to some resources [8], Wikipedia is around 3B tokens, accessible books around 67B tokens, and web crawls around 430B tokens, resulting in a little over 500B tokens. Still, 3.2T tokens are missing. <br>Then synthetic data comes into play, which should not provide the rest of the missing data, for 2 reasons: first, current data augmentation models are good, but don’t provide enough data diversity to make up for 86% of the training data. Second, there is more real-world data out there. I am talking about video data. <br>Why not transcribe all available video data? This is deffo one of the main reasons why Whisper exists. There are well-reasoned estimates that YouTube alone has roughly 12T tokens [10]. As good fortune would have it, there is already a Hugging Face space that implemented a Youtube-Whisper model [11]. 
Plus, it’s fun to try it out.<br>I reckon it’s better to stop here, as I will follow up on this once GPT-4 is out.</p>
    </td>
  </tr>
</tbody></table>

</div>
<div id="image-image-section-side-11">
<table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" align="center" bgcolor="#FFFFFF" class="image-section side-layout section-content" style="width:100% !important;">

  
  <tbody><tr>
    <td class="spacing-above" height="44"></td>
  </tr>


  
    
    <tr><td><table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" align="center" bgcolor="#FFFFFF" class="side-layout" style="width:100% !important;"><tbody><tr>

    

  <th class="stack-cell-wrap w100p section-image-cell section-content-cell section-hoverable-image" align="left" data-aspect="ORIGINAL" style="padding:0;width:66%;vertical-align:middle;font-weight:normal;">
    
  <img class="section-scaleable-image" src="https://images.squarespace-cdn.com/content/5bfd6f322487fdb33ce53474/a41a5c61-e8cf-4521-bedc-3eefffb545e9/DALL%25C2%25B7E%2B2022-10-06%2B16.47.57%2B-%2Bartsy%2Boilpainting%2Babout%2Ba%2Bperson%2Bthat%2Bunderstands%2Ball%2Blanguages.%2Bthis%2Bperson%2Btakes%2Bhis%2Bhand%2Bbehind%2Bthe%2Bear%2Band%2Blistens.%2Balso%2Bthis%2Bperson%2Bhas%2Ba%2Bfish%2Bin.jpg?content-type=image%2Fjpeg&amp;format=750w" width="297" alt="My DALL-E prompt:
&quot;artsy oilpainting about a person that understands all languages. this person takes his hand behind the ear and listens. also this person has a fish in its ear. it is a colorful picture.&quot;" style="font-size:.6630127298444131em;display:block;border:0;text-decoration:none;line-height:0;background-color:transparent;font-weight:normal;height:auto;width:100%;max-width:100%;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">


  </th>
    

  <th class="stack-cell-wrap w100p section-text-area section-content-cell" align="left" style="color:#000;vertical-align:middle;font-weight:normal;">
    <table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" align="center" class="side-layout" style="width:100% !important;"><tbody><tr><td class="section-text-cell" style="padding-top:22px;padding-right:22px;padding-bottom:22px;padding-left:22px;">
      <div class="section-caption-text" style="position:relative;"><p class="" style="font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;color:#313131;">My DALL-E prompt:<br><em>artsy oilpainting about a person that understands all languages. this person takes his hand behind the ear and listens. also this person has a fish in its ear. it is a colorful picture.</em></p></div>
    </td></tr></tbody></table>
  </th>
    

</tr></tbody></table></td></tr>


    
  
  
  <tr>
    <td bgcolor="#FFFFFF" class="spacing-below" height="44"></td>
  </tr>



</tbody></table>

</div>
<div id="text-text-section-12">



<table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" bgcolor="transparent" class="text-section section-content">
  <tbody><tr>
    <td valign="top" class="section-text-area section-content-cell" style="padding-top:22px;padding-right:22px;padding-bottom:11px;padding-left:22px;color:#313131;background-color:transparent;">
      <p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><strong>What could Whisper’s impact be? </strong>💡<br>Besides the point I made above about how Whisper is a strategic move in order to get bigger and better datasets, there is a plethora of other applications to think about. </p><ul data-rte-list="default" style="padding-left:25px;"><li style="font-weight:normal;margin-top:0px;margin-bottom:0px;margin-left:15px;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">Imagine you could take study notes with your voice without having to check them constantly.</p></li><li style="font-weight:normal;margin-top:0px;margin-bottom:0px;margin-left:15px;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">Accurate subtitles in videos/ movies for all languages.</p></li><li style="font-weight:normal;margin-top:0px;margin-bottom:0px;margin-left:15px;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, 
sans-serif;">Whisper could signify a quality-of-life improvement for people with speech or hearing impairments. For instance, you could instantly transcribe your words for a deaf person.</p></li><li style="font-weight:normal;margin-top:0px;margin-bottom:0px;margin-left:15px;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">Further, on the topic of language barriers, do you know/remember the movie <em>The Hitchhiker’s Guide to the Galaxy</em>? There was the Babelfish [12], a fish that, once you stick it in your ear, translates every galactic language in real time. Imagine a headphone-like device that tears down all language barriers. And, it is even called Whisper!</p></li><li style="font-weight:normal;margin-top:0px;margin-bottom:0px;margin-left:15px;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">Lastly, just think about the innumerable applications in law, healthcare, banking, marketing, and education. There are plenty of ways companies could integrate Whisper into existing services. </p></li></ul><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">What other applications seem obvious to you? 
</p><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;height:1.618em;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"></p><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><strong>Generative AI Top 3 Gems </strong>💎 </p><ol data-rte-list="default" style="padding-left:25px;"><li style="font-weight:normal;margin-top:0px;margin-bottom:0px;margin-left:15px;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><a href="https://developer.nvidia.com/maxine#nvidia-maxine" rel="nofollow" style="color:#1d8fb4 !important;">NVidia Maxine</a> for real-time audio and video communication. 
Particularly interesting is the <a href="https://developer.nvidia.com/maxine#ae-sdk" rel="nofollow" style="color:#1d8fb4 !important;">feature for turning on/ off the eye contact</a> of the other person, improving personal touch in remote video calls.</p></li><li style="font-weight:normal;margin-top:0px;margin-bottom:0px;margin-left:15px;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">Editorial feature from Google Arts &amp; Culture: <a href="https://artsandculture.google.com/story/VwVhbAD7QslgLA" rel="nofollow" style="color:#1d8fb4 !important;">12 great AI-created songs</a>. The whole web page is a piece of art, I think.</p></li><li style="font-weight:normal;margin-top:0px;margin-bottom:0px;margin-left:15px;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">This <a href="https://christiancantrell.com#ai-ml" rel="nofollow" style="color:#1d8fb4 !important;">Photoshop Plugin</a> integrates stable diffusion. You can generate high-quality images in the tool like you do with DALL-E, Parti AI, and other models, see [13].</p></li></ol><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;height:1.618em;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"></p>
    </td>
  </tr>
</tbody></table>

</div>
<div id="text-text-section-13">



<table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" bgcolor="transparent" class="text-section section-content">
  <tbody><tr>
    <td valign="top" class="section-text-area section-content-cell" style="padding-top:11px;padding-right:22px;padding-bottom:11px;padding-left:22px;color:#313131;background-color:transparent;">
      <p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">Subscribing to, giving feedback about, and sharing the <a href="https://generativeai.net/newsletter" rel="nofollow" style="color:#1d8fb4 !important;">newsletter</a> as well as our <a href="https://www.udemy.com/course/generative-ai/?referralCode=6A16021D86142A4EAB93" rel="nofollow" style="color:#1d8fb4 !important;">renowned online course</a> is highly appreciated and helps a lot. 🌝</p><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">Do you know about 💎 GAI Gems that we should consider? Or other matters? <br>Please respond to this email.</p><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">Thank you for reading, </p><p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;">Martin </p>
    </td>
  </tr>
</tbody></table>

</div>
<div id="line-line-section-14">

<table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" bgcolor="transparent" class="line-section section-content">
  <tbody><tr>
    <td align="center" valign="middle" width="100%">
      <table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" class="line-section-table section-content" style="width:20%;min-width:20%;">
        <tbody><tr>
          <td align="center" valign="middle" class="section-content-cell" width="100%" style="padding-top:22px;padding-right:0;padding-bottom:22px;padding-left:0;">
            <div class="basic-line" data-line="solid" style="background:none;font-size:0;margin:0;line-height:0;height:0;width:100%;border-style:solid none;border-width:1px 0 0px;border-color:#000;">&nbsp;</div>
          </td>
        </tr>
      </tbody></table>
    </td>
  </tr>
</tbody></table>

</div>
<div id="text-text-section-15">



<table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" bgcolor="transparent" class="text-section section-content">
  <tbody><tr>
    <td valign="top" class="section-text-area section-content-cell" style="padding-top:11px;padding-right:22px;padding-bottom:11px;padding-left:22px;color:#313131;background-color:transparent;">
      <p class="" style="color:inherit;font-size:.9375em;line-height:1.618em;margin:0 0 1.25em 0;font-weight:normal;margin-top:0;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;"><strong>References:</strong><br>[1] <a href="https://en.wikipedia.org/wiki/GPT-3" rel="nofollow" style="color:#1d8fb4 !important;">OpenAI’s language model GPT-3</a>.<br>[2] <a href="https://ai.googleblog.com/2022/04/pathways-language-model-palm-scaling-to.html" rel="nofollow" style="color:#1d8fb4 !important;">Google’s Pathways Language Model</a>.<br>[3] <a href="https://twitter.com/karpathy/status/1573123790795837440" rel="nofollow" style="color:#1d8fb4 !important;">Andrej plays with Whisper</a>.<br>[4] <a href="https://huggingface.co/spaces/openai/whisper" rel="nofollow" style="color:#1d8fb4 !important;">Hugging Face Demo</a>. <br>[5] <a href="https://github.com/openai/whisper" rel="nofollow" style="color:#1d8fb4 !important;">Whisper’s code</a>.<br>[6] <a href="https://cdn.openai.com/papers/whisper.pdf" rel="nofollow" style="color:#1d8fb4 !important;">OpenAI’s paper about Whisper</a>.<br>[7] <a href="https://arxiv.org/abs/2203.15556" rel="nofollow" style="color:#1d8fb4 !important;">DeepMind’s paper: Training Compute-Optimal Large Language Models</a>.<br>[8] <a href="https://www.sigmoid.com/blogs/gpt-3-all-you-need-to-know-about-the-ai-language-model/" rel="nofollow" style="color:#1d8fb4 !important;">GPT-3: all you need to know</a>. 
<br>[9] <a href="https://generativeai.net/campaigns/view-campaign/vgJ0VNygbSL1BnEtxvMrWjOtn_CgjUhNcncVkcz4xaNTaSOY8YdCI6IEXUS6Hn2_wYm-_xXpjrtV927nxjRzapOoFxboClzI" rel="nofollow" style="color:#1d8fb4 !important;">Episode 2 of this newsletter about AI image generation</a>.<br>[10] <a href="https://twitter.com/HenriLemoine13/status/1572846452895875073?utm_medium=email&amp;utm_source=substack" rel="nofollow" style="color:#1d8fb4 !important;">Estimates of how many tokens there are on YouTube</a>.<br>[11] <a href="https://huggingface.co/spaces/jeffistyping/Youtube-Whisperer" rel="nofollow" style="color:#1d8fb4 !important;">Hugging Face space for Youtube-Whisperer</a>.<br>[12] <a href="https://www.youtube.com/watch?v=YWqHkYtREAE" rel="nofollow" style="color:#1d8fb4 !important;">Babelfish in The Hitchhiker’s Guide to the Galaxy - video</a>.<br>[13] <a href="https://colab.research.google.com/github/alembics/disco-diffusion/blob/main/Disco_Diffusion.ipynb" rel="nofollow" style="color:#1d8fb4 !important;">IPython notebook to try it out yourself.</a></p>
    </td>
  </tr>
</tbody></table>

</div>
<div id="line-line-section-16">

<table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" bgcolor="transparent" class="line-section section-content">
  <tbody><tr>
    <td align="center" valign="middle" width="100%">
      <table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" class="line-section-table section-content" style="width:93%;min-width:93%;">
        <tbody><tr>
          <td align="center" valign="middle" class="section-content-cell" width="100%" style="padding-top:22px;padding-right:0;padding-bottom:22px;padding-left:0;">
            <div class="basic-line" data-line="solid" style="background:none;font-size:0;margin:0;line-height:0;height:0;width:100%;border-style:solid none;border-width:1px 0 1px;border-color:#000;">&nbsp;</div>
          </td>
        </tr>
      </tbody></table>
    </td>
  </tr>
</tbody></table>

</div>
                </td>
              </tr>
            </tbody></table>
            
              <table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" id="newsletter-section-footer">
                <tbody><tr>
                  <td align="center" valign="top" id="newsletter-section-footer-cell">
                    
<div id="footer-footer-section-split-right-0">



<table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" bgcolor="transparent" class="footer-section footer-section-split section-content" style="background-color:transparent;">
  <tbody><tr>
    <td align="left" valign="top" class="section-text-area section-content-cell" style="padding-top:0px;padding-right:22px;padding-bottom:0px;padding-left:22px;">
      <table role="presentation" width="100%" cellpadding="0" cellspacing="0" border="0" bgcolor="transparent" class="footer-section footer-section-split section-content" style="background-color:transparent;">
        <tbody><tr>
          <th align="left" valign="top" class="stack-cell-down w100p section-text-area" style="width:50%;">
            

            
            
  
  <p class="footer-company-info" style="line-height:1.618em;font-weight:normal;margin-top:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;color:#000;font-size:11px;margin:0 0 13.75px 0;padding:0;"><a style="color:#000;text-decoration:none;font-size:inherit;font-family:inherit;font-weight:inherit;line-height:inherit;cursor:default;">
    
      GenerativeAI.net<br>
    
    
      Nymphenburger Straße <br>
    
    
      Munich<br>
    
    
      Germany
    
  </a></p>
  

            
<p class="footer-links" style="line-height:1.618em;font-weight:normal;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;color:#000;font-size:11px;margin:0 0 13.75px 0;padding:0;">
  Powered by <a href="https://www.squarespace.com?channel=product_refer&amp;subchannel=customer&amp;source=email_campaigns_button&amp;campaign=5bfd6f322487fdb33ce53474&amp;utm_medium=product_refer&amp;utm_source=email_campaigns_button" class="sqsp-link" style="color:#000;text-decoration:underline;display:inline-block;">Squarespace</a>
</p>


            <p class="footer-links" style="line-height:1.618em;font-weight:normal;margin-bottom:0;font-family:'Segoe UI', Candara, 'Bitstream Vera Sans', 'DejaVu Sans', 'Trebuchet MS', Verdana, sans-serif;color:#000;font-size:11px;margin:0 0 13.75px 0;padding:0;">
  <a href="#" class="unsubscribe-link" style="text-decoration:underline;color:#313131;">
    <span class="unsubscribe-link-text" style="font-size:inherit;font-weight:inherit;line-height:inherit;margin:0;">Unsubscribe</span>
  </a>
</p>

          </th>
          <th align="right" valign="top" class="stack-cell-up w100p text-left section-text-area" style="width:50%;text-align:right;">
            
  
  
  
    
  

          </th>
        </tr>
      </tbody></table>
    </td>
  </tr>
</tbody></table>

</div>
                  </td>
                </tr>
              </tbody></table>
            
          </td>
        </tr>
      </tbody></table>
    </td>
  </tr>
</tbody></table>

  
</body></html>
