<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    
    <!-- Channel metadata: feed title, tagline and the site's home page. -->
    <title>Rahul Baburajan</title>
    <description>This website is a virtual proof that I'm awesome</description>
    <link>https://kaminocode.github.io/</link>
    <!-- Atom link with rel="self", pointing at the feed.xml document. -->
    <atom:link rel="self" type="application/rss+xml" href="https://kaminocode.github.io/feed.xml"/>
    
    
      <!-- Feed entry for the "Cleaning text data with regex" post. -->
      <item>
        <title>Cleaning text data with regex</title>
        <!-- Excerpt is kept on a single line with no padding: whitespace inside a text element is passed to feed consumers as data. -->
        <description>Why regex is a superhero in the LLM world - Regular expressions (regex) are indispensable in the realm of data cleaning and preparation, particularly for Large Language Models (LLMs) in natural language processing. The majority of data available, especially from extensive sources like Project Gutenberg, is often unstructured and cluttered with extraneous information. Regex excels in such environments, providing a...</description>
        <pubDate>Tue, 06 Sep 2022 00:00:00 -0400</pubDate>
        <link>https://kaminocode.github.io/2022-09-06-regex-medium/</link>
        <!-- The guid repeats the post URL from <link> and is flagged as a permalink. -->
        <guid isPermaLink="true">https://kaminocode.github.io/2022-09-06-regex-medium/</guid>
      </item>
    
  </channel>
</rss>
