<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet href="/rss.xsl" type="text/xsl"?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom" xmlns:fh="http://purl.org/syndication/history/1.0">
  <channel>
    <title>Posts tagged: data Archive</title>
    <link>https://go.waylonwalker.com/tags/data/</link>
    <description>All posts with the tag &#34;data&#34;</description>
    <lastBuildDate>Mon, 09 Jun 2025 13:31:30 +0000</lastBuildDate>
    <generator>markata-go</generator>
    <docs>https://www.rssboard.org/rss-specification</docs>
    <atom:link href="https://go.waylonwalker.com/tags/data/archive/rss.xml" rel="self" type="application/rss+xml"></atom:link>
    <atom:link href="https://go.waylonwalker.com/tags/data/rss.xml" rel="current" type="application/rss+xml"></atom:link>
    <fh:complete></fh:complete>
    <item>
      <title>💭 Taming file zoos: Data science with DuckDB database files - Al...</title>
      <link>https://go.waylonwalker.com/thought-681/</link>
      <description>!https://www.youtube.com/watch?v=Yq-hxgysWLQ</description>
      <pubDate>Mon, 09 Jun 2025 13:31:30 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-681/</guid>
      <author>hello@waylonwalker.com</author>
      <category>python</category>
      <category>data</category>
      <category>thought</category>
    </item>
    <item>
      <title>💭 hotel_bookings.csv</title>
      <link>https://go.waylonwalker.com/thought-583/</link>
      <description>!https://www.kaggle.com/datasets/ahmedsafwatgb20/hotel-bookingscsv?resource=download</description>
      <pubDate>Sat, 15 Mar 2025 22:32:44 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-583/</guid>
      <author>hello@waylonwalker.com</author>
      <category>data</category>
      <category>thought</category>
    </item>
    <item>
      <title>sqlite vacuum</title>
      <link>https://go.waylonwalker.com/sqlite-vacuum/</link>
      <description>Today I learned how to VACUUM a sqlite database and cut its size in about half. It&#39;s a database that I have had running for quite a while and has some decent...</description>
      <pubDate>Tue, 16 Apr 2024 21:31:24 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/sqlite-vacuum/</guid>
      <author>hello@waylonwalker.com</author>
      <category>data</category>
    </item>
    <item>
      <title>💭 searching my thoughts locally</title>
      <link>https://go.waylonwalker.com/thought-211/</link>
      <description>!None</description>
      <pubDate>Thu, 07 Mar 2024 23:42:00 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-211/</guid>
      <author>hello@waylonwalker.com</author>
      <category>sqlite</category>
      <category>data</category>
      <category>blog</category>
      <category>thought</category>
    </item>
    <item>
      <title>💭 Open source, not open contribution with Ben Johnson (Changelog...</title>
      <link>https://go.waylonwalker.com/thought-122/</link>
      <description>!https://changelog.com/podcast/433</description>
      <pubDate>Thu, 05 Oct 2023 01:11:19 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-122/</guid>
      <author>hello@waylonwalker.com</author>
      <category>sqlite</category>
      <category>data</category>
      <category>database</category>
      <category>thought</category>
    </item>
    <item>
      <title>💭 DjangoCon Europe 2023 | Use SQLite in production - YouTube</title>
      <link>https://go.waylonwalker.com/thought-120/</link>
      <description>!https://www.youtube.com/watch?v=yTicYJDT1zE&amp;t=2s</description>
      <pubDate>Tue, 03 Oct 2023 13:22:19 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-120/</guid>
      <author>hello@waylonwalker.com</author>
      <category>sqlite</category>
      <category>data</category>
      <category>database</category>
      <category>thought</category>
    </item>
    <item>
      <title>Set up minio bucket entrypoint</title>
      <link>https://go.waylonwalker.com/set-up-minio-bucket-entrypoint/</link>
      <description>I recently set up minio object storage in my homelab for litestream sqlite backups. The litestream quickstart made it easy to get everything up and running...</description>
      <pubDate>Sun, 01 Oct 2023 20:11:51 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/set-up-minio-bucket-entrypoint/</guid>
      <author>hello@waylonwalker.com</author>
      <category>data</category>
    </item>
    <item>
      <title>💭 benbjohnson/litestream: Streaming replication for SQLite.</title>
      <link>https://go.waylonwalker.com/thought-119/</link>
      <description>!https://github.com/benbjohnson/litestream</description>
      <pubDate>Sun, 01 Oct 2023 02:19:18 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-119/</guid>
      <author>hello@waylonwalker.com</author>
      <category>sqlite</category>
      <category>data</category>
      <category>database</category>
      <category>thought</category>
    </item>
    <item>
      <title>why-is-postgres-default</title>
      <link>https://go.waylonwalker.com/why-is-postgres-default/</link>
      <description>Serious question.</description>
      <pubDate>Sat, 30 Sep 2023 21:26:36 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/why-is-postgres-default/</guid>
      <author>hello@waylonwalker.com</author>
      <category>webdev</category>
      <category>data</category>
    </item>
    <item>
      <title>💭 Why I Built Litestream - Litestream</title>
      <link>https://go.waylonwalker.com/thought-118/</link>
      <description>!https://litestream.io/blog/why-i-built-litestream/</description>
      <pubDate>Sat, 30 Sep 2023 16:16:47 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-118/</guid>
      <author>hello@waylonwalker.com</author>
      <category>sqlite</category>
      <category>data</category>
      <category>database</category>
      <category>thought</category>
    </item>
    <item>
      <title>💭 I&#39;m All-In on Server-Side SQLite · The Fly Blog</title>
      <link>https://go.waylonwalker.com/thought-117/</link>
      <description>!https://fly.io/blog/all-in-on-sqlite-litestream/</description>
      <pubDate>Sat, 30 Sep 2023 14:54:33 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-117/</guid>
      <author>hello@waylonwalker.com</author>
      <category>sqlite</category>
      <category>data</category>
      <category>database</category>
      <category>thought</category>
    </item>
    <item>
      <title>💭 LiteFS Cloud: Distributed SQLite with Managed Backups · The Fl...</title>
      <link>https://go.waylonwalker.com/thought-116/</link>
      <description>!https://fly.io/blog/litefs-cloud/</description>
      <pubDate>Sat, 30 Sep 2023 14:49:41 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-116/</guid>
      <author>hello@waylonwalker.com</author>
      <category>sqlite</category>
      <category>data</category>
      <category>database</category>
      <category>thought</category>
    </item>
    <item>
      <title>💭 SQLite FTS5 Extension</title>
      <link>https://go.waylonwalker.com/thought-96/</link>
      <description>!https://www.sqlite.org/fts5.html</description>
      <pubDate>Mon, 21 Aug 2023 13:33:24 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-96/</guid>
      <author>hello@waylonwalker.com</author>
      <category>sqlite</category>
      <category>data</category>
      <category>database</category>
      <category>thought</category>
    </item>
    <item>
      <title>💭 simonw/datasette-render-markdown: Datasette plugin for renderi...</title>
      <link>https://go.waylonwalker.com/thought-90/</link>
      <description>!https://github.com/simonw/datasette-render-markdown</description>
      <pubDate>Wed, 16 Aug 2023 00:48:07 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-90/</guid>
      <author>hello@waylonwalker.com</author>
      <category>python</category>
      <category>data</category>
      <category>database</category>
      <category>sqlite</category>
      <category>thought</category>
    </item>
    <item>
      <title>💭 `ValueError: Constraint must have a name` in alembic 1.10.0 · ...</title>
      <link>https://go.waylonwalker.com/thought-71/</link>
      <description>!https://github.com/sqlalchemy/alembic/issues/1195</description>
      <pubDate>Sat, 05 Aug 2023 01:25:07 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-71/</guid>
      <author>hello@waylonwalker.com</author>
      <category>python</category>
      <category>data</category>
      <category>database</category>
      <category>alembic</category>
      <category>thought</category>
    </item>
    <item>
      <title>💭 Use Alembic Check to check for possible upgrades</title>
      <link>https://go.waylonwalker.com/thought-70/</link>
      <description>!None</description>
      <pubDate>Sat, 05 Aug 2023 01:22:06 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-70/</guid>
      <author>hello@waylonwalker.com</author>
      <category>python</category>
      <category>data</category>
      <category>database</category>
      <category>alembic</category>
      <category>thought</category>
    </item>
    <item>
      <title>💭 DuckDB vs. MotherDuck — should you switch to the cloud version...</title>
      <link>https://go.waylonwalker.com/thought-63/</link>
      <description>!https://kestra.io/blogs/2023-07-28-duckdb-vs-motherduck</description>
      <pubDate>Mon, 31 Jul 2023 22:36:12 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-63/</guid>
      <author>hello@waylonwalker.com</author>
      <category>data</category>
      <category>database</category>
      <category>duckdb</category>
      <category>thought</category>
    </item>
    <item>
      <title>💭 s3-tree · PyPI</title>
      <link>https://go.waylonwalker.com/thought-61/</link>
      <description>!https://pypi.org/project/s3-tree/</description>
      <pubDate>Sun, 30 Jul 2023 14:37:06 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-61/</guid>
      <author>hello@waylonwalker.com</author>
      <category>python</category>
      <category>cloud</category>
      <category>data</category>
      <category>s3</category>
      <category>thought</category>
    </item>
    <item>
      <title>💭 kndndrj/nvim-dbee: Interactive database client for neovim</title>
      <link>https://go.waylonwalker.com/thought-59/</link>
      <description>!https://github.com/kndndrj/nvim-dbee</description>
      <pubDate>Sat, 29 Jul 2023 01:08:20 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-59/</guid>
      <author>hello@waylonwalker.com</author>
      <category>nvim</category>
      <category>data</category>
      <category>database</category>
      <category>thought</category>
    </item>
    <item>
      <title>💭 sqlite-utils now supports plugins</title>
      <link>https://go.waylonwalker.com/thought-49/</link>
      <description>!https://simonwillison.net/2023/Jul/24/sqlite-utils-plugins/</description>
      <pubDate>Fri, 28 Jul 2023 14:59:37 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-49/</guid>
      <author>hello@waylonwalker.com</author>
      <category>python</category>
      <category>data</category>
      <category>sql</category>
      <category>thought</category>
    </item>
    <item>
      <title>💭 Harlequin SQL IDE - DuckDB</title>
      <link>https://go.waylonwalker.com/thought-35/</link>
      <description>!https://duckdb.org/docs/guides/sql_editors/harlequin</description>
      <pubDate>Fri, 28 Jul 2023 14:59:37 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-35/</guid>
      <author>hello@waylonwalker.com</author>
      <category>python</category>
      <category>data</category>
      <category>duckdb</category>
      <category>textual</category>
      <category>harlequin</category>
      <category>thought</category>
    </item>
    <item>
      <title>💭 Python API - DuckDB</title>
      <link>https://go.waylonwalker.com/thought-34/</link>
      <description>!https://duckdb.org/docs/api/python/overview.html</description>
      <pubDate>Fri, 28 Jul 2023 14:59:37 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-34/</guid>
      <author>hello@waylonwalker.com</author>
      <category>python</category>
      <category>data</category>
      <category>duckdb</category>
      <category>thought</category>
    </item>
    <item>
      <title>💭 SQL on Pandas - DuckDB</title>
      <link>https://go.waylonwalker.com/thought-33/</link>
      <description>!https://duckdb.org/docs/guides/python/sql_pandas</description>
      <pubDate>Fri, 28 Jul 2023 14:59:37 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-33/</guid>
      <author>hello@waylonwalker.com</author>
      <category>python</category>
      <category>data</category>
      <category>duckdb</category>
      <category>pandas</category>
      <category>thought</category>
    </item>
    <item>
      <title>💭 Full-text search - Datasette documentation</title>
      <link>https://go.waylonwalker.com/thought-13/</link>
      <description>!https://docs.datasette.io/en/latest/full_search.html#enabling-full-text-search-for-a-sqlite-table</description>
      <pubDate>Fri, 28 Jul 2023 14:59:37 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-13/</guid>
      <author>hello@waylonwalker.com</author>
      <category>sqlite</category>
      <category>data</category>
      <category>database</category>
      <category>thought</category>
    </item>
    <item>
      <title>💭 sqlite-utils command-line tool - sqlite-utils</title>
      <link>https://go.waylonwalker.com/thought-12/</link>
      <description>!https://sqlite-utils.datasette.io/en/stable/cli.html#querying-data-directly-using-an-in-memory-database</description>
      <pubDate>Fri, 28 Jul 2023 14:59:37 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-12/</guid>
      <author>hello@waylonwalker.com</author>
      <category>sqlite</category>
      <category>data</category>
      <category>database</category>
      <category>sql</category>
      <category>json</category>
      <category>thought</category>
    </item>
    <item>
      <title>💭 sqlite-utils command-line tool - sqlite-utils</title>
      <link>https://go.waylonwalker.com/thought-11/</link>
      <description>!https://sqlite-utils.datasette.io/en/stable/cli.html#inserting-json-data</description>
      <pubDate>Fri, 28 Jul 2023 14:59:37 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/thought-11/</guid>
      <author>hello@waylonwalker.com</author>
      <category>sqlite</category>
      <category>data</category>
      <category>database</category>
      <category>thought</category>
    </item>
    <item>
      <title>Zev Averbach Interview</title>
      <link>https://go.waylonwalker.com/zev-averbach-interview/</link>
      <description>Zev Averbach, _</description>
      <pubDate>Fri, 09 Apr 2021 17:40:42 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/zev-averbach-interview/</guid>
      <author>hello@waylonwalker.com</author>
      <category>data</category>
      <category>python</category>
    </item>
    <item>
      <title>Minimal Kedro Pipeline</title>
      <link>https://go.waylonwalker.com/minimal-kedro-pipeline/</link>
      <description>How small can a minimum kedro pipeline ready to package be? I made one within 4 files that you can pip install. It&#39;s only a total of 35 lines of python, 8 in...</description>
      <pubDate>Wed, 20 Jan 2021 00:00:00 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/minimal-kedro-pipeline/</guid>
      <author>hello@waylonwalker.com</author>
      <category>python</category>
      <category>kedro</category>
      <category>data</category>
    </item>
    <item>
      <title>Blog Data With Python</title>
      <link>https://go.waylonwalker.com/blog-data-with-python/</link>
      <description>Generating an api for a blog is much simpler than one might expect with python.</description>
      <pubDate>Mon, 18 Jan 2021 00:00:00 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/blog-data-with-python/</guid>
      <author>hello@waylonwalker.com</author>
      <category>python</category>
      <category>blog</category>
      <category>data</category>
    </item>
    <item>
      <title>Kedro - My Data Is Not A Table</title>
      <link>https://go.waylonwalker.com/kedro-pickle/</link>
      <description>In python data science/engineering most of our data is in the form of some sort of table, typically a DataFrame from a library like pandas, spark, or dask.</description>
      <pubDate>Thu, 14 Jan 2021 00:00:00 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/kedro-pickle/</guid>
      <author>hello@waylonwalker.com</author>
      <category>kedro</category>
      <category>python</category>
      <category>data</category>
    </item>
    <item>
      <title>Gracefully adopt kedro, the catalog</title>
      <link>https://go.waylonwalker.com/graceful-kedro-catalog/</link>
      <description>While using the catalog alone will not reap all of the benefits of the framework, it does get you and your project ready for the full framework eventually....</description>
      <pubDate>Mon, 29 Jun 2020 03:00:00 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/graceful-kedro-catalog/</guid>
      <author>hello@waylonwalker.com</author>
      <category>kedro</category>
      <category>python</category>
      <category>data</category>
    </item>
    <item>
      <title>How to find things in your kedro catalog</title>
      <link>https://go.waylonwalker.com/kedro-catalog-search/</link>
      <description>kedro 0.16.2 just dropped last week with a long-awaited feature... **! I went as far as monkey patching this into each of my projects. I work jump between a...</description>
      <pubDate>Mon, 22 Jun 2020 03:00:00 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/kedro-catalog-search/</guid>
      <author>hello@waylonwalker.com</author>
      <category>kedro</category>
      <category>python</category>
      <category>data</category>
    </item>
    <item>
      <title>How Kedro handles your inputs</title>
      <link>https://go.waylonwalker.com/kedro-inputs/</link>
      <description>Passing inputs into kedro is a key concept. Understanding how it accepts a single catalog key as input is fairly trivial and easily makes sense, but passing...</description>
      <pubDate>Fri, 19 Jun 2020 03:00:00 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/kedro-inputs/</guid>
      <author>hello@waylonwalker.com</author>
      <category>kedro</category>
      <category>python</category>
      <category>data</category>
    </item>
    <item>
      <title>011</title>
      <link>https://go.waylonwalker.com/011/</link>
      <description>Load _ from database into **</description>
      <pubDate>Sun, 07 Jun 2020 02:09:58 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/011/</guid>
      <author>hello@waylonwalker.com</author>
      <category>data</category>
      <category>python</category>
    </item>
    <item>
      <title>010</title>
      <link>https://go.waylonwalker.com/010/</link>
      <description>load remote _ with **</description>
      <pubDate>Sun, 07 Jun 2020 02:07:13 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/010/</guid>
      <author>hello@waylonwalker.com</author>
      <category>data</category>
      <category>python</category>
    </item>
    <item>
      <title>009</title>
      <link>https://go.waylonwalker.com/009/</link>
      <description>Combine a directory of _ with **</description>
      <pubDate>Sun, 07 Jun 2020 02:02:58 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/009/</guid>
      <author>hello@waylonwalker.com</author>
      <category>data</category>
      <category>python</category>
    </item>
    <item>
      <title>Create Custom Kedro Dataset</title>
      <link>https://go.waylonwalker.com/create-custom-kedro-dataset/</link>
      <description>Kedro provides an efficient way to build out data catalogs with their yaml api. It allows you to be very declarative about loading and saving your data. For...</description>
      <pubDate>Fri, 15 May 2020 05:00:00 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/create-custom-kedro-dataset/</guid>
      <author>hello@waylonwalker.com</author>
      <category>kedro</category>
      <category>python</category>
      <category>data</category>
    </item>
    <item>
      <title>What is YOUR Advice for New Data Scientists</title>
      <link>https://go.waylonwalker.com/data-scientist-advice/</link>
      <description>Learn Git * Keep Learning</description>
      <pubDate>Wed, 26 Feb 2020 12:55:00 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/data-scientist-advice/</guid>
      <author>hello@waylonwalker.com</author>
      <category>data</category>
    </item>
    <item>
      <title>Filtering Pandas</title>
      <link>https://go.waylonwalker.com/filtering-pandas/</link>
      <description>Filtering pandas DataFrames many different ways.</description>
      <pubDate>Tue, 24 Sep 2019 05:00:00 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/filtering-pandas/</guid>
      <author>hello@waylonwalker.com</author>
      <category>python</category>
      <category>data</category>
    </item>
    <item>
      <title>Clean up Your Data Science with Named Tuples</title>
      <link>https://go.waylonwalker.com/named-tuples-data-science/</link>
      <description>If you are a regular listener of TalkPython or PythonBytes you have heard Michael Kennedy talk about Named Tuples many times, but what are they and how do...</description>
      <pubDate>Wed, 11 Sep 2019 00:00:00 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/named-tuples-data-science/</guid>
      <author>hello@waylonwalker.com</author>
      <category>python</category>
      <category>data</category>
    </item>
    <item>
      <title>Background Tasks in Python for Data Science</title>
      <link>https://go.waylonwalker.com/python-data-science-background/</link>
      <description>This post is intended as an extension/update from background tasks in python. I started using the week that Kenneth Reitz released it. It takes away so much...</description>
      <pubDate>Tue, 10 Sep 2019 05:00:00 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/python-data-science-background/</guid>
      <author>hello@waylonwalker.com</author>
      <category>python</category>
      <category>data</category>
    </item>
    <item>
      <title>Generating Readme Tables From Pandas</title>
      <link>https://go.waylonwalker.com/readme-tables/</link>
      <description>none</description>
      <pubDate>Wed, 16 May 2018 00:00:00 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/readme-tables/</guid>
      <author>hello@waylonwalker.com</author>
      <category>data</category>
      <category>python</category>
    </item>
    <item>
      <title>Stepping Up My SQL Game</title>
      <link>https://go.waylonwalker.com/datacamp-sql/</link>
      <description>none</description>
      <pubDate>Sun, 25 Mar 2018 00:00:00 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/datacamp-sql/</guid>
      <author>hello@waylonwalker.com</author>
      <category>data</category>
      <category>sql</category>
    </item>
    <item>
      <title>background tasks in python</title>
      <link>https://go.waylonwalker.com/background-1/</link>
      <description>none</description>
      <pubDate>Sat, 16 Sep 2017 00:00:00 +0000</pubDate>
      <guid isPermaLink="true">https://go.waylonwalker.com/background-1/</guid>
      <author>hello@waylonwalker.com</author>
      <category>python</category>
      <category>data</category>
    </item>
  </channel>
</rss>