<?xml version="1.0" encoding="UTF-8" ?>
<rss version="2.0">
    <channel>
      <title>Nhox&#039;s notes</title>
      <link>https://blog.nhoxanboc.work</link>
      <description>Last 10 notes on Nhox&#039;s notes</description>
      <generator>Quartz -- quartz.jzhao.xyz</generator>
      <item>
    <title>Chap 1</title>
    <link>https://blog.nhoxanboc.work/spark/spark_chap1</link>
    <guid>https://blog.nhoxanboc.work/spark/spark_chap1</guid>
    <description><![CDATA[  Apache Spark is an open-source analytics engine for large-scale data processing and machine learning applications. Spark can process an increasingly vast amount of data by scaling out (across multiple smaller machines) instead of scaling up. Spark Cluster │ ├── Node 1 ──┐ ├── Node 2 ──┼──► Master ──... ]]></description>
    <pubDate>Fri, 29 May 2026 00:04:40 GMT</pubDate>
  </item><item>
    <title>Chap 2</title>
    <link>https://blog.nhoxanboc.work/spark/spark_chap2</link>
    <guid>https://blog.nhoxanboc.work/spark/spark_chap2</guid>
    <description><![CDATA[ RDD vs Data Frame. ]]></description>
    <pubDate>Fri, 29 May 2026 00:04:40 GMT</pubDate>
  </item><item>
    <title>Spark</title>
    <link>https://blog.nhoxanboc.work/spark/</link>
    <guid>https://blog.nhoxanboc.work/spark/</guid>
    <description><![CDATA[  Everything I know about Spark, a distributed processing engine. ]]></description>
    <pubDate>Tue, 26 May 2026 15:40:04 GMT</pubDate>
  </item><item>
    <title>Cache vs Buffer</title>
    <link>https://blog.nhoxanboc.work/cache_buffer</link>
    <guid>https://blog.nhoxanboc.work/cache_buffer</guid>
    <description><![CDATA[ Cache Store data for reuse --- data saved to avoid recomputing or re-fetching Buffer Store data in transit I/O Buffer Your app writes data: app → [buffer] → disk Without buffer: With buffer: write 1 byte → disk collect 1000 writes in buffer write 1 byte → disk → flush to disk in one operation write ... ]]></description>
    <pubDate>Mon, 18 May 2026 15:59:31 GMT</pubDate>
  </item><item>
    <title>Interview Questions</title>
    <link>https://blog.nhoxanboc.work/interview_prep</link>
    <guid>https://blog.nhoxanboc.work/interview_prep</guid>
    <description><![CDATA[ Q1: What did you do to improve yourself ? weqweqeq Q2: How to present to / make non-technical stakeholders understand the data/logic ? qweqwe Q3: What did you do to ensure data accuracy ? Q4: What is a technical challenge you faced ? Q5: How did you fix a bug in production ? What did you do to solve it ?... ]]></description>
    <pubDate>Mon, 18 May 2026 15:59:31 GMT</pubDate>
  </item><item>
    <title>Postgres</title>
    <link>https://blog.nhoxanboc.work/Data/postgres</link>
    <guid>https://blog.nhoxanboc.work/Data/postgres</guid>
    <description><![CDATA[ PostgreSQL — Sone My Notes Table of Contents Index Types Transaction Isolation Levels &amp; Phantom Reads Query Planning MVCC — xmin, xmax, and Dead Tuples VACUUM Heap &amp; Bitmap Index Scan JOIN Types &amp; Best Practices PostgreSQL vs MySQL vs MS SQL Server 1. ]]></description>
    <pubDate>Tue, 12 May 2026 15:09:17 GMT</pubDate>
  </item><item>
    <title>Databricks</title>
    <link>https://blog.nhoxanboc.work/databrick</link>
    <guid>https://blog.nhoxanboc.work/databrick</guid>
    <description><![CDATA[  ]]></description>
    <pubDate>Tue, 12 May 2026 15:09:17 GMT</pubDate>
  </item><item>
    <title>dbt</title>
    <link>https://blog.nhoxanboc.work/dbt</link>
    <guid>https://blog.nhoxanboc.work/dbt</guid>
    <description><![CDATA[  ]]></description>
    <pubDate>Tue, 12 May 2026 15:09:17 GMT</pubDate>
  </item><item>
    <title>AWS Aurora</title>
    <link>https://blog.nhoxanboc.work/path-to-AWS-DEA/aws_aurora</link>
    <guid>https://blog.nhoxanboc.work/path-to-AWS-DEA/aws_aurora</guid>
    <description><![CDATA[  ]]></description>
    <pubDate>Tue, 12 May 2026 15:09:17 GMT</pubDate>
  </item><item>
    <title>ElasticSearch</title>
    <link>https://blog.nhoxanboc.work/elastic_search</link>
    <guid>https://blog.nhoxanboc.work/elastic_search</guid>
    <description><![CDATA[  ]]></description>
    <pubDate>Sat, 09 May 2026 14:32:39 GMT</pubDate>
  </item>
    </channel>
  </rss>