<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd" xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
<url>
<loc>https://dorianbg.github.io/posts/gsoc-community-bonding-week-1/</loc>
<lastmod>2017-05-21T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/gsoc-community-bonding-week-2/</loc>
<lastmod>2017-05-21T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/gsoc-community-bonding-week-3/</loc>
<lastmod>2017-05-26T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/detailed-plans-for-my-gsoc-project/</loc>
<lastmod>2017-05-31T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/gsoc-week-1/</loc>
<lastmod>2017-06-01T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/gsoc-week-2/</loc>
<lastmod>2017-06-08T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/how-to-fix-task-not-serializable-issues-in-apache-spark/</loc>
<lastmod>2024-01-19T21:37:38+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/gsoc-week-3/</loc>
<lastmod>2017-06-15T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/get-spark-clasifier-metrics-using-the-confusion-matrix/</loc>
<lastmod>2024-01-19T21:37:38+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/gsoc-week-4/</loc>
<lastmod>2017-06-22T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/gsoc-week-5/</loc>
<lastmod>2017-06-29T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/gsoc-week-6/</loc>
<lastmod>2017-07-06T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/gsoc-week-7/</loc>
<lastmod>2017-07-13T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/gsoc-week-8/</loc>
<lastmod>2017-07-20T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/gsoc-week-9/</loc>
<lastmod>2017-07-26T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/gsoc-week-10/</loc>
<lastmod>2017-08-03T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/gsoc-week-11/</loc>
<lastmod>2017-08-10T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/gsoc-week-12/</loc>
<lastmod>2017-08-18T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/gsoc-week-13/</loc>
<lastmod>2017-08-25T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/google-summer-of-code-2017-summary/</loc>
<lastmod>2017-08-26T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/gsoc-weekly-posts-summary/</loc>
<lastmod>2017-08-27T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/spark-vs-pandas-benchmark-why-you-should-use-spark-only-with-really-big-data/</loc>
<lastmod>2024-01-19T20:58:25+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/sql-server-security-basics-logins-and-users/</loc>
<lastmod>2024-01-19T21:37:38+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/advanced-data-analysis-for-cbioportal/</loc>
<lastmod>2017-09-24T00:00:00+01:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/window-functions/</loc>
<lastmod>2024-01-19T21:37:38+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/windows-functions-in-postgresql/</loc>
<lastmod>2024-01-19T21:37:38+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/introduction-to-lambda-architecture/</loc>
<lastmod>2024-02-03T19:22:55+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/building-the-batch-layer-of-lambda-architecture-using-s3-redshift-and-apache-kafka/</loc>
<lastmod>2024-02-03T19:22:55+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/building-the-serving-layer-of-lambda-architecture-using-redshift/</loc>
<lastmod>2024-02-03T19:22:55+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/building-the-speed-layer-of-lambda-architecture-using-structured-spark-streaming/</loc>
<lastmod>2024-02-03T19:22:55+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/ingesting-realtime-tweets-using-apache-kafka-tweepy-and-python/</loc>
<lastmod>2024-02-03T19:22:55+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/apache-airflow-for-data-pipelines/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/detailed-coverage-of-window-functions-on-snowflake/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/writing-udafs-on-snowflake/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/advanced-spark-structured-streaming-aggregations-joins-checkpointing/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/clustering-keys-snowflake/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/using-spark-structured-streaming-to-upsert-kafka-messages-into-a-database/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/caching-in-snowflake-data-warehouse/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/my-favorite-features-of-snowflake-data-warehouse/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/loading-data-into-snowflake-data-warehouse-and-performance-of-joins/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/my-blog-posts-for-sonra-intelligence/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/apache-spark-presentation/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/development-for-aws/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/how-get-into-top-30-of-house-prices-advanced-regression-kaggle-competition-with-50-lines-of-code/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/envoy-proxy-and-modern-load-balancing/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/playing-with-pg_auto_failover/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/my-view-on-responsibilities-of-a-modern-data-engineer/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/kubernetes-auto-scaling-on-relative-resource-usage/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/data-extraction-and-transformation-design-patterns/</loc>
<lastmod>2024-01-30T23:10:08+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/data-pipeline-design-anti-patterns/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/general-guidelines-for-design-of-batch-jobs/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/important-skills-for-data-engineers/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/modern-data-engineering-stack/</loc>
<lastmod>2024-01-20T12:39:04+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/my-favourite-papers-on-columnar-databases/</loc>
<lastmod>2023-03-18T00:00:00+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/python-tips/</loc>
<lastmod>2024-01-20T10:00:00+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/nginx-vs-haproxy-vs-envoy/</loc>
<lastmod>2024-01-21T09:46:09+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/python-project-setup-best-practice/</loc>
<lastmod>2024-02-10T21:18:50+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/posts/duckdb-postgres-dbt/</loc>
<lastmod>2024-03-03T13:00:13+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/categories/</loc>
<lastmod>2024-03-03T13:00:32+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/tags/</loc>
<lastmod>2024-03-03T13:00:32+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/books/</loc>
<lastmod>2024-03-03T13:00:32+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/about/</loc>
<lastmod>2024-03-03T13:00:32+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/archives/</loc>
<lastmod>2024-03-03T13:00:32+00:00</lastmod>
</url>
<url>
<loc>https://dorianbg.github.io/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/tags/airflow/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/tags/snowflake/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/tags/sql/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/tags/spark/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/tags/kafka/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/tags/aws/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/tags/envoy/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/tags/ha-proxy/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/tags/nginx/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/tags/high-availability/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/tags/postgresql/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/tags/principles/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/tags/kubernetes/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/tags/python/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/tags/duckdb/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/tags/dbt/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/categories/google-summer-of-code/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/categories/data-engineering/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/categories/data-science/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/categories/sql/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/categories/databases/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/categories/cloud/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/categories/software-development/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/categories/load-balancers/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/page2/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/page3/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/page4/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/page5/</loc>
</url>
<url>
<loc>https://dorianbg.github.io/page6/</loc>
</url>
</urlset>
