diff --git a/.DS_Store b/.DS_Store
new file mode 100644
index 0000000..2a847af
Binary files /dev/null and b/.DS_Store differ
diff --git a/fa-etl.py b/fa-etl.py
index e86350e..bbe640a 100644
--- a/fa-etl.py
+++ b/fa-etl.py
@@ -10,6 +10,13 @@ def mem_profile() -> str:
mem_use = str(round(100 - psutil.virtual_memory().percent,4))+'% of '+str(round(psutil.virtual_memory().total/1e+9,3))+' GB RAM'
return mem_use
+def is_lazydataframe_empty(ldf):
+ """
+ Check whether a Polars LazyFrame is empty, based on the row count of its "PropertyID" column.
+ Returns: bool (True if empty, False otherwise)
+ """
+ return ((ldf.describe().filter(pl.col("statistic") == "count")["PropertyID"])[0] == 0)
+
def convert_sales(filename, input_dir):
'''
Convert zipped txt sales (deed) file into parquet format.
@@ -266,6 +273,8 @@ def convert_valhist(filename, input_dir):
input_filepath = input_dir + "/raw/" + filename
output_dir = input_dir + "/" + "staging"
output_filepath = output_dir + "/" + filename.replace(".txt.zip", ".parquet")
+ output_filepath_temp1 = output_dir + "/rankedtemp1_" + filename.replace(".txt.zip", ".parquet")
+ output_filepath_temp2 = output_dir + "/rankedtemp2_" + filename.replace(".txt.zip", ".parquet")
output_filepath_ranked = output_dir + "/ranked_" + filename.replace(".txt.zip", ".parquet")
# check if parquet already exists, if it does, skip
@@ -303,7 +312,7 @@ def convert_valhist(filename, input_dir):
logging.info(f"{output_filepath} already exists. Moving on...")
if not os.path.exists(output_filepath_ranked):
- logging.info(f"Creating {output_filepath_ranked}...")
+ logging.info(f"Creating {output_filepath_temp1}...")
#temp filepaths
assd_filepath = output_dir+"/assd.parquet"
@@ -312,11 +321,7 @@ def convert_valhist(filename, input_dir):
logging.info(f"filepaths: {assd_filepath}, {market_filepath} and {appr_filepath}...")
if not os.path.exists(assd_filepath) & os.path.exists(market_filepath) & os.path.exists(appr_filepath):
-
logging.info(f"Creating assd parquet...")
- #split val hist into three separate datasets with PropertyID, Year as consistent
- ##TODO: this seems super repetitive, but it might be the best option given the size of the dataset.
-
(pl.scan_parquet(Path(output_filepath), low_memory = True, use_statistics=True, hive_partitioning=True)
.with_columns([pl.col('AssdYear').cast(pl.Int64).alias('Year')])
.filter(
@@ -342,9 +347,10 @@ def convert_valhist(filename, input_dir):
#write checks - make sure there are no duplicates in the above (by propID/year)
# if so, raise error and don't proceed
- assd = pl.scan_parquet(Path(assd_filepath), low_memory = True, parallel='auto')
- appr = pl.scan_parquet(Path(appr_filepath), low_memory = True, parallel='auto')
- market = pl.scan_parquet(Path(market_filepath), low_memory = True, parallel='auto')
+
+ assd = pl.scan_parquet(Path(assd_filepath), low_memory = True)
+ appr = pl.scan_parquet(Path(appr_filepath), low_memory = True)
+ market = pl.scan_parquet(Path(market_filepath), low_memory = True)
logging.info(f"Joining assessed values and market values on propid/year...")
# join with market data
@@ -352,40 +358,40 @@ def convert_valhist(filename, input_dir):
other=market,
how="left",
on=['PropertyID', 'Year'],
- ).sink_parquet(Path(output_filepath_ranked), compression="snappy")
-
+ ).sink_parquet(Path(output_filepath_temp1), compression="snappy")
logging.info(f"val/market join on propid/year complete. Starting second join...")
+ rankedtemp1_valhist = pl.scan_parquet(Path(output_filepath_temp1), low_memory = True)
+ logging.info(f"is rankedtemp1_valhist empty? {is_lazydataframe_empty(rankedtemp1_valhist)}")
+
# check if the length of the output of a ldf is 0 (aka dataframe is empty)
logging.info(f"Check if appraisal dataframe is empty...")
- if (appr.describe().filter(pl.col("statistic") == "count")["PropertyID"])[0] != 0:
+ if not is_lazydataframe_empty(appr):
logging.info(f"Appraisal dataframe is not empty! Joining with val/market...")
-
- (pl.scan_parquet(Path(output_filepath_ranked), low_memory = True, parallel='row_groups', use_statistics=False, hive_partitioning=False)
+ (rankedtemp1_valhist
# # join with appr data
).join(
other=appr,
how="left",
on=['PropertyID', 'Year'],
).sink_parquet(
- Path(output_filepath_ranked),
+ Path(output_filepath_temp2),
compression="snappy"
)
- else:
+ else:
logging.info(f"Appraisal dataframe is empty! Adding a col of nulls for appraisal col...")
- (pl.scan_parquet(Path(output_filepath_ranked), low_memory = True, parallel='row_groups', use_statistics=False, hive_partitioning=False)
- # # join with appr data
+ (rankedtemp1_valhist
+ # add col of nulls for ApprTotalValue because not present for any PropIDs
).with_columns([
- # add col of nulls for ApprTotalValue because not present for any PropIDs
pl.when(True).then(None).alias("ApprTotalValue")
]).sink_parquet(
- Path(output_filepath_ranked),
+ Path(output_filepath_temp2),
compression="snappy"
)
logging.info(f"val/market/appr join on propid/year complete. Doing with_cols operations...")
- (pl.scan_parquet(Path(output_filepath_ranked), low_memory = True, parallel='row_groups', use_statistics=False, hive_partitioning=False)
+ (pl.scan_parquet(Path(output_filepath_temp2), low_memory = True)
.with_columns([
#value conditional
pl.when((pl.col("AssdTotalValue").is_not_null()) & (pl.col("AssdTotalValue") != 0))
diff --git a/scratch.ipynb b/scratch.ipynb
index efd9477..d44198f 100644
--- a/scratch.ipynb
+++ b/scratch.ipynb
@@ -2,18 +2,9 @@
"cells": [
{
"cell_type": "code",
- "execution_count": 2,
+ "execution_count": 1,
"metadata": {},
- "outputs": [
- {
- "name": "stdout",
- "output_type": "stream",
- "text": [
- "The autoreload extension is already loaded. To reload it, use:\n",
- " %reload_ext autoreload\n"
- ]
- }
- ],
+ "outputs": [],
"source": [
"#set up autoreload\n",
"%load_ext autoreload\n",
@@ -28,7 +19,7 @@
},
{
"cell_type": "code",
- "execution_count": 69,
+ "execution_count": 9,
"metadata": {},
"outputs": [],
"source": [
@@ -49,7 +40,7 @@
},
{
"cell_type": "code",
- "execution_count": 70,
+ "execution_count": 10,
"metadata": {},
"outputs": [],
"source": [
@@ -57,184 +48,134 @@
" other=market,\n",
" how=\"left\",\n",
" on=['PropertyID', 'Year'],\n",
- ").sink_parquet(Path(output_filepath_ranked), compression=\"snappy\")\n"
+ ").sink_parquet(Path(output_filepath_ranked), compression=\"snappy\")"
]
},
{
"cell_type": "code",
- "execution_count": 71,
+ "execution_count": 12,
"metadata": {},
"outputs": [],
"source": [
- "valhist = pl.read_parquet(path_to_dir+f\"dev/{county}/staging/ranked_ValHist{county}.parquet\")"
+ "ranked_valhist = pl.read_parquet(path_to_dir+f\"dev/{county}/staging/ranked_ValHist{county}.parquet\")"
]
},
{
"cell_type": "code",
- "execution_count": 72,
+ "execution_count": 22,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
- "(3566623, 4)"
+ "False"
]
},
- "execution_count": 72,
+ "execution_count": 22,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
- "valhist.shape"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 43,
- "metadata": {},
- "outputs": [],
- "source": [
- "lf = pl.LazyFrame(\n",
- " {\n",
- " \"a\": [1, 2, 3, 4],\n",
- " \"b\": [0.5, 4, 10, 13],\n",
- " \"c\": [True, True, False, True],\n",
- " }\n",
- ")"
+ "fa_etl.is_lazydataframe_empty(path_to_dir+f\"dev/{county}/staging/ranked_ValHist{county}.parquet\")"
]
},
{
"cell_type": "code",
- "execution_count": 56,
+ "execution_count": 23,
"metadata": {},
"outputs": [
{
"data": {
- "text/html": [
- "
\n",
- "
shape: (4, 4)a | b | c | Appr |
---|
i64 | f64 | bool | null |
1 | 0.5 | true | null |
2 | 4.0 | true | null |
3 | 10.0 | false | null |
4 | 13.0 | true | null |
"
- ],
"text/plain": [
- "shape: (4, 4)\n",
- "┌─────┬──────┬───────┬──────┐\n",
- "│ a ┆ b ┆ c ┆ Appr │\n",
- "│ --- ┆ --- ┆ --- ┆ --- │\n",
- "│ i64 ┆ f64 ┆ bool ┆ null │\n",
- "╞═════╪══════╪═══════╪══════╡\n",
- "│ 1 ┆ 0.5 ┆ true ┆ null │\n",
- "│ 2 ┆ 4.0 ┆ true ┆ null │\n",
- "│ 3 ┆ 10.0 ┆ false ┆ null │\n",
- "│ 4 ┆ 13.0 ┆ true ┆ null │\n",
- "└─────┴──────┴───────┴──────┘"
+ "(3566623, 4)"
]
},
- "execution_count": 56,
+ "execution_count": 23,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
- "lf.with_columns([\n",
- " pl.when(True).then(None).alias(\"ApprTotalValue\")\n",
- "]).collect()"
+ "ranked_valhist.shape"
]
},
{
"cell_type": "code",
- "execution_count": 12,
+ "execution_count": 8,
"metadata": {},
"outputs": [
{
"data": {
- "text/html": [
- "\n",
- "
shape: (0, 16)PropertyID | SaleAmt | RecordingDate | FIPS | FATimeStamp | FATransactionID | TransactionType | SaleDate | RecordingYearSlice | PropertyID_str | FATransactionID_1 | RecordingYear | SaleYear | FATimeStampYear | SaleFlag | PropIDFlag |
---|
i64 | i64 | date | str | date | i64 | str | date | str | str | str | i64 | i32 | i32 | i32 | i32 |
"
- ],
"text/plain": [
- "shape: (0, 16)\n",
- "┌────────────┬─────────┬──────────────┬──────┬───┬──────────┬──────────────┬──────────┬────────────┐\n",
- "│ PropertyID ┆ SaleAmt ┆ RecordingDat ┆ FIPS ┆ … ┆ SaleYear ┆ FATimeStampY ┆ SaleFlag ┆ PropIDFlag │\n",
- "│ --- ┆ --- ┆ e ┆ --- ┆ ┆ --- ┆ ear ┆ --- ┆ --- │\n",
- "│ i64 ┆ i64 ┆ --- ┆ str ┆ ┆ i32 ┆ --- ┆ i32 ┆ i32 │\n",
- "│ ┆ ┆ date ┆ ┆ ┆ ┆ i32 ┆ ┆ │\n",
- "╞════════════╪═════════╪══════════════╪══════╪═══╪══════════╪══════════════╪══════════╪════════════╡\n",
- "└────────────┴─────────┴──────────────┴──────┴───┴──────────┴──────────────┴──────────┴────────────┘"
+ "OrderedDict([('PropertyID', Int64),\n",
+ " ('AssdTotalValue', Int64),\n",
+ " ('AssdYear', Int64),\n",
+ " ('MarketTotalValue', Int64),\n",
+ " ('MarketValueYear', Int64),\n",
+ " ('ApprTotalValue', Int64),\n",
+ " ('ApprYear', Int64),\n",
+ " ('TaxableYear', Int64)])"
]
},
- "execution_count": 12,
+ "execution_count": 8,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
- "sales.filter(\n",
- " pl.col(\"PropIDFlag\") == 1\n",
- ")"
+ "valhist.schema"
]
},
{
"cell_type": "code",
- "execution_count": 12,
+ "execution_count": 24,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "merged = pl.read_parquet(path_to_dir+f\"dev/{county}/unified/merged.parquet\")"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 27,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"\n",
- "
shape: (44_004, 8)PropertyID | Year | Value | AssessmentUsed | SaleAmt | TaxAmt | TaxAmtAdjusted | ApproxTaxRate |
---|
i64 | i64 | i64 | str | i64 | i64 | f64 | f64 |
91847870 | 2018 | 117677 | "Assd" | 1580000 | 1310424 | 13104.24 | 11.13577 |
91849008 | 2018 | 247162 | "Assd" | 4400000 | 3114052 | 31140.52 | 12.599235 |
91848046 | 2018 | 71155 | "Assd" | 712775 | 773352 | 7733.52 | 10.868555 |
91846549 | 2018 | 149310 | "Assd" | 2475000 | 1527372 | 15273.72 | 10.229536 |
91847537 | 2018 | 128574 | "Assd" | 1625000 | 1496148 | 14961.48 | 11.636474 |
91848333 | 2018 | 356895 | "Assd" | 7400000 | 3958776 | 39587.76 | 11.092271 |
91846649 | 2018 | 219589 | "Assd" | 3100000 | 2518932 | 25189.32 | 11.471121 |
91847215 | 2018 | 299300 | "Assd" | 2825000 | 3327036 | 33270.36 | 11.116057 |
91846134 | 2022 | 718067 | "Assd" | 12500000 | 8808528 | 88085.28 | 12.267 |
91847289 | 2018 | 143322 | "Assd" | 2840000 | 1723200 | 17232.0 | 12.023276 |
91848235 | 2018 | 98891 | "Assd" | 840000 | 1074844 | 10748.44 | 10.868977 |
91847234 | 2018 | 97929 | "Assd" | 2000000 | 1138124 | 11381.24 | 11.62193 |
… | … | … | … | … | … | … | … |
91951526 | 2020 | 43461 | "Assd" | 280000 | null | null | null |
91950328 | 2020 | 791550 | "Assd" | 12000000 | null | null | null |
91951497 | 2023 | 388800 | "Assd" | 2613000 | 4860778 | 48607.78 | 12.502001 |
91951494 | 2023 | 423000 | "Assd" | 2321000 | 5288346 | 52883.46 | 12.502 |
91951499 | 2023 | 376200 | "Assd" | 2566000 | 4703252 | 47032.52 | 12.501999 |
91951505 | 2023 | 418950 | "Assd" | 1942000 | 5237713 | 52377.13 | 12.502 |
91951508 | 2023 | 418950 | "Assd" | 2795000 | 5237713 | 52377.13 | 12.502 |
91950049 | 2023 | 88208 | "Assd" | 580000 | 1102776 | 11027.76 | 12.501995 |
91950055 | 2023 | 90672 | "Assd" | 570000 | 1133581 | 11335.81 | 12.501996 |
91949993 | 2023 | 30010 | "Assd" | 550000 | 375185 | 3751.85 | 12.501999 |
91950231 | 2023 | 30130 | "Assd" | 4601351 | 376685 | 3766.85 | 12.501991 |
91951304 | 2023 | 36494 | "Assd" | 971562 | 704863 | 7048.63 | 19.31449 |
"
+ "shape: (5, 17)PropertyID | Year | Value | MarketTotalValue | ApprTotalValue | SitusLatitude | SitusLongitude | SitusFullStreetAddress | SitusCity | SitusState | SitusZIP5 | FIPS | SitusCensusTract | SitusCensusBlock | SaleAmt | TaxAmt | TaxAmtAdjusted |
---|
i64 | i64 | i64 | i64 | null | f64 | f64 | str | str | str | str | str | str | str | i64 | i64 | f64 |
91847870 | 2018 | 117677 | 261504 | null | 40.750965 | -73.982198 | "425 5TH AVE AP… | "NEW YORK" | "NY" | "10016" | "36061" | "008200" | "2004" | 1580000 | 1310424 | 13104.24 |
91849008 | 2018 | 247162 | 1462000 | null | 40.750447 | -73.997723 | "362 W 30TH ST" | "NEW YORK" | "NY" | "10001" | "36061" | "009700" | "4000" | 4400000 | 3114052 | 31140.52 |
91848046 | 2018 | 71155 | 158123 | null | 40.738643 | -73.987954 | "254 PARK AVE S… | "NEW YORK" | "NY" | "10010" | "36061" | "005200" | "1000" | 712775 | 773352 | 7733.52 |
91846549 | 2018 | 149310 | 331800 | null | 40.729262 | -74.004785 | "63 DOWNING ST … | "NEW YORK" | "NY" | "10014" | "36061" | "006700" | "2002" | 2475000 | 1527372 | 15273.72 |
91847537 | 2018 | 128574 | 285721 | null | 40.73889 | -73.987904 | "260 PARK AVE S… | "NEW YORK" | "NY" | "10010" | "36061" | "005200" | "1000" | 1625000 | 1496148 | 14961.48 |
"
],
"text/plain": [
- "shape: (44_004, 8)\n",
- "┌────────────┬──────┬────────┬────────────────┬─────────┬─────────┬────────────────┬───────────────┐\n",
- "│ PropertyID ┆ Year ┆ Value ┆ AssessmentUsed ┆ SaleAmt ┆ TaxAmt ┆ TaxAmtAdjusted ┆ ApproxTaxRate │\n",
- "│ --- ┆ --- ┆ --- ┆ --- ┆ --- ┆ --- ┆ --- ┆ --- │\n",
- "│ i64 ┆ i64 ┆ i64 ┆ str ┆ i64 ┆ i64 ┆ f64 ┆ f64 │\n",
- "╞════════════╪══════╪════════╪════════════════╪═════════╪═════════╪════════════════╪═══════════════╡\n",
- "│ 91847870 ┆ 2018 ┆ 117677 ┆ Assd ┆ 1580000 ┆ 1310424 ┆ 13104.24 ┆ 11.13577 │\n",
- "│ 91849008 ┆ 2018 ┆ 247162 ┆ Assd ┆ 4400000 ┆ 3114052 ┆ 31140.52 ┆ 12.599235 │\n",
- "│ 91848046 ┆ 2018 ┆ 71155 ┆ Assd ┆ 712775 ┆ 773352 ┆ 7733.52 ┆ 10.868555 │\n",
- "│ 91846549 ┆ 2018 ┆ 149310 ┆ Assd ┆ 2475000 ┆ 1527372 ┆ 15273.72 ┆ 10.229536 │\n",
- "│ … ┆ … ┆ … ┆ … ┆ … ┆ … ┆ … ┆ … │\n",
- "│ 91950055 ┆ 2023 ┆ 90672 ┆ Assd ┆ 570000 ┆ 1133581 ┆ 11335.81 ┆ 12.501996 │\n",
- "│ 91949993 ┆ 2023 ┆ 30010 ┆ Assd ┆ 550000 ┆ 375185 ┆ 3751.85 ┆ 12.501999 │\n",
- "│ 91950231 ┆ 2023 ┆ 30130 ┆ Assd ┆ 4601351 ┆ 376685 ┆ 3766.85 ┆ 12.501991 │\n",
- "│ 91951304 ┆ 2023 ┆ 36494 ┆ Assd ┆ 971562 ┆ 704863 ┆ 7048.63 ┆ 19.31449 │\n",
- "└────────────┴──────┴────────┴────────────────┴─────────┴─────────┴────────────────┴───────────────┘"
+ "shape: (5, 17)\n",
+ "┌────────────┬──────┬────────┬───────────────┬───┬──────────────┬─────────┬─────────┬──────────────┐\n",
+ "│ PropertyID ┆ Year ┆ Value ┆ MarketTotalVa ┆ … ┆ SitusCensusB ┆ SaleAmt ┆ TaxAmt ┆ TaxAmtAdjust │\n",
+ "│ --- ┆ --- ┆ --- ┆ lue ┆ ┆ lock ┆ --- ┆ --- ┆ ed │\n",
+ "│ i64 ┆ i64 ┆ i64 ┆ --- ┆ ┆ --- ┆ i64 ┆ i64 ┆ --- │\n",
+ "│ ┆ ┆ ┆ i64 ┆ ┆ str ┆ ┆ ┆ f64 │\n",
+ "╞════════════╪══════╪════════╪═══════════════╪═══╪══════════════╪═════════╪═════════╪══════════════╡\n",
+ "│ 91847870 ┆ 2018 ┆ 117677 ┆ 261504 ┆ … ┆ 2004 ┆ 1580000 ┆ 1310424 ┆ 13104.24 │\n",
+ "│ 91849008 ┆ 2018 ┆ 247162 ┆ 1462000 ┆ … ┆ 4000 ┆ 4400000 ┆ 3114052 ┆ 31140.52 │\n",
+ "│ 91848046 ┆ 2018 ┆ 71155 ┆ 158123 ┆ … ┆ 1000 ┆ 712775 ┆ 773352 ┆ 7733.52 │\n",
+ "│ 91846549 ┆ 2018 ┆ 149310 ┆ 331800 ┆ … ┆ 2002 ┆ 2475000 ┆ 1527372 ┆ 15273.72 │\n",
+ "│ 91847537 ┆ 2018 ┆ 128574 ┆ 285721 ┆ … ┆ 1000 ┆ 1625000 ┆ 1496148 ┆ 14961.48 │\n",
+ "└────────────┴──────┴────────┴───────────────┴───┴──────────────┴─────────┴─────────┴──────────────┘"
]
},
- "execution_count": 12,
+ "execution_count": 27,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
- "merged.filter([\n",
- " pl.col(\"SaleAmt\").is_not_null(),\n",
- " pl.col(\"Year\") > 2017\n",
- "]).select(\n",
- " ['PropertyID','Year','Value','AssessmentUsed','SaleAmt', 'TaxAmt', 'TaxAmtAdjusted']\n",
- ").with_columns([\n",
- " (pl.col('TaxAmt')/pl.col('Value')).alias(\"ApproxTaxRate\")\n",
- "])"
+ "merged.head()"
]
}
],