diff --git a/.gitignore b/.gitignore index e820538..764d297 100644 --- a/.gitignore +++ b/.gitignore @@ -7,4 +7,5 @@ draft*.ipynb *.old .env getting-started/my_nma_dataset.csv -*.sqlite \ No newline at end of file +*.sqlite +anzac-day \ No newline at end of file diff --git a/.zenodo.json b/.zenodo.json index b5e51f4..611da2f 100644 --- a/.zenodo.json +++ b/.zenodo.json @@ -5,7 +5,7 @@ "related_identifiers": [ { "scheme": "url", - "identifier": "https://github.com/GLAM-Workbench/trove-newspaper-harvester/tree/v1.2.2", + "identifier": "https://github.com/GLAM-Workbench/trove-newspaper-harvester/tree/v1.3.0", "relation": "isDerivedFrom", "resource_type": "software" }, @@ -28,7 +28,7 @@ "resource_type": "other" } ], - "version": "v1.2.2", + "version": "v1.3.0", "upload_type": "software", "keywords": [ "Trove", @@ -36,7 +36,7 @@ "Jupyter", "GLAM Workbench" ], - "publication_date": "2022-10-11", + "publication_date": "2023-03-16", "creators": [ { "orcid": "0000-0001-7956-4498", @@ -44,5 +44,5 @@ } ], "access_right": "open", - "description": "

Current version: v1.2.2

The Trove Newspaper & Gazette Harvester Harvester makes it easy to download large quantities of digitised articles from Trove’s newspapers and gazettes. Just give it a search from the Trove web interface, and the harvester will save the metadata of all the articles in a CSV (spreadsheet) file for further analysis. You can also save the full text of every article, as well as copies of the articles as JPG images, and even PDFs. While the web interface will only show you the first 2,000 results matching your search, the Newspaper & Gazette Harvester will get everything.

The Jupyter notebooks in this repository use the Trove Newspaper and Gazette Harvester to download large quantities of digitised newspaper articles from Trove. There’s also a few examples of how you can analyse and explore the harvested data.

The notebooks include:

See the GLAM Workbench for more details.

Cite as

See the GLAM Workbench or Zenodo for up-to-date citation details.


This repository is part of the GLAM Workbench.
If you think this project is worthwhile, you might like to sponsor me on GitHub.

" + "description": "

Current version: v1.3.0

The Trove Newspaper & Gazette Harvester makes it easy to download large quantities of digitised articles from Trove’s newspapers and gazettes. Just give it a search from the Trove web interface, and the harvester will save the metadata of all the articles in a CSV (spreadsheet) file for further analysis. You can also save the full text of every article, as well as copies of the articles as JPG images, and even PDFs. While the web interface will only show you the first 2,000 results matching your search, the Newspaper & Gazette Harvester will get everything.

The Jupyter notebooks in this repository use the Trove Newspaper and Gazette Harvester to download large quantities of digitised newspaper articles from Trove. There are also a few examples of how you can analyse and explore the harvested data.

The notebooks include:

See the GLAM Workbench for more details.

Cite as

See the GLAM Workbench or Zenodo for up-to-date citation details.


This repository is part of the GLAM Workbench.
If you think this project is worthwhile, you might like to sponsor me on GitHub.

" } diff --git a/README.md b/README.md index 4a9c316..d4ef616 100644 --- a/README.md +++ b/README.md @@ -1,6 +1,6 @@ # Trove Newspaper and Gazette Harvester -Current version: [v1.2.2](https://github.com/GLAM-Workbench/trove-newspaper-harvester/releases/tag/v1.2.2) +Current version: [v1.3.0](https://github.com/GLAM-Workbench/trove-newspaper-harvester/releases/tag/v1.3.0) The [Trove Newspaper & Gazette Harvester Harvester](https://pypi.org/project/trove-newspaper-harvester/) makes it easy to download large quantities of digitised articles from Trove's newspapers and gazettes. Just give it a search from the Trove web interface, and the harvester will save the metadata of all the articles in a CSV (spreadsheet) file for further analysis. You can also save the full text of every article, as well as copies of the articles as JPG images, and even PDFs. While the web interface will only show you the first 2,000 results matching your search, the Newspaper & Gazette Harvester will get **everything**. diff --git a/harvest-specific-days.ipynb b/harvest-specific-days.ipynb new file mode 100644 index 0000000..c1083d8 --- /dev/null +++ b/harvest-specific-days.ipynb @@ -0,0 +1,537 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "a2cca763-3b3e-42a6-9381-c9478d574abd", + "metadata": {}, + "source": [ + "# Harvesting articles that mention \"Anzac Day\" on Anzac Day\n", + "\n", + "The Trove Newspaper Harvester web app and command-line tool make it easy for you to harvest the results of a single search. But if you want to harvest very large or complex searches, you might find it easier to import the `trove_newspaper_harvester` library directly and take control of the harvesting process.\n", + "\n", + "For example, how would you harvest all of the newspaper articles mentioning \"Anzac Day\" that were published *on* Anzac Day, 25 April? It's possible to search for results from a single day using the `date` index. 
So, theoretically, you could combine multiple dates using `OR` and build a very long search query by doing something like this:\n", + "\n", + "``` python\n", + "days = []\n", + "for year in range(1916, 1955):\n", + " days.append(f\"date:[{year}-04-24T00:00:00Z TO {year}-04-25T00:00:00Z]\")\n", + "query_string = f'\"anzac day\" AND ({\" OR \".join(days)})'\n", + "```\n", + "\n", + "However, if you try searching in Trove using the query string generated by this code it [returns no results](https://trove.nla.gov.au/search/category/newspapers?keyword=%22anzac%20day%22%20AND%20%28date%3A%5B1916-04-24T00%3A00%3A00Z%20TO%201916-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1917-04-24T00%3A00%3A00Z%20TO%201917-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1918-04-24T00%3A00%3A00Z%20TO%201918-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1919-04-24T00%3A00%3A00Z%20TO%201919-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1920-04-24T00%3A00%3A00Z%20TO%201920-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1921-04-24T00%3A00%3A00Z%20TO%201921-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1922-04-24T00%3A00%3A00Z%20TO%201922-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1923-04-24T00%3A00%3A00Z%20TO%201923-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1924-04-24T00%3A00%3A00Z%20TO%201924-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1925-04-24T00%3A00%3A00Z%20TO%201925-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1926-04-24T00%3A00%3A00Z%20TO%201926-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1927-04-24T00%3A00%3A00Z%20TO%201927-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1928-04-24T00%3A00%3A00Z%20TO%201928-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1929-04-24T00%3A00%3A00Z%20TO%201929-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1930-04-24T00%3A00%3A00Z%20TO%201930-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1931-04-24T00%3A00%3A00Z%20TO%201931-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1932-04-24T00%3A00%3A00Z%20TO%201932-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1933-04-24T00%3A00%3A00Z%20TO%201933-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1934-04-24T00%3A00%3A0
0Z%20TO%201934-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1935-04-24T00%3A00%3A00Z%20TO%201935-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1936-04-24T00%3A00%3A00Z%20TO%201936-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1937-04-24T00%3A00%3A00Z%20TO%201937-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1938-04-24T00%3A00%3A00Z%20TO%201938-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1939-04-24T00%3A00%3A00Z%20TO%201939-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1940-04-24T00%3A00%3A00Z%20TO%201940-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1941-04-24T00%3A00%3A00Z%20TO%201941-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1942-04-24T00%3A00%3A00Z%20TO%201942-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1943-04-24T00%3A00%3A00Z%20TO%201943-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1944-04-24T00%3A00%3A00Z%20TO%201944-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1945-04-24T00%3A00%3A00Z%20TO%201945-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1946-04-24T00%3A00%3A00Z%20TO%201946-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1947-04-24T00%3A00%3A00Z%20TO%201947-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1948-04-24T00%3A00%3A00Z%20TO%201948-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1949-04-24T00%3A00%3A00Z%20TO%201949-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1950-04-24T00%3A00%3A00Z%20TO%201950-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1951-04-24T00%3A00%3A00Z%20TO%201951-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1952-04-24T00%3A00%3A00Z%20TO%201952-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1953-04-24T00%3A00%3A00Z%20TO%201953-04-25T00%3A00%3A00Z%5D%20OR%20date%3A%5B1954-04-24T00%3A00%3A00Z%20TO%201954-04-25T00%3A00%3A00Z%5D%29). Presumably it has hit a limit on query length. But even if you reduce the span of years you can get some odd results. 
It seems safer to search for each day independently, but how can you do that without manually creating lots of separate harvests?\n", + "\n", + "The example below does the following:\n", + "\n", + "- imports the `Harvester` class and `prepare_query` function from the `trove_newspaper_harvester` library\n", + "- uses `prepare_query` to create the basic set of parameters (without the date search)\n", + "- loops through the desired span of years, adding the date search to the query, initialising the `Harvester`, running the harvest, and saving the results as a CSV file\n", + "\n", + "It also uses the `data_dir` and `harvest_dir` parameters of `Harvester` to tell it where to save the results. These options help you keep related searches together. In this instance, all the searches are saved in the `anzac-day` parent directory, with each individual search saved in a directory named after the year of the search query. So you end up with one results directory for each year in the span. The separate results files can be easily combined, as shown below."
+ ] + }, + { + "cell_type": "markdown", + "id": "350d61ed-9536-4830-8eee-0b481ceabd10", + "metadata": {}, + "source": [ + "## Set things up" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "id": "27667834-d179-4e21-8294-7dd43cc46b11", + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + "from pathlib import Path\n", + "\n", + "import pandas as pd\n", + "\n", + "# importing the trove_newspaper_harvester!\n", + "from trove_newspaper_harvester.core import Harvester, get_metadata, prepare_query" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "73853861-8c9f-430b-8b15-73ca36aa9c30", + "metadata": {}, + "outputs": [], + "source": [ + "%%capture\n", + "# Load variables from the .env file if it exists\n", + "# Use %%capture to suppress messages\n", + "%load_ext dotenv\n", + "%dotenv" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "892af7ae-14fd-4f42-8d6b-0289b0576f10", + "metadata": {}, + "outputs": [], + "source": [ + "# Insert your Trove API key\n", + "API_KEY = \"YOUR API KEY\"\n", + "\n", + "# Use api key value from environment variables if it is available\n", + "if os.getenv(\"TROVE_API_KEY\"):\n", + " API_KEY = os.getenv(\"TROVE_API_KEY\")" + ] + }, + { + "cell_type": "markdown", + "id": "9aaf407a-b0cf-4731-ace2-f76d9b4a2999", + "metadata": {}, + "source": [ + "## Run the harvester\n", + "\n", + "First of all we use `prepare_query` to create a base set of parameters. We'll feed it a search for the term \"anzac day\" and then add in the dates later." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "24991234-a03a-40af-91c8-f107138a9c56", + "metadata": {}, + "outputs": [], + "source": [ + "query = 'https://trove.nla.gov.au/search/category/newspapers?keyword=\"anzac day\"'\n", + "query_params = prepare_query(query=query, api_key=API_KEY)" + ] + }, + { + "cell_type": "markdown", + "id": "0d559f30-e620-4112-ba0d-20853e214aa9", + "metadata": {}, + "source": [ + "Next we'll loop through our desired span of years, harvesting the results for each Anzac Day. For demonstration purposes I'll use a short span, harvesting results for the years 1916 to 1919. But you could just as easily harvest results from 1916 to the present." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "5958b7f7-04c3-4b1f-9a82-0fb2276e41e5", + "metadata": {}, + "outputs": [], + "source": [ + "# Loop through the desired span of years\n", + "# Note that the end of the range is not inclusive, so set it to one more than the last year you want.\n", + "# This loop covers 1916, 1917, 1918 and 1919, but not 1920.\n", + "for year in range(1916, 1920):\n", + " # Copy the base params\n", + " params = query_params.copy()\n", + " # Add the date search to the query string\n", + " params[\n", + " \"q\"\n", + " ] = f\"{query_params['q']} date:[{year}-04-24T00:00:00Z TO {year}-04-25T00:00:00Z]\"\n", + "\n", + " # Initialise the harvester\n", + " # The data_dir parameter sets the parent directory, in this case \"anzac-day\"\n", + " # The harvest_dir parameter sets the directory, within the parent directory, where the current set of results will be saved;\n", + " # in this case the results directory will be named after the year\n", + " harvester = Harvester(\n", + " query_params=params, data_dir=\"anzac-day\", harvest_dir=str(year)\n", + " )\n", + "\n", + " # Harvest the results\n", + " harvester.harvest()\n", + "\n", + " # Convert the JSON results to CSV\n", + " harvester.save_csv()" + ] + }, + { + "cell_type": 
"markdown", + "id": "8acb581f-47fa-4e42-b542-bfdc62506cc4", + "metadata": {}, + "source": [ + "The result of this code will be a series of directories and files like this:\n", + "\n", + "```\n", + "- anzac-day\n", + " - 1916\n", + " - results.csv\n", + " - metadata.json\n", + " - results.ndjson\n", + " - 1917\n", + " - results.csv\n", + " - metadata.json\n", + " - results.ndjson\n", + " - 1918\n", + " - results.csv\n", + " - metadata.json\n", + " - results.ndjson\n", + " - 1919\n", + " - results.csv\n", + " - metadata.json\n", + " - results.ndjson\n", + "```" + ] + }, + { + "cell_type": "markdown", + "id": "70aaac3e-7e87-4fad-a6cb-bb1c5507f518", + "metadata": {}, + "source": [ + "We can look at the results of any of the individual harvests using `get_metadata`. For example:" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "id": "9d620f18-bf41-4207-b713-ceb4459afe96", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "{'query_parameters': {'q': '\"anzac day\" date:[1916-04-24T00:00:00Z TO 1916-04-25T00:00:00Z]',\n", + " 'zone': 'newspaper',\n", + " 'key': \"IT'S A SECRET\",\n", + " 'encoding': 'json',\n", + " 'reclevel': 'full',\n", + " 'bulkHarvest': 'true'},\n", + " 'harvest_directory': 'anzac-day/1916',\n", + " 'max': 315,\n", + " 'text': False,\n", + " 'pdf': False,\n", + " 'image': False,\n", + " 'include_linebreaks': False,\n", + " 'date_started': '2023-03-16T02:37:24.028880+00:00',\n", + " 'harvester': 'trove_newspaper_harvester v0.6.5',\n", + " 'harvested': 315}" + ] + }, + "execution_count": 6, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Get the harvest metadata for 1916\n", + "metadata = get_metadata(\"anzac-day/1916\")\n", + "\n", + "# This is just to obscure my API key which is embedded in the metadata\n", + "metadata[\"query_parameters\"][\"key\"] = \"IT'S A SECRET\"\n", + "\n", + "# Display the redacted metadata!\n", + "metadata" + ] + }, + { + "cell_type": "markdown", + "id": 
"7da50d15-842e-412b-a457-cd4c3ef9bf0f", + "metadata": {}, + "source": [ + "## Combine results\n", + "\n", + "After harvesting the data above, the results for each year will be in a separate directory. If you want to join the result sets together, you can do something like this to create a single dataframe." + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "98a4e539-7f99-4cf9-9958-d0794f166e54", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
" + ], + "text/plain": [ + " article_id title date page newspaper_id \\\n", + "0 102545637 CHURCH OF ENGLAND. ANZAC DAY. 1916-04-25 2 348 \n", + "1 102545649 Advertising 1916-04-25 2 348 \n", + "2 102545658 ANZAC DAY AT PORT PIRIE. 1916-04-25 2 348 \n", + "3 1040069 Classified Advertising 1916-04-25 2 10 \n", + "4 1040072 ANZAC DAY. 1916-04-25 8 10 \n", + "\n", + " newspaper_title category words \\\n", + "0 Port Pirie Recorder and North Western Mail (SA... Article 52 \n", + "1 Port Pirie Recorder and North Western Mail (SA... Advertising 823 \n", + "2 Port Pirie Recorder and North Western Mail (SA... Article 66 \n", + "3 The Mercury (Hobart, Tas. : 1860 - 1954) Advertising 3816 \n", + "4 The Mercury (Hobart, Tas. : 1860 - 1954) Article 89 \n", + "\n", + " illustrated edition ... snippet \\\n", + "0 N NaN ... There will be a Celebration of Holy Communion ... \n", + "1 N NaN ... NaN \n", + "2 N NaN ... Anzac Day will be officially commemorated in t... \n", + "3 N NaN ... NaN \n", + "4 N NaN ... May I inquire if on Anzac Day in Hobart any se... 
\n", + "\n", + " relevance corrections last_corrected tags comments lists text pdf \\\n", + "0 217.184250 0 NaN 0 0 0 NaN NaN \n", + "1 0.871224 0 NaN 0 0 0 NaN NaN \n", + "2 217.793880 0 NaN 0 0 0 NaN NaN \n", + "3 0.463171 0 NaN 0 0 0 NaN NaN \n", + "4 285.078250 0 NaN 0 0 0 NaN NaN \n", + "\n", + " images \n", + "0 NaN \n", + "1 NaN \n", + "2 NaN \n", + "3 NaN \n", + "4 NaN \n", + "\n", + "[5 rows x 24 columns]" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# A list to hold all the dataframes\n", + "dfs = []\n", + "\n", + "# Loop through the span of years\n", + "for year in range(1916, 1920):\n", + " # Convert the results CSV file to a dataframe and add to the list of dfs\n", + " dfs.append(pd.read_csv(Path(\"anzac-day\", str(year), \"results.csv\")))\n", + "\n", + "# Combine the dataframes into one\n", + "df = pd.concat(dfs)\n", + "\n", + "# View a sample\n", + "df.head()" + ] + }, + { + "cell_type": "markdown", + "id": "53cd2737-5809-4428-bbee-d31710d93879", + "metadata": {}, + "source": [ + "To make sure we have the combined results, we can look at the number of articles by each Anzac Day." + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "id": "46f41296-5d2d-4442-962f-b09a07a69c2b", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "1917-04-25 445\n", + "1918-04-25 384\n", + "1919-04-25 344\n", + "1916-04-25 315\n", + "Name: date, dtype: int64" + ] + }, + "execution_count": 8, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df[\"date\"].value_counts()" + ] + }, + { + "cell_type": "markdown", + "id": "176f4b83-6a56-4118-a131-44d8e455b567", + "metadata": {}, + "source": [ + "----\n", + "\n", + "Created by [Tim Sherratt](https://timsherratt.org) ([@wragge](https://twitter.com/wragge)) for the [GLAM Workbench](https://github.com/glam-workbench/). 
\n", + "Support this project by [becoming a GitHub sponsor](https://github.com/sponsors/wragge?o=esb).\n" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.8.12" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +}