#!/usr/bin/env python
# coding: utf-8
import os
import sys

import geopandas as gpd
import pandas as pd
from sqlalchemy import create_engine
from sqlalchemy import text

# Input: the PN.csv table extracted from the 2021 GeoSuite download.
placenames_2021_csv = "/home/jovyan/work/process-statcan-data/data/geosuite/extracted/2021_92-150-X_eng/PN.csv"

# Warehouse connection settings come from the environment; os.environ.get
# returns None for any variable that is not set.
DATABASE = os.environ.get("POSTGRES_DB")
HOST = os.environ.get("WAREHOUSE_PG_HOST")
USER = os.environ.get("POSTGRES_USER")
PASSWORD = os.environ.get("POSTGRES_PASSWORD")

# NOTE(review): engine creation is disabled here, so nothing in this cell uses
# the connection settings above -- confirm whether a later cell needs it.
#engine = create_engine(f"postgresql://{USER}:{PASSWORD}@{HOST}:5432/{DATABASE}")

# Source column -> output column. The keys double as the `usecols` selection so
# the list of columns read and the list of columns renamed cannot drift apart.
PLACENAME_COLUMNS = {
    "PNdguid": "pn_dguid",
    "PNname": "pn_name",
    "PNsource": "pn_source",
    "PNrplat": "latitude",
    "PNrplong": "longitude",
}

print(f"Reading {placenames_2021_csv}")

# Decode as Windows-1252 rather than latin-1: with latin-1 the byte 0x96 in
# names such as "Cascapédia\x96Saint-Jules" became an invisible C1 control
# character, whereas cp1252 maps it to the intended en dash. Accented letters
# decode identically under both codecs.
# NOTE(review): cp1252 raises UnicodeDecodeError on the five bytes it leaves
# undefined (0x81, 0x8D, 0x8F, 0x90, 0x9D); presumably absent from this file.
#
# `.rename()` returns a new frame (no `inplace=True`), so re-running this cell
# always rebuilds `placenames` from the CSV.
placenames = pd.read_csv(
    filepath_or_buffer=placenames_2021_csv,
    encoding="cp1252",
    usecols=list(PLACENAME_COLUMNS),
).rename(columns=PLACENAME_COLUMNS)