mirror of
https://github.com/dataforcanada/d4c-datapkg-statistical.git
synced 2026-06-13 14:10:55 +02:00
Process 2024-12 national address register. Still need to make some improvements
This commit is contained in:
Executable
+38
@@ -0,0 +1,38 @@
|
||||
#!/bin/bash
|
||||
|
||||
INPUT_FOLDER="${DATA_FOLDER}/national_address_register/input"
|
||||
EXTRACTED_FOLDER="${DATA_FOLDER}/national_address_register/extracted"
|
||||
|
||||
process_202412() {
|
||||
# Process 2024-12 vintage
|
||||
# Extract files
|
||||
echo "Extracting ${INPUT_FOLDER}/2024-12/202412.zip to ${EXTRACTED_FOLDER}/2024-12"
|
||||
unzip -q -n ${INPUT_FOLDER}/2024-12/202412.zip -d ${EXTRACTED_FOLDER}/2024-12
|
||||
jupyter execute process_2024_12.ipynb
|
||||
}
|
||||
|
||||
process_202406() {
|
||||
# Process 2024-06 vintage
|
||||
echo "Extracting ${INPUT_FOLDER}/2024.zip"
|
||||
unzip -q -n ${INPUT_FOLDER}/2024.zip -d ${EXTRACTED_FOLDER}/2024-06
|
||||
# Encoding is utf-8
|
||||
}
|
||||
|
||||
process_2023() {
|
||||
# Process 2023
|
||||
echo "Extracting ${INPUT_FOLDER}/2023.zip"
|
||||
unzip -q -n ${INPUT_FOLDER}/2023.zip -d ${EXTRACTED_FOLDER}/2023
|
||||
# Encoding is latin-1
|
||||
}
|
||||
|
||||
process_2022() {
|
||||
# Process 2022
|
||||
echo "Extracting ${INPUT_FOLDER}/2022.zip"
|
||||
unzip -q -n ${INPUT_FOLDER}/2022.zip -d ${EXTRACTED_FOLDER}/2022
|
||||
# Encoding is latin-1
|
||||
}
|
||||
|
||||
process_202412
|
||||
#process_202406
|
||||
#process_2023
|
||||
#process_2022
|
||||
Reference in New Issue
Block a user