@@ -1,6 +1,8 @@
 import os
 import requests
 import pandas as pd
+import re
+import json
 
 from bs4 import BeautifulSoup
 
@@ -27,6 +29,20 @@ def get_link():
     soup = BeautifulSoup(response.text, 'html.parser')
     link = soup.find_all('a', {'class': 'mtli_attachment'})
     link = link[0].get('href')
+    # Extract the date using regex
+    date_match = re.search(r'v(\d{8})\.xlsx', link)
+    if date_match:
+        new_version = date_match.group(1)
+        dpfile = 'datapackage.json'
+        with open(dpfile, 'r', encoding='utf-8') as f:
+            datapackage = json.load(f)
+
+        old_version = datapackage.get('version', 'unknown')
+        datapackage['version'] = new_version
+
+        with open(dpfile, 'w', encoding='utf-8') as f:
+            json.dump(datapackage, f, indent=2, ensure_ascii=False)
+
     return link
 
 def retrieve_content(link):
@@ -49,7 +65,7 @@ def convert_dms(dms):
     degrees = int(dms_values[0])
     minutes = int(dms_values[1])
     seconds = float(dms_values[2])
-
+
     return dms_to_decimal(degrees, minutes, seconds, direction)
 
 def transform_csv():
@@ -76,4 +92,4 @@ def clean_up():
 link = get_link()
 retrieve_content(link)
 transform_csv()
-clean_up()
+clean_up()