download data and fix xyz file import
anikaweinmann committed Feb 15, 2024
1 parent b4b6da6 commit 80e4104
Showing 2 changed files with 102 additions and 10 deletions.
55 changes: 45 additions & 10 deletions src/grass_gis_helpers/data_import.py
@@ -30,8 +30,8 @@

import grass.script as grass

-from grass_gis_helpers.general import communicate_grass_command
-
+from .cleanup import rm_vects
+from .general import communicate_grass_command
from .raster import adjust_raster_resolution, rename_raster


@@ -70,6 +70,41 @@ def downloaad_and_import_tindex(tindex_url, output, download_dir)
        os.chdir(cur_dir)


def get_list_of_tindex_locations(tindex, aoi=None):
    """Select the locations of the tindex which overlap with the AOI or
    the current region.

    Args:
        tindex (str): Name of the tindex vector map
        aoi (str): Name of the AOI vector map
    Returns:
        tiles (list): List of locations which overlap with the AOI or the
            current region
    """
    tindex_clipped = f"clipped_tindex_vect_{grass.tempname(8)}"
    try:
        v_clip_kwargs = {
            "input": tindex,
            "output": tindex_clipped,
            "flags": "d",
            "quiet": True,
        }
        if aoi:
            v_clip_kwargs["clip"] = aoi
        else:
            # without an AOI, clip to the current region (r flag)
            v_clip_kwargs["flags"] += "r"
        grass.run_command("v.clip", **v_clip_kwargs)
        # read the "location" column of the clipped tindex
        tiles = [
            val[0]
            for val in grass.vector_db_select(
                tindex_clipped, columns="location"
            )["values"].values()
        ]
    finally:
        rm_vects([tindex_clipped])
    return tiles
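
A minimal usage sketch of the new helper (map names and the URL below are hypothetical; assumes an active GRASS GIS session, since the helpers call GRASS modules):

from grass_gis_helpers.data_import import (
    downloaad_and_import_tindex,
    get_list_of_tindex_locations,
)

# download the tile index and import it as the vector map "dop_tindex"
downloaad_and_import_tindex(
    "https://example.com/tindex.gpkg.gz",  # placeholder URL
    "dop_tindex",
    "/tmp/downloads",
)

# list only the tiles overlapping the AOI vector map "my_aoi"; without
# aoi, the current computational region is used (v.clip "r" flag)
for tile in get_list_of_tindex_locations("dop_tindex", aoi="my_aoi"):
    print(tile)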


def import_local_raster_data(
    aoi,
    basename,
@@ -198,16 +233,16 @@ def get_xyz_file_infos(xyz_file):
    # e.g.: Pixel Size = (1.000000000000000,1.000000000000000)
    res = float(stdout.split("Pixel Size = (")[1].split(",")[0])
    # get bbox
-    bbox_w = float(
+    bbox_x1 = float(
        stdout.split("Upper Left")[1].replace("(", "").split(",")[0].strip()
    )
-    bbox_e = float(
+    bbox_x2 = float(
        stdout.split("Upper Right")[1].replace("(", "").split(",")[0].strip()
    )
-    bbox_s = float(
+    bbox_y1 = float(
        stdout.split("Upper Left")[1].split(",")[1].split(")")[0].strip()
    )
-    bbox_n = float(
+    bbox_y2 = float(
        stdout.split("Lower Left")[1].split(",")[1].split(")")[0].strip()
    )
    # check if shift is needed
@@ -216,10 +251,10 @@
    shift_needed = True
    half_res = res / 2.0
    if (
-        bbox_w % res == half_res
-        and bbox_e % res == half_res
-        and bbox_s % res == half_res
-        and bbox_n % res == half_res
+        bbox_x1 % res != half_res
+        and bbox_x2 % res != half_res
+        and bbox_y1 % res != half_res
+        and bbox_y2 % res != half_res
    ):
        shift_needed = False
    # get region of the xyz file
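
The corrected condition above skips the half-pixel shift only when none of the corner coordinates lies on a half-resolution offset. A standalone sketch of the same modulo test (coordinate values are made-up examples):

res = 1.0
half_res = res / 2.0  # 0.5

# a corner-registered coordinate (350000.0 % 1.0 == 0.0) needs no shift;
# a cell-center coordinate (350000.5 % 1.0 == 0.5) needs the half-pixel shift
for west in (350000.0, 350000.5):
    shift_needed = west % res == half_res
    print(f"{west}: shift needed -> {shift_needed}")
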
57 changes: 57 additions & 0 deletions src/grass_gis_helpers/open_geodata_germany/download_data.py
@@ -21,7 +21,11 @@
#
############################################################################

from multiprocessing.pool import ThreadPool
import os
import requests
from zipfile import ZipFile

import grass.script as grass


@@ -47,3 +51,56 @@ def check_download_dir(download_dir):
        os.makedirs(download_dir)
    grass.message(f"Download directory: {download_dir}")
    return download_dir


def url_response(url):
    """Download a single URL into the current working directory; used by
    download_data_using_threadpool.

    Args:
        url (str): Data download URL
    Returns:
        url (str): The URL, returned for printing
    """
    filename = os.path.basename(url)
    response = requests.get(url, stream=True)
    # stream the response body to disk in chunks
    with open(filename, "wb") as f:
        for chunk in response:
            f.write(chunk)
    return url


def download_data_using_threadpool(urls, download_dir, nprocs):
    """Download data from URLs in parallel via ThreadPool.

    Args:
        urls (list): List with data download URLs
        download_dir (str): Path to directory where the data should be
            downloaded
        nprocs (int): The number of worker threads to use; if nprocs is
            None, the number returned by os.cpu_count() is used
    """
    cur_dir = os.getcwd()
    try:
        os.chdir(download_dir)
        # run the downloads concurrently in a thread pool
        with ThreadPool(nprocs) as pool:
            results = pool.imap_unordered(url_response, urls)
            grass.message(_("Downloading data from URLs:"))
            for result in results:
                print(result)
    finally:
        os.chdir(cur_dir)
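
A usage sketch for the new download helpers (URLs and paths below are placeholders; assumes an active GRASS GIS session):

from grass_gis_helpers.open_geodata_germany.download_data import (
    check_download_dir,
    download_data_using_threadpool,
)

urls = [
    "https://example.com/tile_1.zip",  # placeholder URLs
    "https://example.com/tile_2.zip",
]
download_dir = check_download_dir("/tmp/downloads")
# fetch both files with two worker threads
download_data_using_threadpool(urls, download_dir, 2)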


def extract_compressed_files(file_names, download_dir):
    """Extract compressed files to the download directory.

    Args:
        file_names (list): List with compressed (e.g. zip) file names which
            are stored in the download_dir
        download_dir (str): Path to directory where the data should be
            downloaded
    """
    for file_name in file_names:
        file = os.path.join(download_dir, file_name)
        with ZipFile(file, "r") as zip_obj:
            # extract all contents of the zip file into the download directory
            zip_obj.extractall(download_dir)
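
Continuing the download sketch above, the fetched archives could then be unpacked in place (file names are placeholders):

from grass_gis_helpers.open_geodata_germany.download_data import (
    extract_compressed_files,
)

extract_compressed_files(
    ["tile_1.zip", "tile_2.zip"],  # placeholder zip names
    "/tmp/downloads",
)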
