In [1]:
import pandas as pd
import numpy as np
from process import *

In [2]:
# Instantiate helper
ftp_h = FTPHelper(URL, USERNAME, PASSWORD)

In [3]:
# Create a pandas.df to store the list of available files.
df = pd.DataFrame(data=ftp_h.list_files(), columns=["name"])

# Rearrange the content of the pandas df.
df = pd.concat([df, df["name"].str.split("_", expand=True)], axis=1)
df = df.rename(columns = {
    0:"dataset", 1:"version", 2:"res", 3:"filetype", 4:"crs", 
    5:"dep", 6:"date"})

# Loc the dataset of interest RGE Alti 5m.
df = df.loc[(df.dataset == "RGEALTI") & (df.res == "1M")]

# Clean the date and set the name as index.
df['date'] = df['date'].apply(lambda x:x[:-3])
df = df.set_index("name")

df

Unnamed: 0_level_0,dataset,version,res,filetype,crs,dep,date
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
RGEALTI_2-0_1M_ASC_LAMB93-IGN69_D001_2020-11-13.7z,RGEALTI,2-0,1M,ASC,LAMB93-IGN69,D001,2020-11-13
RGEALTI_2-0_1M_ASC_LAMB93-IGN69_D002_2020-09-04.7z,RGEALTI,2-0,1M,ASC,LAMB93-IGN69,D002,2020-09-04
RGEALTI_2-0_1M_ASC_LAMB93-IGN69_D003_2021-08-25.7z,RGEALTI,2-0,1M,ASC,LAMB93-IGN69,D003,2021-08-25
RGEALTI_2-0_1M_ASC_LAMB93-IGN69_D004_2021-08-04.7z.001,RGEALTI,2-0,1M,ASC,LAMB93-IGN69,D004,2021-08-04.7z.
RGEALTI_2-0_1M_ASC_LAMB93-IGN69_D004_2021-08-04.7z.002,RGEALTI,2-0,1M,ASC,LAMB93-IGN69,D004,2021-08-04.7z.
...,...,...,...,...,...,...,...
RGEALTI_2-0_1M_ASC_RGR92UTM40S-REUN89_D974_2016-03-11.7z,RGEALTI,2-0,1M,ASC,RGR92UTM40S-REUN89,D974,2016-03-11
RGEALTI_2-0_1M_ASC_RGSPM06U21-STPM50_D975_2017-03-27.7z,RGEALTI,2-0,1M,ASC,RGSPM06U21-STPM50,D975,2017-03-27
RGEALTI_2-0_1M_ASC_WGS84UTM20-GUAD88_D971_2014-01-15.7z,RGEALTI,2-0,1M,ASC,WGS84UTM20-GUAD88,D971,2014-01-15
RGEALTI_2-0_1M_ASC_WGS84UTM20-GUAD92LD_D971_2013-12-11.7z,RGEALTI,2-0,1M,ASC,WGS84UTM20-GUAD92LD,D971,2013-12-11


In [4]:
ROI = 'Auvergne-Rhône-Alpes'

deps_of_interest = REGIONS[ROI]
deps_of_interest = ["D0"+dn for dn in deps_of_interest]

# Loc lines of interest in the pandas.df.
dfi = df.loc[df.dep.isin(deps_of_interest)]
filenames = dfi.index.to_list()

In [5]:
for num, filename in enumerate(filenames):
    if filename in os.listdir(TEMP_ZIP):
        print(filename, "already downloaded")
    else:
        ftp_h.download_file(filename, TEMP_ZIP)

RGEALTI_2-0_1M_ASC_LAMB93-IGN69_D001_2020-11-13.7z already downloaded
RGEALTI_2-0_1M_ASC_LAMB93-IGN69_D003_2021-08-25.7z already downloaded
RGEALTI_2-0_1M_ASC_LAMB93-IGN69_D007_2021-11-02.7z already downloaded


  0%|          | 0.00/5.96G [00:00<?, ?B/s]

RGEALTI_2-0_1M_ASC_LAMB93-IGN69_D015_2019-12-10.7z is downloaded.


  0%|          | 0.00/5.26G [00:00<?, ?B/s]

RGEALTI_2-0_1M_ASC_LAMB93-IGN69_D026_2021-11-02.7z is downloaded.


  0%|          | 0.00/6.00G [00:00<?, ?B/s]

RGEALTI_2-0_1M_ASC_LAMB93-IGN69_D038_2020-11-13.7z.001 is downloaded.


  0%|          | 0.00/366M [00:00<?, ?B/s]

RGEALTI_2-0_1M_ASC_LAMB93-IGN69_D038_2020-11-13.7z.002 is downloaded.


  0%|          | 0.00/4.07G [00:00<?, ?B/s]

RGEALTI_2-0_1M_ASC_LAMB93-IGN69_D042_2021-01-22.7z is downloaded.


  0%|          | 0.00/5.61G [00:00<?, ?B/s]

RGEALTI_2-0_1M_ASC_LAMB93-IGN69_D043_2020-01-06.7z is downloaded.


  0%|          | 0.00/5.48G [00:00<?, ?B/s]

RGEALTI_2-0_1M_ASC_LAMB93-IGN69_D063_2021-01-22.7z is downloaded.


  0%|          | 0.00/2.36G [00:00<?, ?B/s]

RGEALTI_2-0_1M_ASC_LAMB93-IGN69_D069_2020-11-13.7z is downloaded.


  0%|          | 0.00/6.00G [00:00<?, ?B/s]

RGEALTI_2-0_1M_ASC_LAMB93-IGN69_D073_2020-10-15.7z.001 is downloaded.


  0%|          | 0.00/721M [00:00<?, ?B/s]

RGEALTI_2-0_1M_ASC_LAMB93-IGN69_D073_2020-10-15.7z.002 is downloaded.


  0%|          | 0.00/4.67G [00:00<?, ?B/s]

RGEALTI_2-0_1M_ASC_LAMB93-IGN69_D074_2020-10-15.7z is downloaded.


In [None]:
    extract_rge5m(filename)
    asc_paths_list = get_path_asc_paths(filename)
    result_path = os.path.join(DATAPATH, "result")
    mosaic_name = f"mymosaic_{ROI}_{num+1}.tif"
    mosaic_path = create_rge_mosaic(asc_paths_list, result_path, mosaic_name, 2154)