In [1]:
from multiprocessing import Process
import numpy as np
import pandas as pd
import requests
from tqdm import tqdm

import cv2
import netCDF4 as nc
import matplotlib.pyplot as plt
from matplotlib.patches import Polygon

import json

from subprocess import run, DEVNULL

from torch.nn import Sequential, Sigmoid
from torch import from_numpy, inference_mode
from torch.nn import DataParallel

from monai.networks.nets import SwinUNETR
from monai.inferers import sliding_window_inference

from pytorch_lightning import LightningModule

from zipfile import ZipFile
from zipfile import BadZipFile

import xmltodict

import os
from os.path import join, exists, getsize, isfile

In [2]:
class DownloadSARSentinel:
    def __init__(self, email, 
             password,
             product_list,
             satellite="sentinel_1"
                ):
        self.password = password
        self.email = email
        self.product_list = product_list
        self.satellite = satellite
        self.raw_folder = None
        self._query_result = None

    def query_result(self):
        if not isinstance(self._query_result, pd.DataFrame):
            self._query_result = self.query_sar()
        return self._query_result
        
    def query_sar(self):
        API_URL_NAME = "https://catalogue.dataspace.copernicus.eu/odata/v1/Products?$filter=contains(Name,'{name}')"
        query_result = pd.DataFrame()

        for product in self.product_list:
            json = requests.get(API_URL_NAME.format(name=product)).json()
            response_result = pd.DataFrame.from_dict(json['value'])

            if not response_result.empty:
                print("Found:", product)
                query_result = pd.concat([query_result, response_result])   
                #yield response_result
            else:
                print("Could not find: ", product)

        return query_result
        
    @staticmethod
    def create_folder(folder_path, original_name):
        if not folder_path:
            folder_path = join(os.getcwd(), original_name)
            if not exists(folder_path):
                os.mkdir(folder_path)

        assert exists(folder_path), f"Path not found: {folder_path}"
        return folder_path

    @staticmethod
    def is_downloaded(sar_name, folder):
        sar_path = join(folder, sar_name + ".zip")
        if exists(sar_path):
            #if getsize(sar_path) > 5E9: #ver o tamanho do arquivo para baixar arquivos incompletos
            return True
        return False

    def return_headers(self):
        token_url = 'https://identity.dataspace.copernicus.eu/auth/realms/CDSE/protocol/openid-connect/token'
        headers = {'Content-Type': 'application/x-www-form-urlencoded'}
        data = {
            'grant_type': 'password',
            'username': self.email,
            'password': self.password,
            'client_id': 'cdse-public'
        }
        token_response = requests.post(token_url, headers=headers, data=data).json()
        token_url = token_response["access_token"]
        download_headers = {"Authorization": f"Bearer {token_url}"}
        return download_headers

    def download_products(self, folder, overwrite=False):
        download_url = "https://zipper.dataspace.copernicus.eu/odata/v1/Products({product_id})/$value"

        for index, product in self.query_result().iterrows():
            path_product = join(folder, product["Name"] + ".zip")               
            if not DownloadSARSentinel.is_downloaded(product["Name"], folder) or overwrite:
                session = requests.Session()
                session.headers.update(self.return_headers())
                response = session.get(download_url.format(product_id=product["Id"]), headers=self.return_headers(), stream=True)
                total_size = int(response.headers.get('Content-Length', 0))
                progress_bar = tqdm(total=total_size, unit='B', unit_scale=True, desc=f'Downloading: {product["Name"]}', leave=True)
    
                with open(path_product, "wb") as file:
                    for chunk in response.iter_content(chunk_size=8192):
                        if chunk:
                            file.write(chunk)
                            progress_bar.update(len(chunk))
                progress_bar.reset()




        

In [3]:
QUERY_CSV_PATH = "/mnt/camobi_2/PHMG/Sentinel_Acquisition/New_sar_img.csv"
FILE_NAME_COLUMN = "NOME DO ARQUIVO"
RAW_SAFE_FILE = "/mnt/camobi_process/new_data/new_SAR_img"
UNZIP_SAFE_FILE = "/mnt/camobi_process/new_data/unzip_sar_img"
query_sar = pd.read_csv(QUERY_CSV_PATH, header=0)[FILE_NAME_COLUMN]

sar_list = []

for sar_name in query_sar:
    sar_path = join(UNZIP_SAFE_FILE, sar_name + ".SAFE")
    if not exists(sar_path):
        sar_list.append(sar_name)
#print(len(sar_list))

new_products = DownloadSARSentinel("pedro.meirelles@ufba.br", "Thermal1234@", product_list=sar_list)
new_products.query_result()

new_products.download_products(folder="/mnt/camobi_process/new_data/new_SAR_img")

Found: S1B_IW_SLC__1SDV_20210120T080527_20210120T080554_025235_030137_BB07
Found: S1A_IW_SLC__1SDV_20170810T024712_20170810T024738_017855_01DEF7_445E
Found: S1A_IW_SLC__1SDV_20170729T024712_20170729T024737_017680_01D9A0_A8A3
Found: S1A_IW_SLC__1SDV_20210612T235346_20210612T235415_038314_048582_23F3
Found: S1B_IW_SLC__1SDV_20211003T014926_20211003T014953_028965_0374DA_4688
Found: S1B_IW_SLC__1SDV_20211121T142946_20211121T143013_029687_038B19_5510
Found: S1A_IW_SLC__1SDV_20210805T000201_20210805T000228_039087_049CB9_D205
Found: S1A_IW_SLC__1SDV_20170709T000134_20170709T000201_017387_01D0AA_205D
Found: S1B_IW_SLC__1SDV_20190325T081332_20190325T081359_015508_01D0FD_EBAF
Found: S1A_IW_SLC__1SDV_20200203T002425_20200203T002453_031081_039239_CC57
Found: S1A_IW_SLC__1SSV_20151213T143637_20151213T143704_009025_00CF19_09E6
Found: S1A_IW_SLC__1SDV_20170717T024711_20170717T024736_017505_01D444_DB4F
Found: S1A_IW_SLC__1SDV_20170326T023848_20170326T023915_015857_01A210_CDC3
Found: S1A_IW_SLC__1SDV_2

Downloading: S1B_IW_SLC__1SDV_20211121T142946_20211121T143013_029687_038B19_5510.SAFE:   0%|          | 0.00/7.83G [00:00<?, ?B/s]

OSError: [Errno 28] No space left on device

In [None]:
downlaod_data = DownloadSARSentinel("pedro.meirelles@ufba.br", "Thermal1234@", product_list=list(query_sar))

In [4]:
class SentinelProduct:
    def __init__(self, name, file_path, nc_graph_path,  rect_corners=None):
        self.name = name
        self.rect_corners = rect_corners
        self.file_path = file_path
        self.nc_graph_path = nc_graph_path
        self.unzip_path = None
        self.netcdf_path = None

    def unzip(self, unzip_folder):
        assert exists(unzip_folder), f"Folder \"{unzip_folder}\" does not exist!"
        self.unzip_path = join(unzip_folder, self.name) 

        try:
            print("Unziping:", self.name)
            with ZipFile(self.file_path, 'r') as zip_ref:
                zip_ref.extractall(self.unzip_path)
        except BadZipFile:
            print(f"Imposible to unzip: {self.name}. file is incomplete or corrupted!")

    def edit_zip_to_nc(self, netcdf_folder):
        with open(self.nc_graph_path) as arquivo:
            dados = xmltodict.parse(arquivo.read())

        if not self.unzip_path:
            input_path = self.unzip_path
        else:
            input_path = self.file_path

        self.netcdf_path = join(netcdf_folder, self.name + ".nc")

        dados['graph']['node'][0]['parameters']['file'] = input_path 
        dados['graph']['node'][-1]['parameters']['file'] = self.netcdf_path 

        with open(self.nc_graph_path, 'w') as arquivo:
            arquivo.write(xmltodict.unparse(dados, pretty=True))

    def convert_to_netcdf4(self, gpt_path, netcdf_folder):
        self.edit_zip_to_nc(netcdf_folder)
        shell = run([gpt_path, self.nc_graph_path])#, stdout=DEVNULL, stderr=DEVNULL)



In [5]:
SAR_TO_NC_GRAPH = "/mnt/camobi_2/PHMG/Sentinel_Acquisition/graphs/ZIP_to_NC.xml"
PATH_TO_GPT = "/home/camobi/snap/bin/gpt"
NETCDF_FOLER = "/mnt/camobi_2/PHMG/Sentinel_Acquisition/netcdf_folder"
UNZIP_FOLDER = "/mnt/camobi_2/PHMG/Sentinel_Acquisition/unzip_folder"


product_name = pd.read_csv(QUERY_CSV_PATH, header=0)[FILE_NAME_COLUMN][0][:-5]
product_path = join("/mnt/camobi_2/PHMG/Sentinel_Acquisition/raw_folder", product_name + ".SAFE.zip")

product = SentinelProduct(product_name, product_path, SAR_TO_NC_GRAPH)
product.unzip(UNZIP_FOLDER)
product.convert_to_netcdf4(PATH_TO_GPT, NETCDF_FOLER)

Unziping: S1A_IW_SLC__1SDV_20141004T154823_20141004T154851_002682_002FE4_C094
Imposible to unzip: S1A_IW_SLC__1SDV_20141004T154823_20141004T154851_002682_002FE4_C094. file is incomplete or corrupted!


INFO: org.esa.snap.core.gpf.operators.tooladapter.ToolAdapterIO: Initializing external tool adapters
INFO: org.esa.s2tbx.dataio.gdal.GDALVersion: GDAL not found on system. Internal GDAL 3.2.1 from distribution will be used. (f0)
INFO: org.esa.s2tbx.dataio.gdal.GDALVersion: Internal GDAL 3.2.1 set to be used by SNAP.
INFO: org.esa.snap.core.util.EngineVersionCheckActivator: Please check regularly for new updates for the best SNAP experience.
INFO: org.esa.s2tbx.dataio.gdal.GDALVersion: Internal GDAL 3.2.1 set to be used by SNAP.


Executing processing graph


SEVERE: org.esa.snap.core.dataio.ProductIO: Error attempting to read /mnt/camobi_2/PHMG/Sentinel_Acquisition/raw_folder/S1A_IW_SLC__1SDV_20141004T154823_20141004T154851_002682_002FE4_C094.SAFE.zip with plugin reader org.esa.s2tbx.dataio.s2.ortho.plugins.Sentinel2L1CProduct_Multi_UTM41N_ReaderPlugIn@61bfc9bf
java.lang.IllegalStateException: java.lang.reflect.InvocationTargetException
	at org.esa.s2tbx.dataio.VirtualDirEx.build(VirtualDirEx.java:101)
	at org.esa.s2tbx.dataio.s2.filepatterns.S2NamingConventionUtils.transformToSentinel2VirtualPath(S2NamingConventionUtils.java:307)
	at org.esa.s2tbx.dataio.s2.ortho.S2ProductCRSCache$S2ProductCRSCacheEntry.<init>(S2ProductCRSCache.java:57)
	at org.esa.s2tbx.dataio.s2.ortho.S2ProductCRSCache.ensureIsCached(S2ProductCRSCache.java:156)
	at org.esa.s2tbx.dataio.s2.ortho.S2OrthoProductReaderPlugIn.getDecodeQualification(S2OrthoProductReaderPlugIn.java:101)
	at org.esa.snap.core.dataio.ProductIO.getProductReaderForInput(ProductIO.java:304)
	at org

 done.


SEVERE: org.esa.snap.core.dataio.ProductIO: Error attempting to read /mnt/camobi_2/PHMG/Sentinel_Acquisition/raw_folder/S1A_IW_SLC__1SDV_20141004T154823_20141004T154851_002682_002FE4_C094.SAFE.zip with plugin reader org.esa.s2tbx.dataio.s2.ortho.plugins.Sentinel2L1CProduct_Multi_UTM59N_ReaderPlugIn@4a2929a4
java.lang.IllegalStateException: java.lang.reflect.InvocationTargetException
	at org.esa.s2tbx.dataio.VirtualDirEx.build(VirtualDirEx.java:101)
	at org.esa.s2tbx.dataio.s2.filepatterns.S2NamingConventionUtils.transformToSentinel2VirtualPath(S2NamingConventionUtils.java:307)
	at org.esa.s2tbx.dataio.s2.ortho.S2ProductCRSCache$S2ProductCRSCacheEntry.<init>(S2ProductCRSCache.java:57)
	at org.esa.s2tbx.dataio.s2.ortho.S2ProductCRSCache.ensureIsCached(S2ProductCRSCache.java:156)
	at org.esa.s2tbx.dataio.s2.ortho.S2OrthoProductReaderPlugIn.getDecodeQualification(S2OrthoProductReaderPlugIn.java:101)
	at org.esa.snap.core.dataio.ProductIO.getProductReaderForInput(ProductIO.java:304)
	at org

In [15]:
class PedroNet(LightningModule): #out_channels = numero de classes
    def __init__(self, img_size, lr,
                 depths=(2, 2, 2, 2), 
                 num_heads=(3, 6, 12, 24), 
                 feature_size=24, 
                 norm_name='instance', 
                 drop_rate=0.0, 
                 attn_drop_rate=0.0, 
                 dropout_path_rate=0.0, 
                 normalize=True, 
                 use_checkpoint=False, 
                 downsample='merging', 
                 use_v2=False 
                 ):
        super().__init__()
        self.model = Sequential(SwinUNETR(spatial_dims=2,
                                    in_channels=1,
                                    out_channels=1,
                                    depths=depths,
                                    img_size=img_size,
                                    feature_size=feature_size,
                                    drop_rate=drop_rate,
                                    num_heads=num_heads,
                                    norm_name=norm_name,
                                    attn_drop_rate=attn_drop_rate,
                                    dropout_path_rate=dropout_path_rate,
                                    normalize=normalize,
                                    use_checkpoint=use_checkpoint,
                                    downsample=downsample,
                                    #use_v2=use_v2, apenas para versões mais recentes
                                    ))
    def forward(self, x):
        return self.model(x)
    
    def netcdf_inferece(self, nc_product):
        torch_img = from_numpy(np.asarray(nc_product.nc_img)).to("cuda")
        torch_img = torch_img.unsqueeze(0).unsqueeze(0)

        with inference_mode():
            model_img = sliding_window_inference(torch_img, 
                                            roi_size=(512),
                                            sw_batch_size=20, 
                                            predictor=DataParallel(self.model), 
                                            mode='constant',
                                            overlap=0.8,
                                            progress=True
                                            )

            sigmoid_fn = Sigmoid()
            model_img = sigmoid_fn(model_img)
            model_img = model_img.to("cpu").squeeze()
        return model_img

class NetcdfProduct:
    def __init__(self, product, image_variable='Sigma0_VV_db'):
        self.product = product
        self.name = product.filepath().split("/")[-1].split(".")[0]
        self.image_variable = image_variable
        self.nc_img = product.variables[self.image_variable][:]
    
    def __str__(self):
        return self.name

    def create_img(self, folder_path):
        img_path = join(folder_path, self.name + ".png")
        normalized_img = ((self.nc_img - np.min(self.nc_img)) / (np.max(self.nc_img) - np.min(self.nc_img))) * 255
        cv2.imwrite(img_path, normalized_img)
    
    @staticmethod
    def create_polygons(mask):
        edited_contours = []
        binary_image = np.array(mask)
        
        contours, hierarchy = cv2.findContours(binary_image.astype(np.uint8), cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
        
        for poly in contours:
            if len(poly) > 50:
                approx = cv2.approxPolyDP(poly, 0.8, True)
                approx = np.squeeze(approx)
                edited_contours.append(approx)
        return edited_contours
    
    @staticmethod
    def mask_to_bool(probs, threshold=0.5):
        mask = np.asarray(probs)
        mask[mask > threshold] = True
        mask[mask < threshold] = False
        return mask

    def probs_to_labelme(self, probs, folder, threshold=0.5):
        mask = NetcdfProduct.mask_to_bool(probs, threshold)
        masked_polygons = NetcdfProduct.create_polygons(mask)
        labelme_format = {"version": "5.1.1",
                          "flags": {},
                          "shapes": [],
                          "imagePath": f"..\\Sar_img\\{self.name}.png",  # Update with your image filename
                          "imageData": None,
                          "imageHeight": self.product.dimensions["y"].size,
                          "imageWidth": self.product.dimensions["x"].size
                          }

        for patch in masked_polygons:
            labelme_format["shapes"].append({
                "label": "oil", 
                "points": patch.squeeze().tolist(),
                "group_id": None,
                "description": "",
                "shape_type": "polygon",
                "flags": {}
            })

        auto_labels_path = join(folder, f"{self.name}.json")
        with open(auto_labels_path, 'w') as json_file:
            json.dump(labelme_format, json_file, indent=2)
        print(f"Label \"{self.name}.json\" created!")


In [12]:
NETCDF_PRODUCT_PATH = "/mnt/camobi_process/new_data/images_nc"

list_nc_product = []

for nc_data in tqdm(os.listdir(NETCDF_PRODUCT_PATH)):
    nc_data_path = join(NETCDF_PRODUCT_PATH, nc_data)
    nc_img = nc.Dataset(nc_data_path, 'r')
    netcdf_sar = NetcdfProduct(nc_img)
    list_nc_product.append(netcdf_sar)
    #netcdf_sar.create_img("/mnt/camobi_2/PHMG/Sentinel_Acquisition/img_folder")

100%|██████████| 69/69 [03:19<00:00,  2.88s/it]


In [14]:
IMAGE_FOLDER = "/mnt/camobi_2/PHMG/Sentinel_Acquisition/img_folder"

for nc_image in tqdm(list_nc_product):
    nc_image.create_img(IMAGE_FOLDER)

100%|██████████| 69/69 [04:10<00:00,  3.63s/it]


In [16]:
LABELS_FOLDER = "/mnt/camobi_2/PHMG/Sentinel_Acquisition/auto_labels"
WEIGHTS_MODEL = "/mnt/camobi_2/PHMG/PedroSwinNet/Model_512Img_24Feature_(2, 2, 2, 2)depths_0.0attnDrop_(3, 6, 12, 24)Heads_30.000000Lr_0drop_v1/model-Val_loss=0.003714-Val_Precision=0.973-Recall=0.971-Val_F1_Score=0.972.ckpt"
loaded_model = PedroNet.load_from_checkpoint(WEIGHTS_MODEL)


for nc_image in tqdm(list_nc_product):
    probs = loaded_model.netcdf_inferece(nc_image)
    nc_image.probs_to_labelme(probs, LABELS_FOLDER)

100%|██████████| 156/156 [00:59<00:00,  2.63it/s]
  1%|▏         | 1/69 [01:00<1:09:00, 60.89s/it]

Label "A8A3.json" created!


100%|██████████| 25/25 [00:08<00:00,  2.80it/s]
  3%|▎         | 2/69 [01:10<34:09, 30.60s/it]  

Label "2EBC.json" created!


100%|██████████| 6/6 [00:02<00:00,  2.83it/s]
  4%|▍         | 3/69 [01:12<19:22, 17.62s/it]

Label "D205.json" created!


100%|██████████| 169/169 [01:03<00:00,  2.65it/s]
  6%|▌         | 4/69 [02:18<39:35, 36.54s/it]

Label "4DB8.json" created!


100%|██████████| 169/169 [01:03<00:00,  2.65it/s]
  7%|▋         | 5/69 [03:23<50:11, 47.06s/it]

Label "0868.json" created!


100%|██████████| 171/171 [01:04<00:00,  2.63it/s]
  9%|▊         | 6/69 [04:30<56:27, 53.77s/it]

Label "F8D3.json" created!


100%|██████████| 169/169 [01:03<00:00,  2.65it/s]
 10%|█         | 7/69 [05:36<59:37, 57.71s/it]

Label "C094.json" created!


 93%|█████████▎| 157/169 [00:59<00:04,  2.64it/s]
 10%|█         | 7/69 [06:35<58:26, 56.56s/it]


KeyboardInterrupt: 

100%|██████████| 185/185 [01:09<00:00,  2.66it/s]


In [89]:

#plt.imshow(test_mask)
test_mask_1 = np.array(test_mask)
test_mask_1[netcdf_sar.nc_img.mask] = np.nan
#plt.imshow(test_mask_1)
netcdf_sar.probs_to_labelme(test_mask_1, LABELS_FOLDER)

  contours, hierarchy = cv2.findContours(binary_image.astype(np.uint8), cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)


Label "D0F5.json" created!


In [8]:
class SentinelAcquisition:
    def __init__(self, data):
        self.data = data




In [None]:
sar_data = SentinelAcquisition()