blumenstiel's picture
Fix app
dfb5c47
import os
import torch
import yaml
import numpy as np
import gradio as gr
from pathlib import Path
from einops import rearrange
from functools import partial
from huggingface_hub import hf_hub_download
from terratorch.cli_tools import LightningInferenceModel
# Pull the config, the checkpoint and the inference helper script from the hub.
import shutil

REPO_ID = "ibm-nasa-geospatial/Prithvi-EO-2.0-300M-TL-Sen1Floods11"

# HF_TOKEN is optional; None is passed through when it is not set.
token = os.environ.get("HF_TOKEN", None)
config_path = hf_hub_download(repo_id=REPO_ID, filename="config.yaml", token=token)
checkpoint = hf_hub_download(repo_id=REPO_ID,
                             filename='Prithvi-EO-V2-300M-TL-Sen1Floods11.pt',
                             token=token)
model_inference = hf_hub_download(repo_id=REPO_ID, filename='inference.py', token=token)

# Copy the downloaded script into the working directory so that it can be
# imported as the ``inference`` module below. shutil.copy avoids building a
# shell command from a path and raises if the copy fails instead of silently
# continuing to a confusing ImportError.
shutil.copy(model_inference, ".")

from inference import process_channel_group, _convert_np_uint8, load_example, run_model
def predict_on_images(data_file: str | Path, config_path: str, checkpoint: str):
    """Run the flood model on one image file and return three display images.

    Args:
        data_file: Path to the input image, or an object that exposes the
            path through a ``name`` attribute.
        config_path: Path to the YAML config. It is read for the band list
            and is also handed to ``LightningInferenceModel.from_config``.
        checkpoint: Checkpoint path handed to
            ``LightningInferenceModel.from_config``.

    Returns:
        A list ``[input RGB, prediction, overlay]``; each entry is the result
        of ``_convert_np_uint8`` transposed with ``(1, 2, 0)``.

    Raises:
        ValueError: If the loaded data has neither 6 nor 13 channels.
    """
    if isinstance(data_file, Path):
        # ``Path.name`` is only the final path component, so unwrapping it
        # below would drop the directory. Keep the full path instead.
        data_file = str(data_file)

    try:
        wrapped_path = data_file.name
    except AttributeError:
        # No ``name`` attribute (e.g. a plain string): use the value as-is.
        print('Files submitted through UI')
    else:
        data_file = wrapped_path
        print('Path extracted from example')

    # Get parameters --------
    print('This is the printout', data_file)

    with open(config_path, "r") as f:
        config_dict = yaml.safe_load(f)

    # Load model ---------------------------------------------------------------------------------
    # NOTE(review): the model is rebuilt from config and checkpoint on every call.
    lightning_model = LightningInferenceModel.from_config(config_path, checkpoint)

    img_size = 512  # Size from Sen1Floods11 training

    # Loading data ---------------------------------------------------------------------------------
    input_data, temporal_coords, location_coords, meta_data = load_example(file_paths=[data_file])

    num_channels = input_data.shape[1]
    if num_channels == 13:
        # Pick the six Prithvi bands out of the 13 S2L1C bands.
        input_data = input_data[:, [1, 2, 3, 8, 11, 12], ...]
    elif num_channels != 6:
        raise ValueError(f'Input data has {input_data.shape[1]} channels. Expect either 6 Prithvi channels or 13 S2L1C channels.')

    if input_data.mean() > 1:
        input_data = input_data / 10000  # Convert to range 0-1

    # Running model --------------------------------------------------------------------------------
    lightning_model.model.eval()

    # Positions of the display bands within the configured band list.
    channels = [config_dict['data']['init_args']['bands'].index(b) for b in ["RED", "GREEN", "BLUE"]]  # BGR -> RGB

    pred = run_model(input_data, temporal_coords, location_coords,
                     lightning_model.model, lightning_model.datamodule, img_size)

    if input_data.mean() < 1:
        input_data = input_data * 10000  # Scale to 0-10000

    # Extract RGB images for display
    rgb_orig = process_channel_group(
        orig_img=torch.Tensor(input_data[0, :, 0, ...]),
        channels=channels,
    )
    out_rgb_orig = _convert_np_uint8(rgb_orig).transpose(1, 2, 0)
    # The prediction image must be built before zeros are replaced by NaN below.
    out_pred_rgb = _convert_np_uint8(pred).repeat(3, axis=0).transpose(1, 2, 0)

    # Blend the prediction into the input image. Pixels predicted as 0 become
    # NaN in the blend and are then filled back in from the input image, so
    # only non-zero predictions tint the overlay.
    pred[pred == 0.] = np.nan
    img_pred = rgb_orig * 0.6 + pred * 0.4
    unblended = img_pred.isnan()
    img_pred[unblended] = rgb_orig[unblended]

    out_img_pred = _convert_np_uint8(img_pred).transpose(1, 2, 0)

    outputs = [out_rgb_orig, out_pred_rgb, out_img_pred]

    print("Done!")

    return outputs
# Bind the downloaded config and checkpoint so the UI callbacks only pass the file.
run_inference = partial(predict_on_images, config_path=config_path, checkpoint=checkpoint)

with gr.Blocks() as demo:

    gr.Markdown(value='# Prithvi-EO-2.0 Sen1Floods11 Demo')
    gr.Markdown(value='''
Prithvi-EO-2.0 is the second generation EO foundation model developed by the IBM and NASA team.
This demo showcases the fine-tuned Prithvi-EO-2.0-300M-TL model to detect water using Sentinel 2 imagery from on the [sen1floods11 dataset](https://github.com/cloudtostreet/Sen1Floods11). More details can be found [here](https://huggingface.co/ibm-nasa-geospatial/Prithvi-EO-2.0-300M-TL-Sen1Floods11).\n
The user needs to provide a Sentinel-2 L1C image with either all the 13 bands or the six Prithvi bands (Blue, Green, Red, Narrow NIR, SWIR, SWIR 2). The demo code selects the required bands.
We recommend submitting images of 500 to ~1000 pixels for faster processing time. Images bigger than 256x256 are processed using a sliding window approach which can lead to artefacts between patches.\n
Optionally, the location information is extracted from the tif files while the temporal information can be provided in the filename in the format `<date>T<time>` or `<year><julian day>T<time>` (HLS format).
Some example images are provided at the end of this page.
''')

    # Input: a single file upload plus the submit button.
    with gr.Row():
        with gr.Column():
            inp_file = gr.File(elem_id='file')
            btn = gr.Button("Submit")

    # Column headings for the three result images.
    with gr.Row():
        gr.Markdown(value='## Input image')
        gr.Markdown(value='## Prediction*')
        gr.Markdown(value='## Overlay')

    with gr.Row():
        original = gr.Image(image_mode='RGB', show_label=False, show_fullscreen_button=False)
        predicted = gr.Image(image_mode='RGB', show_label=False, show_fullscreen_button=False)
        overlay = gr.Image(image_mode='RGB', show_label=False, show_fullscreen_button=False)

    # Raw string: the backslash must reach Markdown literally, and "\*" is not
    # a valid Python escape sequence.
    gr.Markdown(value=r'\* White = flood; Black = no flood')

    btn.click(fn=run_inference,
              inputs=inp_file,
              outputs=[original, predicted, overlay])

    # Example files are expected in an "examples" folder next to this script.
    examples_dir = os.path.join(os.path.dirname(__file__), "examples")
    example_files = [
        os.path.join(examples_dir, file_name)
        for file_name in (
            "India_900498_S2Hand.tif",
            "Spain_7370579_S2Hand.tif",
            "USA_430764_S2Hand.tif",
        )
    ]

    with gr.Row():
        gr.Examples(examples=example_files,
                    inputs=inp_file,
                    outputs=[original, predicted, overlay],
                    fn=run_inference,
                    cache_examples=True
                    )

demo.launch(share=True, ssr_mode=False)