import spaces
import numpy as np
from ultralytics import YOLO, SAM
import os
import json
from PIL import Image
import cv2
import torch
from transformers import TrOCRProcessor, VisionEncoderDecoderModel
import rasterio
import rasterio.features
from shapely.geometry import shape
import pandas as pd
import osmnx as ox
from osgeo import gdal, osr
import geopandas as gpd
from rapidfuzz import process, fuzz
from huggingface_hub import hf_hub_download
from config import OUTPUT_DIR
from pathlib import Path
from .helpers import (
    box_inside_global, nms_iou, non_max_suppression, tile_image_with_overlap,
    compute_iou, merge_boxes, box_area, is_contained, merge_boxes_iterative,
    get_corner_points, sample_negative_points_outside_boxes,
    get_inset_corner_points, processYOLOBoxes, prepare_tiles, merge_tile_masks,
    chunkify, img_shape, best_street_match,
)
from pyproj import Transformer
import shutil
import re
from shapely.ops import nearest_points
from geopy.distance import geodesic

# Global cache for the TrOCR model so repeated OCR calls reuse one instance.
_trocr_processor = None
_trocr_model = None
_trocr_device = torch.device("cuda" if torch.cuda.is_available() else "cpu")


def run_inference(tile_dict, gcp_path, user_crs, city_name, score_th, hist_th, hist_dic):
    """Run the full map-OCR pipeline on one tile and stream progress.

    Generator yielding ``(log_text, payload)`` tuples, where ``payload`` is
    ``None`` for plain progress messages, a mask path when the segmentation
    mask is saved, or a list of result CSV paths at the end.

    Args:
        tile_dict: dict with ``tile_path`` and ``coords`` (x_start, y_start,
            x_end, y_end) of the selected tile, or None if nothing selected.
        gcp_path: CSV of ground control points (mapX/mapY/sourceX/sourceY).
        user_crs: EPSG code (int/str) of the GCP coordinate system.
        city_name: city used to fetch the OSM street network.
        score_th: OSM fuzzy-match score threshold for auto-accepting blobs.
        hist_th: historic-name fuzzy-match threshold.
        hist_dic: path to a historic street-name list CSV, or None to skip.
    """
    IMAGE_FOLDER = os.path.join(OUTPUT_DIR, "blobs")
    CSV_FILE = os.path.join(OUTPUT_DIR, "annotations.csv")
    MASK_FILE = os.path.join(OUTPUT_DIR, "mask.tif")

    # Start from a clean slate: previous blobs, tiles and outputs are removed.
    if os.path.exists(IMAGE_FOLDER):
        shutil.rmtree(IMAGE_FOLDER)
    os.makedirs(IMAGE_FOLDER, exist_ok=True)
    if os.path.exists("tmp"):
        shutil.rmtree("tmp")
    os.makedirs("tmp", exist_ok=True)
    if os.path.exists(CSV_FILE):
        os.remove(CSV_FILE)
    if os.path.exists(MASK_FILE):
        os.remove(MASK_FILE)

    log = ""
    if tile_dict is None:
        yield "No tile selected", None
        return

    image_path = tile_dict["tile_path"]
    coords = tile_dict["coords"]  # (x_start, y_start, x_end, y_end)
    print(f"Tile path: {image_path}; Tile coords: {coords}")

    # ==== TEXT DETECTION ====
    for msg in getBBoxes(image_path):
        log += msg + "\n"
        yield log, None

    # Fix: initialize before the loop — the original assigned stop_pipeline
    # only inside the loop body, raising NameError if getSegments yielded
    # nothing at all.
    stop_pipeline = False
    for msg in getSegments(image_path):
        if msg.endswith(".tif"):
            log += f"Mask saved at {msg}.\n"
            yield log, msg
        else:
            log += msg + "\n"
            yield log, None
        if "No labels detected" in msg:
            stop_pipeline = True
            break
    if stop_pipeline:
        yield log + "Pipeline stopped: no text segments found.\n", None
        return

    for msg in extractSegments(image_path):
        log += msg + "\n"
        yield log, None

    # === TEXT RECOGNITION ===
    for msg in blobsOCR_all():
        log += msg + "\n"
        yield log, None

    # === ADD GEO DATA ===
    for msg in georefTile(coords, gcp_path):
        log += msg + "\n"
        yield log, None
    for msg in extractCentroids(image_path):
        log += msg + "\n"
        yield log, None
    for msg in extractStreetNet(city_name, user_crs):
        log += msg + "\n"
        yield log, None

    # === POST OCR ===
    all_csvs = []
    for msg in fuzzyMatch(score_th, tile_dict):
        if isinstance(msg, list):
            # msg is [street_matches_csv, osm_csv]
            all_csvs.extend(msg)  # append these CSV paths
            log += "Finished! CSVs saved at:\n"
            for f in msg:
                log += f" - {f}\n"
            yield log, None
        else:
            log += msg + "\n"
            yield log, None

    if hist_dic is not None:
        # Run fuzzy match against historic street names
        for msg in fuzzyMatchHist(hist_dic, hist_th, tile_dict):
            if isinstance(msg, list):
                all_csvs.extend(msg)  # append historic CSV as well
                log += "Historic fuzzy matching finished! CSVs saved at:\n"
                for f in msg:
                    log += f" - {f}\n"
                yield log, all_csvs  # now yields all three CSVs together
            else:
                log += msg + "\n"
                yield log, None
    else:
        # If historic matching is skipped, yield the OSM match files
        yield log, all_csvs


def load_trocr_model():
    """Load TrOCR processor/model into the module cache (GPU if available)."""
    global _trocr_processor, _trocr_model
    if _trocr_model is None:
        _trocr_processor = TrOCRProcessor.from_pretrained("microsoft/trocr-base-str")
        _trocr_model = VisionEncoderDecoderModel.from_pretrained("muk42/trocr_streets")
        _trocr_model.to(_trocr_device).eval()
    return _trocr_processor, _trocr_model


@spaces.GPU
def getBBoxes(image_path, tile_size=256, overlap=0.3, confidence_threshold=0.25):
    """Detect text boxes with a fine-tuned YOLOv9, tiling the full image.

    Yields progress strings; writes all detections (full-image pixel
    coordinates) to ``OUTPUT_DIR/boxes.json``.
    """
    yield f"DEBUG: Received image_path: {image_path}"
    image = cv2.imread(image_path)
    H, W, _ = image.shape
    # fine-tuned on selection of city maps
    yolo_weights = hf_hub_download(
        repo_id="muk42/yolov9_streets", filename="yolov9c_finetuned_v2.pt"
    )
    model = YOLO(yolo_weights)

    step = int(tile_size * (1 - overlap))
    all_detections = []

    # Calculate total tiles for progress reporting
    total_tiles = 0
    for y in range(0, H, step):
        for x in range(0, W, step):
            # Skip small tiles at the edges
            if y + tile_size > H or x + tile_size > W:
                continue
            total_tiles += 1

    processed_tiles = 0
    # Tile the image and run prediction
    for y in range(0, H, step):
        for x in range(0, W, step):
            tile = image[y:y + tile_size, x:x + tile_size]
            if tile.shape[0] < tile_size or tile.shape[1] < tile_size:
                continue
            results = model.predict(
                source=tile, imgsz=tile_size, conf=confidence_threshold,
                verbose=False, iou=0.5,
            )
            for result in results:
                boxes = result.boxes.xyxy.cpu().numpy()
                scores = result.boxes.conf.cpu().numpy()
                classes = result.boxes.cls.cpu().numpy()
                for box, score, cls in zip(boxes, scores, classes):
                    x1, y1, x2, y2 = box
                    # Shift box coordinates relative to full image
                    x1 += x
                    x2 += x
                    y1 += y
                    y2 += y
                    all_detections.append([x1, y1, x2, y2, float(score), int(cls)])
            processed_tiles += 1
            yield f"Processed tile {processed_tiles} of {total_tiles}"

    # After all tiles are processed, save detections to JSON
    boxes_to_save = [
        {
            "bbox": [float(x1), float(y1), float(x2), float(y2)],
            "score": float(conf),
            "class": int(cls),
        }
        for x1, y1, x2, y2, conf, cls in all_detections
    ]
    BOXES_PATH = os.path.join(OUTPUT_DIR, "boxes.json")
    with open(BOXES_PATH, "w") as f:
        json.dump(boxes_to_save, f, indent=4)
    yield f"Inference complete."


@spaces.GPU
def run_tile_inference():
    """Run SAM on each prepared tile, saving mask stacks as .npy files.

    Reads tile metadata from ``tmp/tiles_meta.json`` (written by
    prepare_tiles). Yields progress strings; the message containing
    "Stopping inference" is matched by getSegments to abort the pipeline.
    """
    model = SAM("mobile_sam.pt")  # sam2.1_l.pt
    Path("tmp/masks").mkdir(parents=True, exist_ok=True)
    with open("tmp/tiles_meta.json", "r") as f:
        tiles_meta = json.load(f)

    for tile in tiles_meta:
        yield f"Processing {tile['idx']}..."
        tile_path = f"tmp/tiles/tile_{tile['idx']}.png"
        out_path = tile_path.replace("tiles", "masks").replace(".png", ".npy")
        # skip if already processed
        if Path(out_path).exists():
            continue

        local_boxes = tile.get('local_boxes', [])
        point_coords = tile.get('point_coords', [])
        point_labels = tile.get('point_labels', [])
        tile_array = np.array(Image.open(tile_path))

        # If there are no boxes and no labels, stop execution
        if not local_boxes and not point_coords and not point_labels:
            yield f"Tile {tile['idx']} has no boxes or points/labels. Stopping inference."
            return

        results = model(tile_array, bboxes=local_boxes, points=point_coords, labels=point_labels)
        masks_to_save = [r.masks.data.cpu().numpy() for r in results if r.masks is not None]
        if masks_to_save:
            masks_stack = np.concatenate(masks_to_save, axis=0)  # shape (N, H, W)
            np.save(out_path, masks_stack)


def getSegments(image_path, iou=0.5, c_th=0.75, edge_margin=10):
    """Segment the detected text boxes into a labelled mask image.

    Args:
        image_path: path to the map tile image.
        iou: IoU threshold for combining bounding boxes.
        c_th: share of the smaller box contained in the larger box for merge.
        edge_margin: pixel margin for tiles.

    Yields progress strings; the final yield is the mask path (ends with
    ".tif"), which run_inference detects to report the saved mask.
    """
    yield "Load YOLO boxes.."
    BOXES_PATH = os.path.join(OUTPUT_DIR, "boxes.json")
    with open(BOXES_PATH, "r") as f:
        box_data = json.load(f)
    boxes = [b["bbox"] for b in box_data]

    yield "Prepare tiles..."
    H, W = prepare_tiles(
        image_path, boxes, tile_size=1024, overlap=50,
        iou=iou, c_th=c_th, edge_margin=edge_margin,
    )

    yield "Run inference on tiles..."
    for msg in run_tile_inference():
        yield msg
        if "Stopping inference" in msg:
            yield "No labels detected – halting getSegments."
            return

    # Fix: original message read "Marge predicted masks..." (typo).
    yield "Merge predicted masks into image..."
    merge_tile_masks(H, W)
    MASK_PATH = os.path.join(OUTPUT_DIR, "mask.tif")
    yield f"{MASK_PATH}"


def extractSegments(image_path, min_size=500, margin=100):
    """Crop each labelled blob from the mask into per-blob PNGs.

    For every blob id in OUTPUT_DIR/mask.tif (0 = background) writes:
      - ``blobs/<id>.png``        tight crop of the original image, and
      - ``blobs/<id>_margin.png`` crop with *margin* px context and the blob
        shaded for visual review.
    Blobs smaller than *min_size* pixels are skipped.
    """
    image = cv2.imread(image_path)
    MASK_PATH = os.path.join(OUTPUT_DIR, "mask.tif")
    mask = cv2.imread(MASK_PATH, cv2.IMREAD_UNCHANGED)
    height, width = mask.shape[:2]

    # Get unique labels (excluding background label 0)
    blob_ids = np.unique(mask)
    blob_ids = blob_ids[blob_ids != 0]
    yield f"Found {len(blob_ids)} blobs"

    for blob_id in blob_ids:
        yield f"Processing blob {blob_id}..."
        # Create a binary mask for the current blob
        blob_mask = (mask == blob_id).astype(np.uint8)

        # Skip small blobs
        if np.sum(blob_mask) < min_size:
            continue

        # Find bounding box of the blob (tight box without margins)
        ys, xs = np.where(blob_mask)
        y_min, y_max = ys.min(), ys.max() + 1
        x_min, x_max = xs.min(), xs.max() + 1

        # ---- ORIGINAL (no mask, no margin) ----
        cropped_image_orig = image[y_min:y_max, x_min:x_max]
        BLOB_PATH_ORIG = os.path.join(OUTPUT_DIR, "blobs", f"{blob_id}.png")
        cv2.imwrite(BLOB_PATH_ORIG, cropped_image_orig)

        # ---- MARGINALIZED (with mask/shading) ----
        x_min_m = max(0, x_min - margin)
        y_min_m = max(0, y_min - margin)
        x_max_m = min(width, x_max + margin)
        y_max_m = min(height, y_max + margin)

        cropped_image_margin = image[y_min_m:y_max_m, x_min_m:x_max_m]
        cropped_mask_margin = blob_mask[y_min_m:y_max_m, x_min_m:x_max_m]

        shaded_margin = cropped_image_margin.copy()
        overlay_margin = cropped_image_margin.copy()
        overlay_margin[cropped_mask_margin == 1] = (255, 200, 100)
        # 35% tint over the blob area so annotators can see which text is meant.
        shaded_margin = cv2.addWeighted(overlay_margin, 0.35, shaded_margin, 0.65, 0)

        BLOB_PATH_MARGIN = os.path.join(OUTPUT_DIR, "blobs", f"{blob_id}_margin.png")
        cv2.imwrite(BLOB_PATH_MARGIN, shaded_margin)

    yield f"Done."


@spaces.GPU
def blobsOCR_chunk(image_paths):
    """Run OCR on a list of images (one chunk).

    Returns a list of ``(blob_name, recognized_text)`` tuples, where the
    name is the file's basename without extension.
    """
    processor, model = load_trocr_model()
    results = []

    # Load all images in the chunk
    images = [Image.open(path).convert("RGB") for path in image_paths]
    # Convert to pixel_values tensor
    pixel_values = processor(
        images=images, return_tensors="pt", padding=True
    ).pixel_values.to(_trocr_device)

    # Generate text for the whole batch at once
    generated_ids = model.generate(pixel_values)
    texts = processor.batch_decode(generated_ids, skip_special_tokens=True)

    for path, text in zip(image_paths, texts):
        name = os.path.splitext(os.path.basename(path))[0]
        results.append((name, text))
    return results


def blobsOCR_all():
    """OCR every extracted blob (excluding *_margin previews) in batches.

    Writes ``OUTPUT_DIR/ocr.csv`` with rows ``blob_id,"text"`` and yields
    progress strings.
    """
    image_folder = os.path.join(OUTPUT_DIR, "blobs")
    all_files = [
        os.path.join(image_folder, f)
        for f in os.listdir(image_folder)
        if f.endswith(".png") and '_margin' not in f
    ]
    OCR_PATH = os.path.join(OUTPUT_DIR, "ocr.csv")
    with open(OCR_PATH, "w", encoding="utf-8") as f_out:
        for chunk in chunkify(all_files, n=16):  # adjust batch size
            yield f"Processing {len(chunk)} images..."
            results = blobsOCR_chunk(chunk)
            for name, text in results:
                f_out.write(f'{name},"{text}"\n')
                yield f"{name} → {text}"


def extractCentroids(image_path):
    """Compute the georeferenced centroid of each blob in the mask.

    Reads OUTPUT_DIR/mask_georef.tif, polygonizes each label, merges
    multi-part blobs, and writes blob_id/x/y to OUTPUT_DIR/centroids.csv
    (coordinates in the raster's CRS).
    """
    GEO_PATH = os.path.join(OUTPUT_DIR, "mask_georef.tif")
    with rasterio.open(GEO_PATH) as src:
        mask = src.read(1)
        transform = src.transform

    labels = np.unique(mask)
    labels = labels[labels != 0]
    data = []

    # Generate polygons and their values
    shapes_gen = rasterio.features.shapes(mask, mask=(mask != 0), transform=transform)

    # Create a dict to collect polygons by label
    polygons_by_label = {}
    for geom, val in shapes_gen:
        if val == 0:
            continue
        polygons_by_label.setdefault(val, []).append(shape(geom))

    # For each label, merge polygons and get centroid
    for idx, label in enumerate(labels):
        yield f"Processing {idx + 1} out of {len(labels)}"
        polygons = polygons_by_label.get(label)
        if not polygons:
            continue
        # Merge polygons of the same label (if multiple parts)
        multi_poly = polygons[0]
        for poly in polygons[1:]:
            multi_poly = multi_poly.union(poly)
        centroid = multi_poly.centroid
        data.append({"blob_id": label, "x": centroid.x, "y": centroid.y})

    df = pd.DataFrame(data)
    COORD_PATH = os.path.join(OUTPUT_DIR, "centroids.csv")
    df.to_csv(COORD_PATH, index=False)
    yield f"Saved centroid coordinates of {len(labels)} blobs."


def georefTile(tile_coords, gcp_path):
    """Georeference the SAM mask tile into EPSG:3857 using shifted GCPs.

    The GCPs were digitized on the full map image, so their pixel positions
    are shifted by the tile's offset before applying them to the tile mask.

    Args:
        tile_coords: (xmin, ymin, xmax, ymax) pixel extent of the tile in
            the full image.
        gcp_path: CSV with mapX/mapY/sourceX/sourceY columns.
    """
    yield "Georeferencing SAM image.."
    MASK_TILE = os.path.join(OUTPUT_DIR, "mask.tif")
    TMP_TILE = os.path.join(OUTPUT_DIR, "mask_tmp.tif")
    MASK_TILE_GEO = os.path.join(OUTPUT_DIR, "mask_georef.tif")
    for f in [TMP_TILE, MASK_TILE_GEO]:
        if os.path.exists(f):
            os.remove(f)

    df = pd.read_csv(gcp_path)
    xmin, ymin, xmax, ymax = tile_coords
    xoff, yoff = xmin, ymin

    shifted_gcps = []
    for _, r in df.iterrows():
        # abs() on sourceY: GCP files store image rows as negative values
        # — presumably a QGIS-style convention; TODO confirm with the
        # GCP-export tool.
        shifted_gcps.append(
            gdal.GCP(
                float(r['mapX']), float(r['mapY']), 0,
                float(r['sourceX']) - xoff,
                abs(float(r['sourceY'])) - yoff,
            )
        )

    gdal.Translate(
        TMP_TILE, MASK_TILE,
        format="GTiff",
        GCPs=shifted_gcps,
        outputSRS="EPSG:3857",
    )
    gdal.Warp(
        MASK_TILE_GEO, TMP_TILE,
        dstSRS="EPSG:3857",
        resampleAlg="near",
        polynomialOrder=1,
        creationOptions=["COMPRESS=LZW"],
    )
    yield "Done."


def georefImg(image_path, gcp_path, user_crs):
    """Georeference the full map image into EPSG:3857 via a VRT.

    GCP map coordinates are given in *user_crs* and reprojected to Web
    Mercator before being attached to a VRT copy of the image, which is
    then warped to OUTPUT_DIR/georeferenced.tif.
    """
    TMP_FILE = os.path.join(OUTPUT_DIR, "tmp.tif")
    GEO_FILE = os.path.join(OUTPUT_DIR, "georeferenced.tif")
    VRT_FILE = os.path.join(OUTPUT_DIR, "vrt_file.vrt")
    for f in [TMP_FILE, GEO_FILE]:
        if os.path.exists(f):
            os.remove(f)

    yield "Read GCP points..."
    df = pd.read_csv(gcp_path)
    H, W, _ = img_shape(image_path)

    # Build GCPs as (mapX, mapY, sourceX, sourceY) tuples; sourceY is stored
    # negative in the CSV (see georefTile), hence abs().
    gcps = []
    for _, r in df.iterrows():
        gcps.append((
            float(r['mapX']),
            float(r['mapY']),
            float(r['sourceX']),
            abs(float(r['sourceY'])),
        ))

    yield "Transform GCP to user specified CRS..."
    # Transform GCP from user provided CRS to Web Mercator 3857
    transformer = Transformer.from_crs(f"epsg:{user_crs}", "epsg:3857", always_xy=True)
    gcps3857 = []
    for px, py, x, y in gcps:
        x3857, y3857 = transformer.transform(px, py)
        gcps3857.append(gdal.GCP(x3857, y3857, 0, x, y))

    yield "Apply GCP to the image..."
    # Apply GCP to the image via a VRT so the source file stays untouched.
    src_ds = gdal.Open(image_path)
    drv = gdal.GetDriverByName('VRT')
    vrt_ds = drv.CreateCopy(VRT_FILE, src_ds, 0)

    # Set the GCPs and spatial reference system
    srs3857 = osr.SpatialReference()
    srs3857.ImportFromEPSG(3857)
    vrt_ds.SetGCPs(gcps3857, srs3857.ExportToWkt())
    vrt_ds = None  # close vrt to save changes

    gdal.Warp(
        GEO_FILE, VRT_FILE,
        dstSRS="EPSG:3857",
        resampleAlg="near",
        polynomialOrder=1,
        creationOptions=["COMPRESS=LZW"],
        format='GTiff',
    )
    yield "The map is georeferenced."


def extractStreetNet(city_name, user_crs):
    """Download the OSM street network covering the georeferenced tile.

    Derives a bounding box (plus 100 m buffer) from mask_georef.tif,
    converts it to WGS84, fetches the OSM graph, and writes named street
    edges (reprojected to *user_crs*) to OUTPUT_DIR/osm_extract.geojson.
    """
    yield f"Extract OSM street network for {city_name}"
    MASK_TILE_GEO = os.path.join(OUTPUT_DIR, "mask_georef.tif")
    ds = gdal.Open(MASK_TILE_GEO)
    gt = ds.GetGeoTransform()
    width = ds.RasterXSize
    height = ds.RasterYSize
    minx = gt[0]
    maxy = gt[3]
    maxx = gt[0] + width * gt[1] + height * gt[2]
    miny = gt[3] + width * gt[4] + height * gt[5]

    # Add 100 meters buffer in all directions
    minx -= 100  # west
    maxx += 100  # east
    miny -= 100  # south
    maxy += 100  # north

    bbox = (maxy, miny, maxx, minx)
    # NOTE(review): mask_georef.tif is warped to EPSG:3857 by georefTile, but
    # this transformer assumes the raster extent is in user_crs — confirm that
    # user_crs is 3857 here, otherwise the bbox is reprojected incorrectly.
    transformer = Transformer.from_crs(f"EPSG:{user_crs}", "EPSG:4326", always_xy=True)
    north, south = transformer.transform(bbox[2], bbox[0])[1], transformer.transform(bbox[3], bbox[1])[1]
    east, west = transformer.transform(bbox[2], bbox[0])[0], transformer.transform(bbox[3], bbox[1])[0]
    bbox = (west, south, east, north)

    G = ox.graph_from_bbox(bbox, network_type='all')
    G_proj = ox.project_graph(G)
    edges = ox.graph_to_gdfs(G_proj, nodes=False, edges=True, fill_edge_geometry=True)
    edges_proj = edges.to_crs(epsg=user_crs)
    edges_proj = edges_proj[['osmid', 'name', 'geometry']]
    edges_proj = edges_proj[edges_proj['name'].notnull()]
    # OSM 'name' can be a list of alternatives; keep the first one.
    edges_proj['name'] = edges_proj['name'].apply(
        lambda x: x[0] if isinstance(x, list) and len(x) > 0 else x
    )

    OSM_PATH = os.path.join(OUTPUT_DIR, "osm_extract.geojson")
    edges_proj.to_file(OSM_PATH, driver="GeoJSON")
    yield "Done OSM extraction."
def fuzzyMatchHist(hist_dic, hist_th, tile_dict):
    """Fuzzy-match OCR results against a historic street-name list.

    Writes ``historic_matches_tile<N>.csv`` with the best historic match per
    blob, deletes blob images whose match score reaches *hist_th* (they need
    no manual annotation), then yields the result CSV path as a one-element
    list (run_inference treats list yields as file payloads).

    Args:
        hist_dic: CSV (no header) with one historic street name per line.
        hist_th: minimum token_sort_ratio score to auto-accept a match.
        tile_dict: dict with ``tile_path``; the first number in the path is
            used as the tile id in output filenames.
    """
    # Convert threshold to numeric
    hist_th = int(hist_th)

    # === Load Data ===
    hist_df = pd.read_csv(hist_dic, header=None, names=["hist_name"])
    OCR_PATH = os.path.join(OUTPUT_DIR, "ocr.csv")
    names_df = pd.read_csv(
        OCR_PATH,
        names=['blob_id', 'pred_text'],
        dtype={"blob_id": "int64", "pred_text": "string"},
    )
    historic_names = hist_df["hist_name"].dropna().astype(str).tolist()

    # === Fuzzy Match ===
    results = []
    for _, row in names_df.iterrows():
        ocr_name = row["pred_text"]
        if pd.isna(ocr_name):
            continue
        # Fix: extractOne returns None when historic_names is empty; the
        # original unpacked unconditionally and would raise TypeError.
        best = process.extractOne(ocr_name, historic_names, scorer=fuzz.token_sort_ratio)
        if best is None:
            continue
        best_match, best_score, _ = best
        results.append({
            "blob_id": row["blob_id"],
            "ocr_name": ocr_name,
            "best_hist_match": best_match,
            "match_score": best_score,
        })

    results_df = pd.DataFrame(results)

    # NOTE(review): this picks the FIRST digit run anywhere in the path, so a
    # numbered directory would shadow the tile number — confirm tile paths.
    tile = tile_dict["tile_path"]
    match = re.search(r'\d+', tile)
    tile_number = int(match.group())

    # === Save all results ===
    all_results_path = os.path.join(OUTPUT_DIR, f"historic_matches_tile{tile_number}.csv")
    results_df.to_csv(all_results_path, index=False)

    # === Filter for manual annotation ===
    # Confident matches don't need manual review: remove their blob images.
    manual_df = results_df[results_df["match_score"] >= hist_th]
    for blob_id in manual_df['blob_id']:
        # original blob
        orig_path = os.path.join(OUTPUT_DIR, "blobs", f"{blob_id}.png")
        if os.path.exists(orig_path):
            os.remove(orig_path)
        # marginalized blob
        margin_path = os.path.join(OUTPUT_DIR, "blobs", f"{blob_id}_margin.png")
        if os.path.exists(margin_path):
            os.remove(margin_path)

    yield "Historic fuzzy matching complete."
    yield [all_results_path]


def fuzzyMatch(score_th, tile_dict):
    """Match OCR'd blob names to nearby OSM streets.

    Joins blob centroids with OCR text, finds for each blob both the best
    Levenshtein match within 100 m (via best_street_match) and the
    geometrically closest OSM street, writes ``street_matches_tile<N>.csv``
    and an OSM WKT export CSV, deletes blob images whose match score reaches
    *score_th*, and finally yields ``[matches_csv, osm_csv]``.
    """
    COORD_PATH = os.path.join(OUTPUT_DIR, "centroids.csv")
    OCR_PATH = os.path.join(OUTPUT_DIR, "ocr.csv")

    coords_df = pd.read_csv(COORD_PATH)
    names_df = pd.read_csv(
        OCR_PATH,
        names=['blob_id', 'pred_text'],
        dtype={"blob_id": "int64", "pred_text": "string"},
    )
    merged_df = coords_df.merge(names_df, on="blob_id")
    gdf = gpd.GeoDataFrame(
        merged_df,
        geometry=gpd.points_from_xy(merged_df.x, merged_df.y),
        crs="EPSG:3857",
    )

    # Add lat lon to the blobs
    # Reproject temporarily to WGS84 for coordinates
    gdf_ll = gdf.to_crs(epsg=4326)
    # Add longitude/latitude columns to the original gdf
    gdf['lon'] = gdf_ll.geometry.x
    gdf['lat'] = gdf_ll.geometry.y

    OSM_PATH = os.path.join(OUTPUT_DIR, "osm_extract.geojson")
    osm_gdf = gpd.read_file(OSM_PATH, dtype={"name": "str"})
    # Drop the generic "strasse" suffix so fuzzy scores focus on the stem.
    osm_gdf["name"] = osm_gdf["name"].str.replace("strasse", "", case=False, regex=False)

    # Build spatial index for fast nearest lookup
    osm_sindex = osm_gdf.sindex
    yield "Process OSM candidates..."

    results = []
    for _, row in gdf.iterrows():
        geom = row.geometry
        if isinstance(geom, gpd.GeoSeries):
            geom = geom.iloc[0]

        # Levenshtein-based fuzzy matching
        match = best_street_match(geom, row['pred_text'], osm_gdf, max_distance=100)

        # Closest OSM street geometrically
        nearest_idx, nearest_dist = osm_sindex.nearest(geom, return_all=False, return_distance=True)
        # nearest_idx row 1 holds the tree (OSM) indices.
        closest_name = osm_gdf.name.iloc[nearest_idx[1]].values[0]

        results.append({
            "blob_id": row.blob_id,
            "lon": row.lon,
            "lat": row.lat,
            "blob_name": row.pred_text,
            "best_osm_match": match[0] if match else None,
            "osm_match_score": match[1] if match else 0,
            "closest_osm_street": closest_name,
            "closest_osm_distance_m": nearest_dist[0],
        })

    results_df = pd.DataFrame(results)

    # Save results
    # NOTE(review): first digit run anywhere in the path — see fuzzyMatchHist.
    tile = tile_dict["tile_path"]
    match = re.search(r'\d+', tile)
    tile_number = int(match.group())
    RES_PATH = os.path.join(OUTPUT_DIR, f"street_matches_tile{tile_number}.csv")
    results_df.to_csv(RES_PATH, index=False)

    # Export OSM layer as CSV (WGS84, geometry as WKT)
    osm_gdf = osm_gdf.to_crs(epsg=4326)
    OSM_CSV_PATH = os.path.join(OUTPUT_DIR, f"osm_extract_tile{tile_number}.csv")
    osm_export_df = osm_gdf[["name", "geometry"]].copy()
    osm_export_df["geometry"] = osm_export_df["geometry"].apply(lambda g: g.wkt)
    osm_export_df.to_csv(OSM_CSV_PATH, index=False)

    # Remove blobs above score threshold — they are confidently matched and
    # need no manual annotation.
    manual_df = results_df[results_df['osm_match_score'] >= int(score_th)]
    for blob_id in manual_df['blob_id']:
        orig_path = os.path.join(OUTPUT_DIR, "blobs", f"{blob_id}.png")
        if os.path.exists(orig_path):
            os.remove(orig_path)
        margin_path = os.path.join(OUTPUT_DIR, "blobs", f"{blob_id}_margin.png")
        if os.path.exists(margin_path):
            os.remove(margin_path)

    yield [RES_PATH, OSM_CSV_PATH]