diff --git a/Dockerfile b/Dockerfile
new file mode 100644
index 0000000..cc7897a
--- /dev/null
+++ b/Dockerfile
@@ -0,0 +1,32 @@
+FROM pytorch/pytorch:2.1.2-cuda11.8-cudnn8-runtime
+
+ENV DEBIAN_FRONTEND=noninteractive
+
+# Install system dependencies
+RUN apt-get update && apt-get install -y \
+    build-essential \
+    curl \
+    software-properties-common \
+    git \
+    wget \
+    && rm -rf /var/lib/apt/lists/*
+
+# Set working directory
+WORKDIR /opt/program
+
+# Copy environment file
+COPY environment.yml .
+
+# Create conda environment
+RUN conda env create -f environment.yml && \
+    conda clean -afy
+
+# Copy the model code
+COPY . .
+
+# Set environment variables
+ENV PYTHONPATH=/opt/program
+ENV OPENBLAS_NUM_THREADS=1
+
+# Use the startup script as entrypoint
+ENTRYPOINT ["./start_api.sh"]
\ No newline at end of file
diff --git a/README.md b/README.md
index c7bf052..051f4a7 100644
--- a/README.md
+++ b/README.md
@@ -166,3 +166,78 @@ This repository benefits from the following open-source work. We thank the autho
 3. [Frame Field Learning](https://github.com/Lydorn/Polygonization-by-Frame-Field-Learning)
 4. [PolyWorld](https://github.com/zorzi-s/PolyWorldPretrainedNetwork)
 5. [HiSup](https://github.com/SarahwXU/HiSup)
+
+## Docker Usage
+
+Pix2Poly provides a Docker setup for easy deployment and inference. The Docker container includes a FastAPI server for REST API inference and also supports command-line inference. The request and response format is compatible with an AWS SageMaker inference endpoint; on an ml.g4dn.xlarge instance with inference AMI version al2-ami-sagemaker-inference-gpu-3-1, inference runs at roughly 5-10 seconds per tile.
+
+### Building the Docker Image
+
+```bash
+docker buildx build --platform linux/amd64 -t pix2poly .
+```
+
+### Running the API Server
+
+The Docker container automatically starts a FastAPI server on port 8080. You can run it with:
+
+```bash
+docker run -p 8080:8080 pix2poly
+```
+
+On first startup the API server automatically downloads the pretrained model files, then provides the following endpoints:
+
+- `POST /invocations` - Main inference endpoint for processing images
+- `GET /ping` - Health check endpoint
+
+#### API Usage
+
+The `/invocations` endpoint accepts images in multiple formats:
+
+1. **File Upload (multipart/form-data):**
+```bash
+curl -X POST "http://localhost:8080/invocations" \
+  -H "Content-Type: multipart/form-data" \
+  -F "file=@your_image.jpg"
+```
+
+2. **Base64 Encoded Image:**
+```bash
+curl -X POST "http://localhost:8080/invocations" \
+  -H "Content-Type: application/json" \
+  -d '{"image": "base64_encoded_image_data"}'
+```
+
+3. **Raw Image Data:**
+```bash
+curl -X POST "http://localhost:8080/invocations" \
+  -H "Content-Type: image/jpeg" \
+  --data-binary @your_image.jpg
+```
+
+The API returns JSON with the detected polygons and the name of the model that produced them:
+
+```text
+{
+  "polygons": [
+    [[x1, y1], [x2, y2], ...],
+    ...
+  ],
+  "model_name": "Pix2Poly_inria_coco_224"
+}
+```
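+
+The endpoint also accepts optional tuning parameters, either as query string values or as extra JSON fields: `model_name`, `merge_tolerance` (pixels, non-negative), and `tile_overlap_ratio` (0.0-1.0). A minimal Python client sketch using `requests` (the file name and API key below are placeholders):
+
+```python
+import base64
+import requests
+
+# Base64-encode the image, matching the JSON payload format shown above.
+with open("your_image.jpg", "rb") as f:
+    payload = {"image": base64.b64encode(f.read()).decode("ascii")}
+
+response = requests.post(
+    "http://localhost:8080/invocations",
+    json=payload,
+    # headers={"X-API-Key": "your_secret_key"},  # only needed if API_KEY is set
+)
+response.raise_for_status()
+result = response.json()
+print(f"{len(result['polygons'])} polygons from model {result['model_name']}")
+```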
+
+### Environment Variables
+
+You can customize the Docker container behavior with these environment variables:
+
+- `MODEL_URL`: URL to download the pretrained model files (default: `https://github.com/safelease/Pix2Poly/releases/download/main/runs_share.zip`)
+- `API_KEY`: Optional API key for authentication (if not set, authentication is disabled)
+
+Example with custom configuration:
+```bash
+docker run -p 8080:8080 \
+  -e MODEL_URL=https://github.com/safelease/Pix2Poly/releases/download/main/runs_share.zip \
+  -e API_KEY=your_secret_key \
+  pix2poly
+```
+
diff --git a/api.py b/api.py
new file mode 100644
index 0000000..8ebb711
--- /dev/null
+++ b/api.py
@@ -0,0 +1,356 @@
+import os
+import json
+import hashlib
+import tempfile
+from fastapi import FastAPI, UploadFile, HTTPException, Request, Depends, Query
+from fastapi.responses import JSONResponse
+from fastapi.middleware.cors import CORSMiddleware
+from fastapi.security import APIKeyHeader
+import uvicorn
+from contextlib import asynccontextmanager
+import base64
+from typing import Optional
+import requests
+import shutil
+from pathlib import Path
+from diskcache import Cache
+import re
+
+from polygon_inference import PolygonInference
+from utils import log
+
+# API Key configuration
+API_KEY_NAME = "X-API-Key"
+api_key_header = APIKeyHeader(name=API_KEY_NAME, auto_error=False)
+
+# Get API key from environment variable
+API_KEY = os.getenv("API_KEY")
+MODEL_URL = os.getenv("MODEL_URL", "https://github.com/safelease/Pix2Poly/releases/download/main/runs_share.zip")
+
+# Default model name (inria dataset)
+DEFAULT_MODEL_NAME = "Pix2Poly_inria_coco_224"
+
+# Cache configuration
+CACHE_TTL = int(os.getenv("CACHE_TTL", 24 * 3600))  # 24 hours
+
+# Global cache instance
+cache = Cache(
+    directory=os.path.join(tempfile.gettempdir(), "pix2poly_cache"),
+    timeout=1,  # 1 second timeout for cache operations
+    disk_min_file_size=0,  # Store all items on disk
+    disk_pickle_protocol=4,  # Use protocol 4 for better compatibility
+)
+
+def get_cache_key(image_data: bytes, model_name: Optional[str] = None, merge_tolerance: Optional[float] = None, tile_overlap_ratio: Optional[float] = None) -> str:
+    """Generate a cache key from image data and parameters.
+
+    Args:
+        image_data: Raw image data
+        model_name: Model name being used
+        merge_tolerance: Merge tolerance parameter
+        tile_overlap_ratio: Tile overlap ratio parameter
+
+    Returns:
+        SHA-256 hash of the image data, suffixed with the parameter values
+    """
+    image_hash = hashlib.sha256(image_data).hexdigest()
+    return f"{image_hash}_{model_name}_{merge_tolerance}_{tile_overlap_ratio}"
+
+
+def validate_model_name(model_name: str) -> bool:
+    """Validate that the model name contains only safe characters.
+
+    Args:
+        model_name: The model name to validate
+
+    Returns:
+        True if the model name is valid, False otherwise
+    """
+    # Allow alphanumeric characters, underscores, and hyphens
+    return bool(re.match(r'^[a-zA-Z0-9_-]+$', model_name))
+
+
+async def verify_api_key(
+    header_key: Optional[str] = Depends(api_key_header),
+    query_key: Optional[str] = Query(None, alias="api_key"),
+) -> Optional[str]:
+    """Verify the API key from either header or query parameter.
+
+    If API authentication is not enabled (no API key configured),
+    this function will always return None.
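+    When both are supplied, the header value takes precedence, since
+    ``header_key or query_key`` short-circuits on the first non-empty value.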
+ + Args: + header_key: API key from X-API-Key header + query_key: API key from api_key query parameter + + Returns: + The verified API key or None if authentication is disabled + + Raises: + HTTPException: 401 if API key is missing (when required) + HTTPException: 403 if API key is invalid (when required) + """ + if not API_KEY: + return None + + api_key = header_key or query_key + if not api_key: + raise HTTPException(status_code=401, detail="API key is missing") + if api_key != API_KEY: + raise HTTPException(status_code=403, detail="Invalid API key") + return api_key + + +def download_model_files(model_url: str, target_dir: str) -> str: + """Download model files to the target directory. + + Args: + model_url: URL to download the model files from + target_dir: Directory to save the model files to + + Returns: + Path to the downloaded model directory + + Raises: + ValueError: If download fails or model files are invalid + """ + # Create target directory if it doesn't exist + target_path = Path(target_dir) + target_path.mkdir(parents=True, exist_ok=True) + + # Check if model files already exist + if target_path.exists() and any(target_path.iterdir()): + log(f"Model files already exist in {target_dir}, skipping download", "INFO") + return str(target_path) + + # Download the model files using requests + zip_path = target_path / "runs_share.zip" + + log(f"Downloading model files from {model_url}", "INFO") + response = requests.get(model_url, stream=True) + response.raise_for_status() + + with open(zip_path, 'wb') as f: + for chunk in response.iter_content(chunk_size=8192): + f.write(chunk) + + # Extract the zip file + log(f"Extracting model files to {target_dir}", "INFO") + shutil.unpack_archive(zip_path, target_path) + + # Remove the zip file + zip_path.unlink() + + return str(target_path) + + +@asynccontextmanager +async def lifespan(app: FastAPI): + """Initialize the predictor on startup.""" + global model_dir + + # Download model files to a temporary directory + model_dir = download_model_files( + MODEL_URL, + "/tmp/pix2poly_model", + ) + + # Initialize predictor with downloaded model using the default model name + init_predictor(os.path.join(model_dir, "runs_share", DEFAULT_MODEL_NAME), DEFAULT_MODEL_NAME) + yield + + +app = FastAPI( + title="Polygon Inference API", + description="API for inferring polygons in images using a trained model", + version="1.0.0", + lifespan=lifespan, +) + +# Add CORS middleware +app.add_middleware( + CORSMiddleware, + allow_origins=["*"], # Allows all origins + allow_credentials=True, + allow_methods=["*"], # Allows all methods + allow_headers=["*"], # Allows all headers +) + +# Global predictor instance and current model tracking +predictor = None +current_model_name = None +model_dir = None + + +def init_predictor(experiment_path: str, model_name: str = None): + """Initialize the global predictor instance.""" + global predictor, current_model_name + if predictor is None or current_model_name != model_name: + predictor = PolygonInference(experiment_path) + current_model_name = model_name + log(f"Loaded model: {model_name}", "INFO") + + +def load_model(model_name: str): + """Load a specific model by name. 
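+    Reloading is skipped when ``model_name`` already matches the currently
+    loaded model, so repeated requests for the same model are cheap.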
+ + Args: + model_name: The name of the model to load (e.g., "Pix2Poly_inria_coco_224") + + Raises: + HTTPException: If model name is invalid or model files don't exist + """ + global predictor, current_model_name, model_dir + + log(f"Using model: {model_name}") + + if not validate_model_name(model_name): + raise HTTPException(status_code=400, detail="Invalid model name. Only alphanumeric characters, underscores, and hyphens are allowed.") + + # Skip reloading if it's the same model + if current_model_name == model_name and predictor is not None: + return + + # Construct the full experiment path + experiment_path = os.path.join(model_dir, "runs_share", model_name) + + # Check if the model directory exists + if not os.path.exists(experiment_path): + raise HTTPException(status_code=404, detail=f"Model '{model_name}' not found in downloaded model files") + + # Initialize the predictor with the new model + init_predictor(experiment_path, model_name) + + +@app.post("/invocations") +async def invoke( + request: Request, + file: UploadFile = None, + api_key: Optional[str] = Depends(verify_api_key), + merge_tolerance: Optional[float] = Query(None, description="Tolerance for point-in-polygon tests during validation (in pixels, allows points to be slightly outside)"), + tile_overlap_ratio: Optional[float] = Query(None, description="Overlap ratio between tiles (0.0 = no overlap, 1.0 = complete overlap)"), + model_name: Optional[str] = Query(None, description="Name of the model to use (e.g., 'Pix2Poly_inria_coco_224')"), +): + """Main inference endpoint for processing images. + + The endpoint accepts image data in three different ways: + 1. As a file upload using multipart/form-data (via the file parameter) + 2. As a base64-encoded image in a JSON payload with an 'image' field + 3. As raw image data in the request body + + Authentication can be provided in two ways: + 1. Via the X-API-Key header + 2. Via the api_key query parameter + + Configuration parameters can be provided in two ways: + 1. Via query parameters (merge_tolerance, tile_overlap_ratio, model_name) + 2. 
Via the JSON payload fields (merge_tolerance, tile_overlap_ratio, model_name)
+
+    Args:
+        request: The request containing the image data
+        file: Optional uploaded file (multipart/form-data)
+        api_key: Optional API key for authentication (required only if API key is configured)
+        merge_tolerance: Optional tolerance for point-in-polygon tests during validation (in pixels, allows points to be slightly outside)
+        tile_overlap_ratio: Optional overlap ratio between tiles (0.0 = no overlap, 1.0 = complete overlap)
+        model_name: Optional name of the model to use (e.g., 'Pix2Poly_inria_coco_224')
+
+    Returns:
+        JSON response containing the inferred polygons
+
+    Raises:
+        HTTPException: 400 if no image data is found in the request
+        HTTPException: 404 if the specified model is not found
+        HTTPException: 500 if there is an error processing the image
+        HTTPException: 401 if API key is missing (when API key is configured)
+        HTTPException: 403 if API key is invalid (when API key is configured)
+    """
+    log("Invoking image analysis")
+
+    # Initialize configuration parameters and validate ranges
+    effective_merge_tolerance = merge_tolerance
+    effective_tile_overlap_ratio = tile_overlap_ratio
+    effective_model_name = model_name or DEFAULT_MODEL_NAME
+
+    # Validate merge_tolerance (must be non-negative)
+    if effective_merge_tolerance is not None and effective_merge_tolerance < 0:
+        raise HTTPException(status_code=400, detail="merge_tolerance must be non-negative")
+
+    # Validate tile_overlap_ratio (should be between 0.0 and 1.0)
+    if effective_tile_overlap_ratio is not None and (effective_tile_overlap_ratio < 0.0 or effective_tile_overlap_ratio > 1.0):
+        raise HTTPException(status_code=400, detail="tile_overlap_ratio must be between 0.0 and 1.0")
+
+    if file:
+        # Handle file upload
+        image_data = await file.read()
+    else:
+        # Read request body
+        body = await request.body()
+
+        # Parse the request body
+        try:
+            data = json.loads(body)
+            if "image" in data:
+                # Handle base64 encoded image
+                image_data = base64.b64decode(data["image"])
+
+                # Extract configuration parameters from JSON (if query params not provided)
+                if effective_merge_tolerance is None and "merge_tolerance" in data:
+                    effective_merge_tolerance = float(data["merge_tolerance"])
+                    if effective_merge_tolerance < 0:
+                        raise HTTPException(status_code=400, detail="merge_tolerance must be non-negative")
+                if effective_tile_overlap_ratio is None and "tile_overlap_ratio" in data:
+                    effective_tile_overlap_ratio = float(data["tile_overlap_ratio"])
+                    if effective_tile_overlap_ratio < 0.0 or effective_tile_overlap_ratio > 1.0:
+                        raise HTTPException(status_code=400, detail="tile_overlap_ratio must be between 0.0 and 1.0")
+                if model_name is None and "model_name" in data:
+                    effective_model_name = str(data["model_name"])
+            else:
+                raise HTTPException(
+                    status_code=400, detail="No image data found in request"
+                )
+        except (json.JSONDecodeError, UnicodeDecodeError):
+            # Body is not JSON (non-UTF-8 binary bodies raise UnicodeDecodeError,
+            # not JSONDecodeError): treat it as raw image data
+            image_data = body
+
+    # Load the requested model (this will only reload if it's different from the current model)
+    load_model(effective_model_name)
+
+    # Generate cache key including all configuration parameters
+    cache_key = get_cache_key(image_data, effective_model_name, effective_merge_tolerance, effective_tile_overlap_ratio)
+    cached_result = cache.get(cache_key)
+
+    if cached_result is not None:
+        return JSONResponse(content=cached_result)
+
+    # Get inferences
+    polygons = predictor.infer(image_data, merge_tolerance=effective_merge_tolerance, 
tile_overlap_ratio=effective_tile_overlap_ratio) + + # Prepare response + response = { + "polygons": polygons, + "model_name": effective_model_name, + } + + # Store result in cache + cache.set(cache_key, response, expire=CACHE_TTL) + + return JSONResponse(content=response) + +@app.get("/ping") +async def ping(api_key: Optional[str] = Depends(verify_api_key)): + """Health check endpoint to verify service status.""" + if predictor is None: + raise HTTPException(status_code=503, detail="Model not loaded") + return {"status": "healthy"} + + +@app.get("/clear-cache") +async def clear_cache(api_key: Optional[str] = Depends(verify_api_key)): + """Clear the cache endpoint to remove all cached results.""" + cache.clear() + return {"status": "success", "message": "Cache cleared successfully"} + + +if __name__ == "__main__": + # Run the API + uvicorn.run(app, host="0.0.0.0", port=8080) diff --git a/config.py b/config.py index f63a61b..0c2ddf5 100644 --- a/config.py +++ b/config.py @@ -56,6 +56,28 @@ class CFG: perm_loss_weight = 10.0 SHUFFLE_TOKENS = False # order gt vertex tokens randomly every time + # Tiling configuration + TILE_SIZE = IMG_SIZE + TILE_OVERLAP = 34 + + # Polygon filtering configuration + # MIN_POLYGON_AREA: Minimum area in square pixels for a polygon to be considered valid + # Conversion: 100 sq ft ≈ 9.29 sq meters + # Since 1 pixel = 0.3m, 1 sq pixel = 0.09 sq meters + # Therefore, 9.29 sq meters ≈ 103 sq pixels + MIN_POLYGON_AREA = 103 + + # POLYGON_SIMPLIFICATION_TOLERANCE: Maximum distance in pixels that a point can be moved during polygon simplification + # A pixel is 0.3m, so 2 pixels is 0.6m, or 2 feet, which should be of no consequence + POLYGON_SIMPLIFICATION_TOLERANCE = 2 + + # Prediction configuration + PREDICTION_BATCH_SIZE = 8 # Batch size for processing tiles during prediction + + # Polygon validation configuration + MERGE_TOLERANCE = 2 # Tolerance for point-in-polygon tests during validation (in pixels, allows points to be slightly outside) + TILE_OVERLAP_RATIO = 0.5 # Overlap ratio between tiles (0.0 = no overlap, 1.0 = complete overlap) + BATCH_SIZE = 24 # batch size per gpu; effective batch size = BATCH_SIZE * NUM_GPUs START_EPOCH = 0 NUM_EPOCHS = 500 @@ -65,7 +87,7 @@ class CFG: SAVE_EVERY = 10 VAL_EVERY = 1 - MODEL_NAME = f'vit_small_patch{PATCH_SIZE}_{INPUT_SIZE}_dino' + MODEL_NAME = f'vit_small_patch{PATCH_SIZE}_{INPUT_SIZE}.dino' NUM_PATCHES = int((INPUT_SIZE // PATCH_SIZE) ** 2) LR = 4e-4 diff --git a/environment.yml b/environment.yml new file mode 100644 index 0000000..2aec210 --- /dev/null +++ b/environment.yml @@ -0,0 +1,34 @@ +name: pix2poly +channels: + - conda-forge + - pytorch + - nvidia +dependencies: + - python=3.11 + - timm=0.9.12 + - transformers=4.32.1 + - pycocotools>=2.0.6 + - torchmetrics=1.2.1 + - tensorboard=2.15.1 + - buildingregulariser>=0.2.2 + - geopandas=1.1.1 + - pip + - pip: + - torch==2.1.2 + - torchvision==0.16.2 + - torchaudio==2.1.2 + - albumentations==1.3.1 + - imageio==2.33.1 + - matplotlib-inline==0.1.6 + - opencv-python-headless==4.8.1.78 + - scikit-image==0.22.0 + - scikit-learn==1.3.2 + - scipy==1.11.4 + - shapely==2.0.4 + - fastapi>=0.68.0 + - uvicorn>=0.15.0 + - python-multipart>=0.0.5 + - tqdm>=4.62.0 + - diskcache>=5.6.0 + - huggingface-hub>=0.15.1,<1.0 + \ No newline at end of file diff --git a/infer_single_image.py b/infer_single_image.py new file mode 100644 index 0000000..5454619 --- /dev/null +++ b/infer_single_image.py @@ -0,0 +1,72 @@ +import os +import json +import numpy as np +import cv2 +import 
matplotlib.pyplot as plt
+import argparse
+import sys
+
+from polygon_inference import PolygonInference
+from utils import log
+
+parser = argparse.ArgumentParser()
+parser.add_argument("-e", "--experiment_path", required=True, help="path to experiment folder to evaluate")
+args = parser.parse_args()
+
+def main():
+    # Load image from stdin
+    image_data = sys.stdin.buffer.read()
+
+    # Initialize inference
+    inference = PolygonInference(args.experiment_path)
+
+    # Get inference results
+    polygons_list = inference.infer(image_data, debug=True)
+
+    # Decode image for visualization
+    nparr = np.frombuffer(image_data, np.uint8)
+    image = cv2.imdecode(nparr, cv2.IMREAD_COLOR)
+    if image is None:
+        log("Failed to load image from stdin", "ERROR")
+        return
+
+    # Get image dimensions
+    height, width = image.shape[:2]
+
+    # Create figure with exact image dimensions
+    plt.figure(figsize=(width/100, height/100), dpi=100)
+
+    # Plot merged result
+    vis_image_merged = image.copy()
+    formatted_contours = [np.array(cnt).reshape(-1, 1, 2).astype(np.int32) for cnt in polygons_list]
+    cv2.drawContours(vis_image_merged, formatted_contours, -1, (0, 255, 0), 1)
+
+    # Draw dots at vertices for merged result
+    for contour in formatted_contours:
+        for point in contour:
+            x, y = point[0]
+            # Draw 2x2 red square.
+            y_min = max(0, y-1)
+            y_max = min(height, y+1)
+            x_min = max(0, x-1)
+            x_max = min(width, x+1)
+            vis_image_merged[y_min:y_max, x_min:x_max] = [255, 0, 0]
+
+    # Convert BGR to RGB for correct display in matplotlib
+    vis_image_merged_rgb = cv2.cvtColor(vis_image_merged, cv2.COLOR_BGR2RGB)
+    plt.imshow(vis_image_merged_rgb)
+    plt.axis('off')
+    plt.subplots_adjust(left=0, right=1, top=1, bottom=0)
+
+    # Save visualization
+    output_path = "visualization.png"
+    plt.savefig(output_path, dpi=100, bbox_inches='tight', pad_inches=0)
+    plt.close()
+
+    log(f"Saved main visualization to {output_path}")
+
+    # Print polygons to stdout
+    print(json.dumps(polygons_list))
+
+if __name__ == "__main__":
+    main()
\ No newline at end of file
diff --git a/models/model.py b/models/model.py
index db396cb..5233679 100644
--- a/models/model.py
+++ b/models/model.py
@@ -11,6 +11,7 @@ from config import CFG
 from utils import (
     create_mask,
+    log
 )
 
 
@@ -128,7 +129,7 @@ def __init__(self, cfg, vocab_size, encoder_len, dim, num_heads, num_layers):
     def init_weights(self):
         for name, p in self.named_parameters():
             if 'encoder_pos_embed' in name or 'decoder_pos_embed' in name:
-                print(f"Skipping initialization of pos embed layers...")
+                log("Skipping initialization of pos embed layers...")
                 continue
             if p.dim() > 1:
                 nn.init.xavier_uniform_(p)
@@ -269,16 +270,15 @@ def predict(self, image, tgt):
     with torch.no_grad():
         for i in range(1 + n_vertices*2):
             try:
-                print(i)
+                log(f"Iteration {i}")
                 preds_p, feats_p = model.predict(image, batch_preds)
-                # print(preds_p.shape, feats_p.shape)
                 if i % 2 == 0:
                     confs_ = torch.softmax(preds_p, dim=-1).sort(axis=-1, descending=True)[0][:, 0].cpu()
                     confs.append(confs_)
                 preds_p = sample(preds_p)
                 batch_preds = torch.cat([batch_preds, preds_p], dim=1)
             except:
-                print(f"Error at iteration: {i}")
+                log(f"Error at iteration: {i}")
 
     perm_pred = model.scorenet(feats_p)
 
     # Postprocessing.
@@ -302,18 +302,18 @@ def predict(self, image, tgt):
     out_coords.extend(all_coords)
     out_confs.extend(out_confs)
 
-    print(f"preds_f shape: {preds_f.shape}")
-    print(f"preds_f grad: {preds_f.requires_grad}")
-    print(f"preds_f min: {preds_f.min()}, max: {preds_f.max()}")
+    log(f"preds_f shape: {preds_f.shape}")
+    log(f"preds_f grad: {preds_f.requires_grad}")
+    log(f"preds_f min: {preds_f.min()}, max: {preds_f.max()}")
 
-    print(f"perm_mat shape: {perm_mat.shape}")
-    print(f"perm_mat grad: {perm_mat.requires_grad}")
-    print(f"perm_mat min: {perm_mat.min()}, max: {preds_f.max()}")
+    log(f"perm_mat shape: {perm_mat.shape}")
+    log(f"perm_mat grad: {perm_mat.requires_grad}")
+    log(f"perm_mat min: {perm_mat.min()}, max: {perm_mat.max()}")
 
-    print(f"batch_preds shape: {batch_preds.shape}")
-    print(f"batch_preds grad: {batch_preds.requires_grad}")
-    print(f"batch_preds min: {batch_preds.min()}, max: {batch_preds.max()}")
+    log(f"batch_preds shape: {batch_preds.shape}")
+    log(f"batch_preds grad: {batch_preds.requires_grad}")
+    log(f"batch_preds min: {batch_preds.min()}, max: {batch_preds.max()}")
 
-    print(f"loss : {loss}")
-    print(f"loss grad: {loss.requires_grad}")
+    log(f"loss : {loss}")
+    log(f"loss grad: {loss.requires_grad}")
diff --git a/polygon_inference.py b/polygon_inference.py
new file mode 100644
index 0000000..d0daa8d
--- /dev/null
+++ b/polygon_inference.py
@@ -0,0 +1,1075 @@
+# Standard library imports
+import os
+import time
+import hashlib
+import pickle
+import copy
+from typing import List, Tuple, Dict, Optional, Union, Any
+
+# Third-party imports
+import numpy as np
+import numpy.typing as npt
+import cv2
+import torch
+import albumentations as A
+from albumentations.pytorch import ToTensorV2
+from shapely.geometry import Polygon
+from shapely.validation import make_valid
+from buildingregulariser import regularize_geodataframe
+import geopandas as gpd
+
+import matplotlib.pyplot as plt
+import math
+
+# Local imports
+from config import CFG
+from tokenizer import Tokenizer
+from utils import (
+    seed_everything,
+    test_generate,
+    postprocess,
+    permutations_to_polygons,
+    log,
+    calculate_slice_bboxes,
+)
+from models.model import Encoder, Decoder, EncoderDecoder
+
+# Type aliases for better readability
+PolygonArray = npt.NDArray[np.floating[Any]]
+TilePosition = Tuple[int, int, int, int]  # (x, y, x_end, y_end)
+TileResult = Dict[str, Union[List[PolygonArray], List[bool]]]
+Point2D = Tuple[float, float]
+BoundingBox = Tuple[float, float, float, float]  # (x_min, y_min, x_max, y_max)
+
+
+class PolygonInference:
+    def __init__(self, experiment_path: str, device: Optional[str] = None) -> None:
+        """Initialize the polygon inference with a trained model.
+
+        Args:
+            experiment_path (str): Path to the experiment folder containing the model checkpoint
+            device (str | None, optional): Device to run the model on.
Defaults to CFG.DEVICE + """ + self.device: str = device or CFG.DEVICE + self.experiment_path: str = os.path.realpath(experiment_path) + self.model: Optional[EncoderDecoder] = None + self.tokenizer: Optional[Tokenizer] = None + self.cache_dir: str = "/tmp/pix2poly_cache" + # Extract descriptive model name from experiment path (e.g., "Pix2Poly_inria_coco_224") + self.model_display_name: str = os.path.basename(self.experiment_path) + self.model_cfg: Optional[Any] = None # Store adapted configuration + self._ensure_cache_dir() + self._initialize_model() + + def _ensure_cache_dir(self) -> None: + """Ensure the cache directory exists.""" + os.makedirs(self.cache_dir, exist_ok=True) + + def _generate_cache_key(self, tiles: List[npt.NDArray[np.uint8]]) -> str: + """Generate a cache key based on the input tiles and model. + + Args: + tiles (List[npt.NDArray[np.uint8]]): List of tile images + + Returns: + str: Hash-based cache key + """ + # Create a hash based on all tile data and model identifier + hasher: hashlib.sha256 = hashlib.sha256() + # Include model experiment path to make cache model-specific + hasher.update(self.experiment_path.encode('utf-8')) + for tile in tiles: + hasher.update(tile.tobytes()) + return hasher.hexdigest() + + def _get_cache_path(self, cache_key: str) -> str: + """Get the full path for a cache file. + + Args: + cache_key (str): The cache key + + Returns: + str: Full path to the cache file + """ + return os.path.join(self.cache_dir, f"{cache_key}.pkl") + + def _load_from_cache(self, cache_key: str) -> Optional[List[TileResult]]: + """Load results from cache if they exist. + + Args: + cache_key (str): The cache key to look for + + Returns: + Optional[List[TileResult]]: Cached results if found, None otherwise + """ + cache_path: str = self._get_cache_path(cache_key) + if os.path.exists(cache_path): + try: + with open(cache_path, 'rb') as f: + cached_data: Any = pickle.load(f) + return cached_data + except Exception as e: + log(f"Failed to load cache from {cache_path}: {e}") + # Remove corrupted cache file + try: + os.remove(cache_path) + except: + pass + return None + + def _save_to_cache(self, cache_key: str, results: List[TileResult]) -> None: + """Save results to cache. + + Args: + cache_key (str): The cache key + results (List[TileResult]): Results to cache + """ + cache_path: str = self._get_cache_path(cache_key) + try: + with open(cache_path, 'wb') as f: + pickle.dump(results, f) + except Exception as e: + log(f"Failed to save cache to {cache_path}: {e}") + + def _check_polygon_overlap(self, poly1: PolygonArray, poly2: PolygonArray) -> bool: + """Check if two polygons overlap using Shapely. + + Args: + poly1 (PolygonArray): First polygon as array of [x, y] coordinates + poly2 (PolygonArray): Second polygon as array of [x, y] coordinates + + Returns: + bool: True if polygons overlap (intersect but don't just touch) + """ + try: + # Convert numpy arrays to Shapely polygons + if len(poly1) < 3 or len(poly2) < 3: + return False + + shapely_poly1: Polygon = Polygon(poly1) + shapely_poly2: Polygon = Polygon(poly2) + + # Check if polygons are valid + if not shapely_poly1.is_valid or not shapely_poly2.is_valid: + return False + + # Check for intersection (but not just touching) + return shapely_poly1.intersects(shapely_poly2) and not shapely_poly1.touches(shapely_poly2) + except: + return False + + def _calculate_polygon_area(self, poly: PolygonArray) -> float: + """Calculate the area of a polygon. 
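+        Uses Shapely's ``Polygon.area`` (effectively the shoelace formula);
+        the unit square ``[(0, 0), (1, 0), (1, 1), (0, 1)]``, for example,
+        yields ``1.0``.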
+ + Args: + poly (PolygonArray): Polygon as array of [x, y] coordinates + + Returns: + float: Area of the polygon, 0 if invalid + """ + try: + if len(poly) < 3: + return 0.0 + shapely_poly: Polygon = Polygon(poly) + if not shapely_poly.is_valid: + return 0.0 + return float(shapely_poly.area) + except: + return 0.0 + + def _is_edge_near_tile_boundary( + self, + p1: Point2D, + p2: Point2D, + tile_bounds: BoundingBox, + tolerance: float = 2.0 + ) -> bool: + """Check if an edge is colinear with the tile boundary within tolerance. + + Args: + p1 (Point2D): First point of the edge + p2 (Point2D): Second point of the edge + tile_bounds (BoundingBox): Tile boundaries as (x_min, y_min, x_max, y_max) + tolerance (float): Tolerance for boundary detection in pixels + + Returns: + bool: True if edge is near a tile boundary + """ + x_min, y_min, x_max, y_max = tile_bounds + x1, y1 = p1 + x2, y2 = p2 + + # Check if edge is roughly horizontal and colinear with top boundary + if (abs(y1 - y_min) <= tolerance and abs(y2 - y_min) <= tolerance and + abs(y1 - y2) <= tolerance): + return True + + # Check if edge is roughly horizontal and colinear with bottom boundary + if (abs(y1 - y_max) <= tolerance and abs(y2 - y_max) <= tolerance and + abs(y1 - y2) <= tolerance): + return True + + # Check if edge is roughly vertical and colinear with left boundary + if (abs(x1 - x_min) <= tolerance and abs(x2 - x_min) <= tolerance and + abs(x1 - x2) <= tolerance): + return True + + # Check if edge is roughly vertical and colinear with right boundary + if (abs(x1 - x_max) <= tolerance and abs(x2 - x_max) <= tolerance and + abs(x1 - x2) <= tolerance): + return True + + return False + + def _generate_edge_sample_points( + self, + p1: Point2D, + p2: Point2D, + num_points: int = 10, + margin_px: float = 10.0 + ) -> List[Point2D]: + """Generate equally spaced points along an edge, leaving a fixed margin at each end. + Always generates at least one point in the center of the line. + + Args: + p1 (Point2D): Start point of the edge + p2 (Point2D): End point of the edge + num_points (int): Number of sample points to generate + margin_px (float): Margin in pixels to leave at each end + + Returns: + List[Point2D]: List of sample points along the edge + """ + # Calculate edge length + edge_length: float = math.sqrt((p2[0] - p1[0])**2 + (p2[1] - p1[1])**2) + + # Always generate center point + center_x: float = p1[0] + 0.5 * (p2[0] - p1[0]) + center_y: float = p1[1] + 0.5 * (p2[1] - p1[1]) + + # If edge is too short to accommodate margins, return just the center point + if edge_length <= 2 * margin_px: + return [(center_x, center_y)] + + # Calculate t values for the start and end of the usable region + t_start: float = margin_px / edge_length + t_end: float = 1.0 - margin_px / edge_length + + points: List[Point2D] = [] + + # If only one point requested, return center point + if num_points == 1: + return [(center_x, center_y)] + + # Generate points evenly spaced within the usable region + for i in range(num_points): + # Distribute points evenly within the usable region + t_local: float = i / (num_points - 1) + t: float = t_start + t_local * (t_end - t_start) + + x: float = p1[0] + t * (p2[0] - p1[0]) + y: float = p1[1] + t * (p2[1] - p1[1]) + points.append((x, y)) + + return points + + def _point_in_polygon( + self, + point: Point2D, + polygon: PolygonArray, + merge_tolerance: float + ) -> bool: + """Check if a point is inside a polygon using OpenCV. 
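+        ``cv2.pointPolygonTest`` with ``measureDist=True`` returns a signed
+        distance (positive inside, negative outside), so the check
+        ``distance >= -merge_tolerance`` accepts points up to
+        ``merge_tolerance`` pixels outside the boundary.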
+ + Args: + point (Point2D): Point to test + polygon (PolygonArray): Polygon as array of [x, y] coordinates + merge_tolerance (float): Tolerance for the point-in-polygon test + + Returns: + bool: True if point is inside the polygon within tolerance + """ + if len(polygon) < 3: + return False + # Convert polygon to the format expected by cv2.pointPolygonTest + poly_points: npt.NDArray[np.float32] = polygon.astype(np.float32).reshape((-1, 1, 2)) + distance: float = cv2.pointPolygonTest(poly_points, point, True) + return distance >= -merge_tolerance + + def _initialize_model(self) -> None: + """Initialize the model and tokenizer. + + This method: + 1. Loads the checkpoint to inspect the saved model configuration + 2. Dynamically adapts the configuration to match the checkpoint + 3. Creates a new tokenizer instance + 4. Initializes the encoder-decoder model with the correct architecture + 5. Loads the checkpoint weights + """ + # Load checkpoint first to inspect saved model configuration + latest_checkpoint: str = self._find_single_checkpoint() + checkpoint_path: str = os.path.join( + self.experiment_path, "logs", "checkpoints", latest_checkpoint + ) + checkpoint: Dict[str, Any] = torch.load(checkpoint_path, map_location=torch.device("cpu")) + + # Create a copy of CFG for model creation + model_cfg: Any = copy.deepcopy(CFG) + + # Dynamically determine configuration from the saved positional embeddings + decoder_pos_embed_key: str = "decoder.decoder_pos_embed" + encoder_pos_embed_key: str = "decoder.encoder_pos_embed" + + if decoder_pos_embed_key in checkpoint["state_dict"]: + saved_decoder_pos_embed_shape: Tuple[int, ...] = checkpoint["state_dict"][decoder_pos_embed_key].shape + checkpoint_max_len_minus_1: int = saved_decoder_pos_embed_shape[1] # Shape is [1, MAX_LEN-1, embed_dim] + checkpoint_max_len: int = checkpoint_max_len_minus_1 + 1 + checkpoint_n_vertices: int = (checkpoint_max_len - 2) // 2 # Reverse: MAX_LEN = (N_VERTICES*2) + 2 + + if checkpoint_n_vertices != CFG.N_VERTICES: + model_cfg.N_VERTICES = checkpoint_n_vertices + model_cfg.MAX_LEN = checkpoint_max_len + + if encoder_pos_embed_key in checkpoint["state_dict"]: + saved_encoder_pos_embed_shape: Tuple[int, ...] = checkpoint["state_dict"][encoder_pos_embed_key].shape + checkpoint_num_patches: int = saved_encoder_pos_embed_shape[1] # Shape is [1, num_patches, embed_dim] + + if checkpoint_num_patches != CFG.NUM_PATCHES: + model_cfg.NUM_PATCHES = checkpoint_num_patches + + # Create tokenizer with the adapted configuration + self.tokenizer = Tokenizer( + num_classes=1, + num_bins=model_cfg.NUM_BINS, + width=model_cfg.INPUT_WIDTH, + height=model_cfg.INPUT_HEIGHT, + max_len=model_cfg.MAX_LEN, + ) + # Use the original CFG for PAD_IDX to maintain compatibility + CFG.PAD_IDX = self.tokenizer.PAD_code + + # Create model with the adapted configuration + encoder: Encoder = Encoder(model_name=model_cfg.MODEL_NAME, pretrained=True, out_dim=256) + decoder: Decoder = Decoder( + cfg=model_cfg, # Use adapted configuration + vocab_size=self.tokenizer.vocab_size, + encoder_len=model_cfg.NUM_PATCHES, + dim=256, + num_heads=8, + num_layers=6, + ) + self.model = EncoderDecoder(cfg=model_cfg, encoder=encoder, decoder=decoder) + self.model.to(self.device) + self.model.eval() + + # Store the adapted configuration for inference + self.model_cfg = model_cfg + + # Load checkpoint weights - should now match perfectly + self.model.load_state_dict(checkpoint["state_dict"]) + + def _find_single_checkpoint(self) -> str: + """Find the single checkpoint file. 
Crashes if there is more than one checkpoint. + + Returns: + str: Filename of the single checkpoint + + Raises: + FileNotFoundError: If no checkpoint directory or files are found + RuntimeError: If more than one checkpoint file is found + """ + checkpoint_dir: str = os.path.join(self.experiment_path, "logs", "checkpoints") + if not os.path.exists(checkpoint_dir): + raise FileNotFoundError(f"Checkpoint directory not found: {checkpoint_dir}") + + checkpoint_files: List[str] = [ + f + for f in os.listdir(checkpoint_dir) + if f.startswith("epoch_") and f.endswith(".pth") + ] + if not checkpoint_files: + raise FileNotFoundError(f"No checkpoint files found in {checkpoint_dir}") + + if len(checkpoint_files) > 1: + raise RuntimeError( + f"Multiple checkpoint files found in {checkpoint_dir}: {checkpoint_files}. Expected exactly one checkpoint." + ) + + return checkpoint_files[0] + + def _process_tiles_batch( + self, tiles: List[npt.NDArray[np.uint8]], debug: bool = False + ) -> List[TileResult]: + """Process a single batch of tiles. + + Args: + tiles (list[npt.NDArray[np.uint8]]): List of tile images to process + + Returns: + list[TileResult]: List of results for each tile, where each result contains: + - polygons: List of polygon coordinates + """ + # Generate cache key and try to load from cache (only when debug=True) + if debug: + cache_key: str = self._generate_cache_key(tiles) + cached_results: Optional[List[TileResult]] = self._load_from_cache(cache_key) + if cached_results is not None: + log(f"Cache hit for batch of {len(tiles)} tiles") + return cached_results + else: + cache_key = None + + # Start timing for actual processing + batch_start_time: float = time.time() + log(f"Processing batch of {len(tiles)} tiles...") + valid_transforms: A.Compose = A.Compose( + [ + A.Resize(height=CFG.INPUT_HEIGHT, width=CFG.INPUT_WIDTH), + A.Normalize( + mean=[0.0, 0.0, 0.0], std=[1.0, 1.0, 1.0], max_pixel_value=255.0 + ), + ToTensorV2(), + ] + ) + + # Transform each tile individually and stack them + transformed_tiles: List[torch.Tensor] = [] + for tile in tiles: + transformed: Dict[str, torch.Tensor] = valid_transforms(image=tile) + transformed_tiles.append(transformed["image"]) + + # Stack the transformed tiles into a batch + batch_tensor: torch.Tensor = torch.stack(transformed_tiles).to(self.device) + + with torch.no_grad(): + # Use adapted configuration for generation + assert self.model_cfg is not None, "Model configuration not initialized" + adapted_generation_steps: int = (self.model_cfg.N_VERTICES * 2) + 1 + batch_preds: torch.Tensor + batch_confs: torch.Tensor + perm_preds: torch.Tensor + batch_preds, batch_confs, perm_preds = test_generate( + self.model, + batch_tensor, + self.tokenizer, + max_len=adapted_generation_steps, + top_k=0, + top_p=1, + ) + + vertex_coords: List[Optional[npt.NDArray[np.floating[Any]]]] + confs: List[Optional[npt.NDArray[np.floating[Any]]]] + vertex_coords, confs = postprocess(batch_preds, batch_confs, self.tokenizer) + + results: List[TileResult] = [] + for j in range(len(tiles)): + coord: torch.Tensor + if vertex_coords[j] is not None: + coord = torch.from_numpy(vertex_coords[j]) + else: + coord = torch.tensor([]) + + padd: torch.Tensor = torch.ones((self.model_cfg.N_VERTICES - len(coord), 2)).fill_(CFG.PAD_IDX) + coord = torch.cat([coord, padd], dim=0) + + batch_polygons: List[List[torch.Tensor]] = permutations_to_polygons( + perm_preds[j : j + 1], [coord], out="torch" + ) + + valid_polygons: List[PolygonArray] = [] + for poly in batch_polygons[0]: + poly_filtered: 
torch.Tensor = poly[poly[:, 0] != CFG.PAD_IDX] + if len(poly_filtered) > 0: + valid_polygons.append( + poly_filtered.cpu().numpy()[:, ::-1] + ) # Convert to [x,y] format + + result: TileResult = {"polygons": valid_polygons} + + results.append(result) + + # Save results to cache (only when debug=True) + if debug and cache_key is not None: + self._save_to_cache(cache_key, results) + + # Log processing time per tile + batch_time: float = time.time() - batch_start_time + log(f"Batch processing time: {batch_time/len(tiles):.3f}s per tile") + + return results + + def _create_tile_visualization( + self, + tiles: List[npt.NDArray[np.uint8]], + tile_results: List[TileResult], + positions: List[TilePosition], + ) -> None: + """Create a tile visualization showing each tile with its detected polygons and coordinate scales. + + Args: + tiles (List[npt.NDArray[np.uint8]]): List of tile images + tile_results (List[TileResult]): List of results for each tile + positions (List[TilePosition]): List of (x, y, x_end, y_end) tuples for each tile's position + """ + if not tiles: + return + + # Calculate grid dimensions based on actual spatial arrangement + # Extract unique x and y starting positions + x_positions: List[int] = sorted(set(pos[0] for pos in positions)) + y_positions: List[int] = sorted(set(pos[1] for pos in positions)) + + cols: int = len(x_positions) + rows: int = len(y_positions) + + # Create mapping from (x, y) position to (row, col) index + x_to_col: Dict[int, int] = {x: i for i, x in enumerate(x_positions)} + y_to_row: Dict[int, int] = {y: i for i, y in enumerate(y_positions)} + + # Create figure + fig: plt.Figure + axes: Union[plt.Axes, List[plt.Axes], List[List[plt.Axes]]] + fig, axes = plt.subplots(rows, cols, figsize=(cols * 4, rows * 4)) + + # Handle different subplot layouts + if rows == 1 and cols == 1: + axes = [[axes]] + elif rows == 1: + axes = [axes] + elif cols == 1: + axes = [[ax] for ax in axes] + + # Initialize all subplots as empty + for i in range(rows): + for j in range(cols): + axes[i][j].axis('off') + + # Place each tile in the correct position + for i, (tile, tile_result, pos) in enumerate(zip(tiles, tile_results, positions)): + x, y, x_end, y_end = pos + + # Get the grid position for this tile + row: int = y_to_row[y] + col: int = x_to_col[x] + + ax: plt.Axes = axes[row][col] + + # Tiles are already in RGB format, no conversion needed for matplotlib + ax.imshow(tile) + ax.set_title(f'Tile {i}') + + # Enable axis and set up coordinate scales + ax.axis('on') + + # Get tile dimensions + tile_height: int + tile_width: int + tile_height, tile_width = tile.shape[:2] + + # Set up x-axis ticks and labels (global coordinates) + x_range: int = x_end - x + # Generate tick positions ensuring min and max are included + num_x_ticks: int = 8 + x_tick_positions: List[int] + if tile_width > 1: + x_tick_positions = [0] # Always include minimum + if num_x_ticks > 2: + # Add intermediate positions + step: float = tile_width / (num_x_ticks - 1) + for i in range(1, num_x_ticks - 1): + x_tick_positions.append(int(i * step)) + x_tick_positions.append(tile_width - 1) # Always include maximum + else: + x_tick_positions = [0] + + # Calculate corresponding global coordinates + x_global_coords: List[int] = [x + pos * x_range // tile_width for pos in x_tick_positions] + # Ensure the last coordinate is exactly x_end + if len(x_global_coords) > 1: + x_global_coords[-1] = x_end + + ax.set_xticks(x_tick_positions) + ax.set_xticklabels([str(coord) for coord in x_global_coords], fontsize=8) + + # Set up 
y-axis ticks and labels (global coordinates) + y_range: int = y_end - y + # Generate tick positions ensuring min and max are included + num_y_ticks: int = 8 + y_tick_positions: List[int] + if tile_height > 1: + y_tick_positions = [0] # Always include minimum + if num_y_ticks > 2: + # Add intermediate positions + step = tile_height / (num_y_ticks - 1) + for i in range(1, num_y_ticks - 1): + y_tick_positions.append(int(i * step)) + y_tick_positions.append(tile_height - 1) # Always include maximum + else: + y_tick_positions = [0] + + # Calculate corresponding global coordinates + y_global_coords: List[int] = [y + pos * y_range // tile_height for pos in y_tick_positions] + # Ensure the last coordinate is exactly y_end + if len(y_global_coords) > 1: + y_global_coords[-1] = y_end + + ax.set_yticks(y_tick_positions) + ax.set_yticklabels([str(coord) for coord in y_global_coords], fontsize=8) + + # Set axis limits to match tile dimensions + ax.set_xlim(0, tile_width) + ax.set_ylim(tile_height, 0) # Invert y-axis for image coordinates + + # Style the grid and ticks + ax.grid(True, alpha=0.3, linewidth=0.5) + ax.tick_params(axis='both', which='major', labelsize=8, length=3) + + # Draw polygons on this tile + polygons: List[PolygonArray] = tile_result["polygons"] + polygon_valid: List[bool] = tile_result["polygon_valid"] + + for poly_idx, (poly, is_valid) in enumerate(zip(polygons, polygon_valid)): + if len(poly) > 2: + # Use green for valid polygons, red for invalid ones + color: str = 'g' if is_valid else 'r' + vertex_color: str = 'red' if is_valid else 'darkred' + + # Close the polygon for visualization + poly_closed: PolygonArray = np.vstack([poly, poly[0]]) + ax.plot(poly_closed[:, 0], poly_closed[:, 1], f'{color}-', linewidth=2) + + # Draw vertices + ax.scatter(poly[:, 0], poly[:, 1], c=vertex_color, s=20, zorder=5) + + # Calculate centroid and render polygon index + centroid_x: float = np.mean(poly[:, 0]) + centroid_y: float = np.mean(poly[:, 1]) + + # Use white text with black outline for visibility + text_color: str = 'white' + outline_color: str = 'black' + + # Add text with outline for better visibility + ax.text(centroid_x, centroid_y, str(poly_idx), + fontsize=12, fontweight='bold', color=text_color, + ha='center', va='center', zorder=6, + bbox=dict(boxstyle='round,pad=0.3', facecolor=outline_color, alpha=0.7)) + + # Leave space at the bottom for the model name + plt.tight_layout(rect=[0, 0.05, 1, 1]) + + # Add model name at the bottom of the visualization + plt.figtext(0.5, 0.01, f'Model: {self.model_display_name}', + ha='center', va='bottom') + + plt.savefig('tile-visualization.png', dpi=150, bbox_inches='tight') + plt.close() + log(f"Saved tile visualization to tile-visualization.png") + + def _validate_all_polygons( + self, + tile_results: List[TileResult], + positions: List[TilePosition], + image_height: int, + image_width: int, + merge_tolerance: float + ) -> List[TileResult]: + """Validate all polygons in the tile results and add validation attributes. + + This method implements a heuristic to validate polygons by checking if their boundary edges + have points that are contained in polygons from other tiles. 
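+        The intuition: a building clipped by a tile edge yields a polygon edge
+        lying on that tile boundary. Because tiles overlap, the same building
+        should also be detected by a neighbouring tile, so sample points taken
+        along the boundary edge must fall inside one of that tile's polygons;
+        if none does, the clipped polygon is marked invalid.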
+ + Args: + tile_results (List[TileResult]): List of tile results containing polygons + positions (List[TilePosition]): List of (x, y, x_end, y_end) tuples for each tile's position + image_height (int): Height of the original image + image_width (int): Width of the original image + merge_tolerance (float): Tolerance for point-in-polygon tests during validation (in pixels) + + Returns: + List[TileResult]: Updated tile results with validation attributes + """ + # Initialize polygon_valid list for each tile + for tile_result in tile_results: + tile_result["polygon_valid"] = [True] * len(tile_result["polygons"]) + + # Remove overlapping polygons within each tile (before edge validation) + + for tile_result in tile_results: + polygons = tile_result["polygons"] + polygon_valid = tile_result["polygon_valid"] + + if len(polygons) <= 1: + continue # Skip tiles with 0 or 1 polygon + + # Keep iterating until no overlaps are found + while True: + # Get currently valid polygons with their indices + valid_polygons = [(i, poly) for i, poly in enumerate(polygons) if polygon_valid[i]] + + if len(valid_polygons) <= 1: + break # No overlaps possible with 0 or 1 valid polygons + + # Find all overlapping pairs + overlapping_pairs = [] + for i in range(len(valid_polygons)): + for j in range(i + 1, len(valid_polygons)): + idx1, poly1 = valid_polygons[i] + idx2, poly2 = valid_polygons[j] + + if self._check_polygon_overlap(poly1, poly2): + overlapping_pairs.append((idx1, idx2)) + + if not overlapping_pairs: + break # No overlaps found + + # Find all polygons involved in overlaps + overlapping_indices = set() + for idx1, idx2 in overlapping_pairs: + overlapping_indices.add(idx1) + overlapping_indices.add(idx2) + + # Calculate areas for overlapping polygons + polygon_areas = [] + for idx in overlapping_indices: + area = self._calculate_polygon_area(polygons[idx]) + polygon_areas.append((idx, area)) + + # Find the largest polygon + largest_idx, largest_area = max(polygon_areas, key=lambda x: x[1]) + + # Mark the largest polygon as invalid + polygon_valid[largest_idx] = False + + # Continue to next iteration to check for remaining overlaps + + # Now perform edge validation on remaining valid polygons + + # Process each tile + for tile_result, tile_pos in zip(tile_results, positions): + x, y, x_end, y_end = tile_pos + tile_width = x_end - x + tile_height = y_end - y + tile_bounds = (0, 0, tile_width, tile_height) # tile local coordinates + + polygons = tile_result["polygons"] + polygon_valid = tile_result["polygon_valid"] + + # Check each polygon in this tile (only those still valid after overlap removal) + for poly_idx, polygon in enumerate(polygons): + # Skip polygons already rejected for overlap + if not polygon_valid[poly_idx]: + continue + + if len(polygon) < 3: + polygon_valid[poly_idx] = False + continue + + # Find edges that are near tile boundaries + boundary_edges = [] + for i in range(len(polygon) - 1): + p1 = polygon[i] + p2 = polygon[i + 1] + + if self._is_edge_near_tile_boundary(p1, p2, tile_bounds): + boundary_edges.append((p1, p2)) + + # If no boundary edges, polygon is valid (not on tile boundary) + if not boundary_edges: + continue + + # Check sample points along boundary edges + polygon_is_valid = True + + for p1, p2 in boundary_edges: + sample_points = self._generate_edge_sample_points(p1, p2) + + # Determine if this edge is horizontal or vertical + is_horizontal_edge = abs(p1[1] - p2[1]) <= 2 # Edge is roughly horizontal + is_vertical_edge = abs(p1[0] - p2[0]) <= 2 # Edge is roughly vertical + + # 
Convert sample points to global image coordinates + global_sample_points = [(px + x, py + y) for px, py in sample_points] + + # Check if each sample point is contained in any polygon from other tiles + for global_point in global_sample_points: + point_found_in_other_polygon = False + + # Check all other tiles + for other_tile_result, other_tile_pos in zip(tile_results, positions): + if other_tile_result is tile_result: + continue + + other_x, other_y, other_x_end, other_y_end = other_tile_pos + + # Skip tiles in same row for horizontal edges + if is_horizontal_edge and other_y == y: + continue + + # Skip tiles in same column for vertical edges + if is_vertical_edge and other_x == x: + continue + + # Convert global point to other tile's local coordinates + local_point = (global_point[0] - other_x, global_point[1] - other_y) + + # Check if point is inside any valid polygon in this other tile + for other_poly_idx, other_polygon in enumerate(other_tile_result["polygons"]): + # Only consider polygons that are still valid (not rejected for overlap) + if not other_tile_result["polygon_valid"][other_poly_idx]: + continue + + if self._point_in_polygon(local_point, other_polygon, merge_tolerance): + point_found_in_other_polygon = True + break + + if point_found_in_other_polygon: + break + + # If any sample point is not found in other polygons, mark as invalid + if not point_found_in_other_polygon: + polygon_is_valid = False + break + + if not polygon_is_valid: + break + + # Update polygon validity + polygon_valid[poly_idx] = polygon_is_valid + + return tile_results + + def _merge_polygons( + self, + tile_results: List[TileResult], + positions: List[TilePosition], + image_height: int, + image_width: int, + debug: bool = False, + ) -> List[PolygonArray]: + """Merge polygon predictions from multiple tiles using a bitmap approach. + + This method creates a bitmap where pixels inside any polygon are set to True, + then vectorizes the bitmap back to polygons. This eliminates geometric artifacts + from traditional polygon union operations. 
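+        Rasterising at ``scale_factor`` times the image resolution preserves
+        sub-pixel vertex positions; a morphological close then bridges hairline
+        gaps between polygons from neighbouring tiles before contours are
+        re-extracted and regularised.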
+
+        Args:
+            tile_results (list[TileResult]): List of dictionaries containing 'polygons' for each tile
+            positions (list[TilePosition]): List of (x, y, x_end, y_end) tuples for each tile's position
+            image_height (int): Height of the original image
+            image_width (int): Width of the original image
+            debug (bool): Whether to save debug images
+
+        Returns:
+            list[PolygonArray]: List of merged polygons in original image coordinates
+        """
+        # Scale factor for subpixel precision
+        scale_factor: int = 16
+
+        # Create the bitmap at scale_factor times the image resolution for subpixel precision
+        bitmap: npt.NDArray[np.uint8] = np.zeros((image_height * scale_factor, image_width * scale_factor), dtype=np.uint8)
+
+        # Process all valid polygons and fill them immediately
+        for tile_result, (x, y, x_end, y_end) in zip(tile_results, positions):
+            tile_polygons: List[PolygonArray] = tile_result["polygons"]
+            polygon_valid: List[bool] = tile_result["polygon_valid"]
+
+            # Pre-allocate translation vector for this tile
+            translation_vector: npt.NDArray[np.floating[Any]] = np.array([x, y])
+
+            for poly, is_valid in zip(tile_polygons, polygon_valid):
+                # Skip invalid polygons
+                if not is_valid:
+                    continue
+
+                # Transform polygon from tile coordinates to image coordinates
+                transformed_poly: PolygonArray = poly + translation_vector
+
+                # Scale up coordinates for high-resolution bitmap
+                scaled_poly: PolygonArray = transformed_poly * scale_factor
+
+                # Ensure coordinates are within scaled bitmap bounds
+                scaled_poly[:, 0] = np.clip(scaled_poly[:, 0], 0, image_width * scale_factor - 1)
+                scaled_poly[:, 1] = np.clip(scaled_poly[:, 1], 0, image_height * scale_factor - 1)
+
+                # Convert to integer coordinates for rasterization
+                poly_coords: npt.NDArray[np.int32] = scaled_poly.astype(np.int32)
+
+                # Fill polygon immediately to avoid winding order issues
+                cv2.fillPoly(bitmap, [poly_coords], 255)
+
+        kernel_size: int = 32
+        kernel: npt.NDArray[np.uint8] = cv2.getStructuringElement(cv2.MORPH_ELLIPSE, (kernel_size, kernel_size))
+        bitmap = cv2.morphologyEx(bitmap, cv2.MORPH_CLOSE, kernel)
+
+        # Save bitmap for debugging (optional)
+        if debug:
+            cv2.imwrite('bitmap-visualization.png', bitmap)
+            log("Saved bitmap visualization to bitmap-visualization.png")
+
+        # Find contours in the bitmap
+        contours: List[npt.NDArray[np.int32]]
+        _: Any  # hierarchy not used
+        contours, _ = cv2.findContours(bitmap, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
+
+        # Collect all valid contours into shapely polygons
+        shapely_polygons: List[Polygon] = []
+
+        for contour in contours:
+            # Skip very small contours (area is scaled by scale_factor^2)
+            area: float = cv2.contourArea(contour)
+            if area < CFG.MIN_POLYGON_AREA * (scale_factor ** 2):
+                continue
+
+            # Convert contour to Shapely Polygon
+            contour_points: npt.NDArray[np.float64] = contour.reshape(-1, 2).astype(np.float64)
+            shapely_polygon: Polygon = Polygon(contour_points)
+
+            shapely_polygon = make_valid(shapely_polygon)
+
+            # Handle case where make_valid returns a MultiPolygon
+            if shapely_polygon.is_valid:
+                if shapely_polygon.geom_type == 'MultiPolygon':
+                    # Extract individual polygons from MultiPolygon
+                    for individual_poly in shapely_polygon.geoms:
+                        simple_poly: Polygon = Polygon(individual_poly.exterior.coords)
+                        if simple_poly.is_valid and simple_poly.area > 0:
+                            shapely_polygons.append(simple_poly)
+                elif shapely_polygon.geom_type == 'Polygon':
+                    simple_poly = Polygon(shapely_polygon.exterior.coords)
+                    if simple_poly.is_valid and simple_poly.area > 0:
+                        shapely_polygons.append(simple_poly)
+            else:
+                
log(f"Skipping invalid polygon") + + merged_polygons: List[PolygonArray] = [] + + # Create single GeoDataFrame with all polygons and regularize them all at once + if shapely_polygons: + log(f"Regularizing {len(shapely_polygons)} polygons") + gdf: gpd.GeoDataFrame = gpd.GeoDataFrame({'geometry': shapely_polygons}) + regularized_gdf: gpd.GeoDataFrame = regularize_geodataframe(gdf, simplify_tolerance=20, parallel_threshold=100) + + # Process the regularized polygons + for regularized_polygon in regularized_gdf.geometry: + # Extract individual polygons (either from MultiPolygon or single Polygon) + individual_polygons = [] + if regularized_polygon.geom_type == 'MultiPolygon': + individual_polygons = list(regularized_polygon.geoms) + elif regularized_polygon.geom_type == 'Polygon': + individual_polygons = [regularized_polygon] + + # Process each individual polygon with single code path + for individual_polygon in individual_polygons: + if individual_polygon.is_valid and individual_polygon.area > 0: + # Convert back to numpy array for OpenCV format + coords: npt.NDArray[np.floating[Any]] = np.array(individual_polygon.exterior.coords[:-1]) # Remove duplicate last point + + # Convert from OpenCV format to our polygon format + if len(coords) >= 3: # Valid polygon needs at least 3 points + # Scale down coordinates back to original image coordinate system + polygon_coords: PolygonArray = coords.astype(np.float32) / scale_factor + merged_polygons.append(polygon_coords) + + log(f"Polygons extracted: {len(merged_polygons)}") + return merged_polygons + + def infer(self, image_data: bytes, debug: bool = False, merge_tolerance: Optional[float] = None, tile_overlap_ratio: Optional[float] = None) -> List[List[List[float]]]: + """Infer polygons in an image. + + Args: + image_data (bytes): Raw image data + debug (bool): Whether to save debug images (tile visualization and bitmap) + merge_tolerance (Optional[float]): Tolerance for point-in-polygon tests during validation (in pixels, allows points to be slightly outside). If None, uses CFG.MERGE_TOLERANCE + tile_overlap_ratio (Optional[float]): Overlap ratio between tiles (0.0 = no overlap, 1.0 = complete overlap). If None, uses CFG.TILE_OVERLAP_RATIO + + Returns: + list[list[list[float]]]: List of polygons where each polygon is a list of [x,y] coordinates. + Each coordinate is rounded to 2 decimal places. 
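+        Illustrative return value for a single triangle, in image pixel
+        coordinates: ``[[[10.0, 12.5], [42.25, 12.5], [42.25, 30.0]]]``.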
+
+        Raises:
+            ValueError: If the image data is invalid, empty, or cannot be decoded
+            RuntimeError: If there are issues with model prediction or polygon processing
+        """
+        if not image_data:
+            raise ValueError("Empty image data provided")
+
+        seed_everything(42)
+
+        # Decode image
+        nparr: npt.NDArray[np.uint8] = np.frombuffer(image_data, np.uint8)
+        image: Optional[npt.NDArray[np.uint8]] = cv2.imdecode(nparr, cv2.IMREAD_COLOR)
+        if image is None:
+            raise ValueError("Failed to decode image data")
+
+        if image.size == 0:
+            raise ValueError("Decoded image is empty")
+
+        # Convert to RGB
+        image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+
+        # Split image into tiles
+        height: int
+        width: int
+        height, width = image.shape[:2]
+        if height == 0 or width == 0:
+            raise ValueError("Invalid image dimensions")
+
+        # Use provided parameters or fall back to config defaults
+        effective_merge_tolerance: float = merge_tolerance if merge_tolerance is not None else CFG.MERGE_TOLERANCE
+        effective_tile_overlap_ratio: float = tile_overlap_ratio if tile_overlap_ratio is not None else CFG.TILE_OVERLAP_RATIO
+
+        overlap_ratio: float = effective_tile_overlap_ratio
+
+        bboxes: List[TilePosition] = calculate_slice_bboxes(
+            image_height=height,
+            image_width=width,
+            slice_height=CFG.TILE_SIZE,
+            slice_width=CFG.TILE_SIZE,
+            overlap_height_ratio=overlap_ratio,
+            overlap_width_ratio=overlap_ratio,
+        )
+
+        tiles: List[npt.NDArray[np.uint8]] = []
+
+        for bbox in bboxes:
+            x1, y1, x2, y2 = bbox
+            tile: npt.NDArray[np.uint8] = image[y1:y2, x1:x2]
+            if tile.size == 0:
+                continue
+            tiles.append(tile)
+
+        log(f"Total number of tiles to process: {len(tiles)}")
+
+        # Process tiles in batches
+        all_results: List[TileResult] = []
+
+        for i in range(0, len(tiles), CFG.PREDICTION_BATCH_SIZE):
+            batch_tiles: List[npt.NDArray[np.uint8]] = tiles[i : i + CFG.PREDICTION_BATCH_SIZE]
+            batch_results: List[TileResult] = self._process_tiles_batch(batch_tiles, debug)
+            all_results.extend(batch_results)
+
+            tiles_processed_so_far: int = i + len(batch_tiles)
+            total_tiles: int = len(tiles)
+            log(f"Processed batch of {len(batch_tiles)} tiles ({tiles_processed_so_far}/{total_tiles})")
+
+        # Validate all polygons and add validation attributes
+        all_results = self._validate_all_polygons(all_results, bboxes, height, width, effective_merge_tolerance)
+
+        log(f"Validated {sum(sum(tile_result['polygon_valid']) for tile_result in all_results)} out of {sum(len(tile_result['polygons']) for tile_result in all_results)} polygons")
+
+        # Create tile visualization
+        if debug:
+            self._create_tile_visualization(tiles, all_results, bboxes)
+
+        merged_polygons: List[PolygonArray] = self._merge_polygons(all_results, bboxes, height, width, debug)
+
+        # Convert to list format
+        polygons_list: List[List[List[float]]] = [poly.tolist() for poly in merged_polygons]
+        # Round coordinates to two decimal places
+        polygons_list = [
+            [[round(x, 2), round(y, 2)] for x, y in polygon]
+            for polygon in polygons_list
+        ]
+
+        return polygons_list
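+
+
+# Standalone sketch of the rasterize-and-merge idea used in _merge_polygons
+# (illustrative only, not part of the pipeline): two overlapping squares are
+# filled into one bitmap, and cv2.findContours returns them as a single
+# merged contour.
+#
+#     import cv2
+#     import numpy as np
+#
+#     canvas = np.zeros((100, 100), dtype=np.uint8)
+#     a = np.array([[10, 10], [60, 10], [60, 60], [10, 60]], dtype=np.int32)
+#     b = np.array([[40, 40], [90, 40], [90, 90], [40, 90]], dtype=np.int32)
+#     cv2.fillPoly(canvas, [a, b], 255)
+#     contours, _ = cv2.findContours(canvas, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
+#     assert len(contours) == 1  # the overlapping squares merged into one blob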
diff --git a/predict_mass_roads_test_set.py b/predict_mass_roads_test_set.py
index 10b21c5..37ee5cc 100644
--- a/predict_mass_roads_test_set.py
+++ b/predict_mass_roads_test_set.py
@@ -23,55 +23,11 @@
     test_generate,
     postprocess,
     permutations_to_polygons,
+    calculate_slice_bboxes,
 )
 
 import time
 
-# adapted from https://github.com/obss/sahi/blob/e798c80d6e09079ae07a672c89732dd602fe9001/sahi/slicing.py#L30, MIT License
-def calculate_slice_bboxes(
-    image_height: int,
-    image_width: int,
-    slice_height: int = 512,
-    slice_width: int = 512,
-    overlap_height_ratio: float = 0.2,
-    overlap_width_ratio: float = 0.2,
-) -> list[list[int]]:
-    """
-    Given the height and width of an image, calculates how to divide the image into
-    overlapping slices according to the height and width provided. These slices are returned
-    as bounding boxes in xyxy format.
-    :param image_height: Height of the original image.
-    :param image_width: Width of the original image.
-    :param slice_height: Height of each slice
-    :param slice_width: Width of each slice
-    :param overlap_height_ratio: Fractional overlap in height of each slice (e.g. an overlap of 0.2 for a slice of size 100 yields an overlap of 20 pixels)
-    :param overlap_width_ratio: Fractional overlap in width of each slice (e.g. an overlap of 0.2 for a slice of size 100 yields an overlap of 20 pixels)
-    :return: a list of bounding boxes in xyxy format
-    """
-
-    slice_bboxes = []
-    y_max = y_min = 0
-    y_overlap = int(overlap_height_ratio * slice_height)
-    x_overlap = int(overlap_width_ratio * slice_width)
-    while y_max < image_height:
-        x_min = x_max = 0
-        y_max = y_min + slice_height
-        while x_max < image_width:
-            x_max = x_min + slice_width
-            if y_max > image_height or x_max > image_width:
-                xmax = min(image_width, x_max)
-                ymax = min(image_height, y_max)
-                xmin = max(0, xmax - slice_width)
-                ymin = max(0, ymax - slice_height)
-                slice_bboxes.append([xmin, ymin, xmax, ymax])
-            else:
-                slice_bboxes.append([x_min, y_min, x_max, y_max])
-            x_min = x_max - x_overlap
-        y_min = y_max - y_overlap
-
-    return slice_bboxes
-
-
 def get_rectangle_params_from_pascal_bbox(bbox):
 
     xmin_top_left, ymin_top_left, xmax_bottom_right, ymax_bottom_right = bbox
diff --git a/start_api.sh b/start_api.sh
new file mode 100755
index 0000000..f548f99
--- /dev/null
+++ b/start_api.sh
@@ -0,0 +1,12 @@
+#!/bin/bash
+
+# Exit on error
+set -e
+
+# Activate conda environment
+source "$(conda info --base)/etc/profile.d/conda.sh"
+conda activate pix2poly
+
+# Start the API server
+echo "Starting API server"
+uvicorn api:app --host 0.0.0.0 --port 8080 --workers 1 --backlog 10
diff --git a/utils.py b/utils.py
index 33eab91..49f6e2f 100644
--- a/utils.py
+++ b/utils.py
@@ -10,6 +10,9 @@
 from torchmetrics.functional.classification import binary_jaccard_index, binary_accuracy
 
 from config import CFG
+import sys
+from datetime import datetime
+
 
 def seed_everything(seed=1234):
     random.seed(seed)
@@ -57,7 +60,6 @@ def create_mask(tgt, pad_idx):
     return tgt_mask, tgt_padding_mask
 
 
-
 class AverageMeter:
     def __init__(self, name="Metric"):
         self.name = name
@@ -356,3 +358,57 @@ def save_single_predictions_as_images(
     torchvision.utils.save_image(y_perm[:, None, :, :]*255, f"{folder}/gt_perm_matrix_{idx}.png")
 
     return metrics_dict
+
+
+def log(message: str, level: str = "INFO") -> None:
+    """Simple logging function that outputs to stderr."""
+    timestamp = datetime.now().isoformat()
+    print(f"[{timestamp}] [{level}] {message}", file=sys.stderr, flush=True)
+
+
+# adapted from https://github.com/obss/sahi/blob/e798c80d6e09079ae07a672c89732dd602fe9001/sahi/slicing.py#L30, MIT License
+def calculate_slice_bboxes(
+    image_height: int,
+    image_width: int,
+    slice_height: int = 512,
+    slice_width: int = 512,
+    overlap_height_ratio: float = 0.2,
+    overlap_width_ratio: float = 0.2,
+) -> list[list[int]]:
+    """
+    Given the height and width of an image, calculates how to divide the image into
+    overlapping slices according to the height and width provided. These slices are returned
+    as bounding boxes in xyxy format.
+
+    Args:
+        image_height: Height of the original image.
+        image_width: Width of the original image.
+        slice_height: Height of each slice
+        slice_width: Width of each slice
+        overlap_height_ratio: Fractional overlap in height of each slice (e.g. an overlap of 0.2 for a slice of size 100 yields an overlap of 20 pixels)
+        overlap_width_ratio: Fractional overlap in width of each slice (e.g. an overlap of 0.2 for a slice of size 100 yields an overlap of 20 pixels)
+
+    Returns:
+        A list of bounding boxes in xyxy format
+    """
+    slice_bboxes = []
+    y_max = y_min = 0
+    y_overlap = int(overlap_height_ratio * slice_height)
+    x_overlap = int(overlap_width_ratio * slice_width)
+
+    while y_max < image_height:
+        x_min = x_max = 0
+        y_max = y_min + slice_height
+        while x_max < image_width:
+            x_max = x_min + slice_width
+            if y_max > image_height or x_max > image_width:
+                # Slice would spill past the image edge: clamp it to the image
+                # bounds and shift its origin back so it keeps the full slice size
+                xmax = min(image_width, x_max)
+                ymax = min(image_height, y_max)
+                xmin = max(0, xmax - slice_width)
+                ymin = max(0, ymax - slice_height)
+                slice_bboxes.append([xmin, ymin, xmax, ymax])
+            else:
+                slice_bboxes.append([x_min, y_min, x_max, y_max])
+            x_min = x_max - x_overlap
+        y_min = y_max - y_overlap
+
+    return slice_bboxes
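+
+
+# Worked example (traced from the implementation above): slicing a 1000x800
+# image with 512x512 tiles and 0.2 overlap (overlap = int(0.2 * 512) = 102 px)
+# yields a 3x2 grid of boxes, with the last row and column shifted back inside
+# the image bounds:
+#
+#     calculate_slice_bboxes(800, 1000, 512, 512, 0.2, 0.2)
+#     # -> [[0, 0, 512, 512], [410, 0, 922, 512], [488, 0, 1000, 512],
+#     #     [0, 288, 512, 800], [410, 288, 922, 800], [488, 288, 1000, 800]]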