Vector Encoding 

Land-Use Analysis

These code snippets illustrate how to convert coordinate data from plain text files into polygonal boundaries for administrative districts, then calculate the proportion of agricultural land cover within each polygon for two years. By leveraging Shapely and GeoPandas, it demonstrates straightforward ways to generate, analyze, and report vector and raster data metrics (e.g., number of agricultural pixels) in a cohesive workflow. 

import pandas as pd

import geopandas as gpd

from shapely.geometry import Polygon

import rasterio.features

import numpy as np


# Part I: Read District Files and Create Polygons

    # Read coordinates from text files and create polygons

    # Store district number, polygon geometry, and vertex count


# Read the district files, skipping the first row

df1 = pd.read_csv("district01.txt", delimiter="\t", names=["X", "Y"], skiprows=1)

df2 = pd.read_csv("district05.txt", delimiter="\t", names=["X", "Y"], skiprows=1)

df3 = pd.read_csv("district06.txt", delimiter="\t", names=["X", "Y"], skiprows=1)


# Create polygons from the extracted coordinates

polygon1 = Polygon(zip(df1["X"], df1["Y"]))

polygon2 = Polygon(zip(df2["X"], df2["Y"]))

polygon3 = Polygon(zip(df3["X"], df3["Y"]))


# Create a GeoDataFrame with 'num_coords' and 'district'

gdf = gpd.GeoDataFrame(

    {

        "district": ["01", "05", "06"],  # District identifiers

        "num_coords": [len(df1), len(df2), len(df3)],  # Number of coordinates per polygon

        "geometry": [polygon1, polygon2, polygon3# Polygon geometries

    },

    crs="EPSG:4326"  # Assign WGS 84 coordinate reference system

)


# Part II: Load Raster Data and Compute Agricultural Land Percentage

    # Load GLOBCOVER rasters for 2004 and 2009

    # Calculate agricultural land coverage within each district


# Define raster file paths

raster_2004 = "GLOBCOVER_2004_lab2.tif"

raster_2009 = "GLOBCOVER_2009_lab2.tif"


# Function to count total and agricultural pixels in each district

def count_pixels(raster_path, gdf):

    with rasterio.open(raster_path) as src# Open raster file

        affine = src.transform

        array = src.read(1# Read first band (land cover classification)


        total_pixel_counts = []

        agri_pixel_counts = []

       

        for _, row in gdf.iterrows():

            # Create a mask for the polygon

            mask = rasterio.features.geometry_mask(

                [row["geometry"]], transform=affine, out_shape=src.shape, invert=True

            )

           

            # Count total pixels inside the polygon

            total_pixels = np.count_nonzero(mask)

           

            # Count agricultural pixels (assuming agriculture is coded as "1")

            agri_pixels = np.count_nonzero((array == 1) & mask)

           

            total_pixel_counts.append(total_pixels)

            agri_pixel_counts.append(agri_pixels)

   

    return total_pixel_counts, agri_pixel_counts


# Compute total and agricultural pixels for 2004

gdf["total_pixels_2004"], gdf["agri_pixels_2004"] = count_pixels(raster_2004, gdf)


# Compute total and agricultural pixels for 2009

gdf["total_pixels_2009"], gdf["agri_pixels_2009"] = count_pixels(raster_2009, gdf)


# Calculate agricultural land percentage for each district

gdf["agri_percent_2004"] = (gdf["agri_pixels_2004"] / gdf["total_pixels_2004"]) * 100

gdf["agri_percent_2009"] = (gdf["agri_pixels_2009"] / gdf["total_pixels_2009"]) * 100


# Print pixel counts and agricultural percentages


# print("\nPixel Totals and Agricultural Pixel Totals by District\n")

# for _, row in gdf.iterrows():

#     print(f"District {row['district']}:")

#     print(f"  Total Pixels: \n    {row['total_pixels_2004']:.0f} in 2004 \n    {row['total_pixels_2009']:.0f} in 2009")

#     print(f"  Agricultural Pixels: \n    {row['agri_pixels_2004']:.0f} in 2004 \n    {row['agri_pixels_2009']:.0f} in 2009\n")


print("\nFinal Agricultural Land Percentages by District\n")

for _, row in gdf.iterrows():

    print(f"District {row['district']}:")

    print(f{row['agri_percent_2004']:.2f}% in 2004")

    print(f{row['agri_percent_2009']:.2f}% in 2009\n")