cprima · January 2, 2025 11:50
diff --git a/README.md b/README.md
diff --git a/generate_roadbook_from_gpx-and-csv.py b/generate_roadbook_from_gpx-and-csv.py
 import gpxpy
 import pandas as pd
 from geopy.distance import geodesic
 from rdp import rdp
 from tqdm import tqdm
 import logging

 # Emit timestamped, level-tagged messages at INFO and above so that
 # progress and results are visible while the script runs.
 logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')

 def simplify_gpx(gpx_points, epsilon=0.001):
    """
    Reduce a GPX track to fewer points with the Ramer-Douglas-Peucker algorithm.

    The simplification itself is delegated to ``rdp``; this wrapper only adds
    progress logging around that call.

    Args:
        gpx_points (list): (latitude, longitude) pairs taken from the GPX track.
        epsilon (float): Simplification tolerance handed to ``rdp``; smaller
            values keep more of the original points.

    Returns:
        The simplified points, exactly as returned by ``rdp``.
    """
    logging.info(f"Starting GPX simplification with epsilon={epsilon}.")
    reduced_track = rdp(gpx_points, epsilon=epsilon)
    kept, total = len(reduced_track), len(gpx_points)
    logging.info(f"GPX simplification complete: {kept} points (from {total}).")
    return reduced_track

 def find_nearest_gpx_index(lat, lon, gpx_points):
    """
    Find the index of the GPX point nearest to a given location.

    Distances are geodesic distances computed with geopy. When several
    points are equally close, the index of the first one is returned.

    Args:
        lat (float): Latitude of the location.
        lon (float): Longitude of the location.
        gpx_points (list): (latitude, longitude) pairs from the GPX track.

    Returns:
        int: Index of the nearest GPX point.

    Raises:
        ValueError: If gpx_points is empty.
    """
    location = (lat, lon)
    # Scan (index, point) pairs in a single pass instead of building a full
    # list of distances and searching it again; default=None flags an empty
    # track without raising the opaque "min() arg is an empty sequence".
    nearest = min(
        enumerate(gpx_points),
        key=lambda indexed_point: geodesic(location, indexed_point[1]).meters,
        default=None,
    )
    if nearest is None:
        raise ValueError("Cannot find the nearest GPX point: gpx_points is empty.")
    return nearest[0]

 def process_csv_with_smart_sorting(csv_file, gpx_points, output_file):
    """
    Sort the places of a CSV file along a GPX track and save the result.

    Each place is assigned the index of its nearest point on the simplified
    track; rows are then ordered by that index and written to ``output_file``
    together with the new ``gpx_index`` column. Places that share the same
    nearest track point keep their original relative order.

    Args:
        csv_file (str): Path to the input CSV file containing places.
        gpx_points (list): (latitude, longitude) pairs from the GPX track.
        output_file (str): Path to save the sorted output CSV file.

    Raises:
        ValueError: If the CSV file lacks the 'Y' or 'X' column.
    """
    logging.info(f"Reading CSV file: {csv_file}")
    df = pd.read_csv(csv_file)

    # Ensure the required columns are present
    if 'Y' not in df.columns or 'X' not in df.columns:
        logging.error("CSV file must contain 'Y' (latitude) and 'X' (longitude) columns.")
        raise ValueError("Missing required columns in CSV file.")

    logging.info(f"CSV file loaded with {len(df)} rows.")

    # Simplify GPX points for faster processing
    gpx_points = simplify_gpx(gpx_points)

    # Find the nearest GPX point for each place in the CSV. Iterating the two
    # coordinate columns directly avoids building a Series per row, which is
    # what iterrows() does.
    logging.info("Finding nearest GPX point for each place...")
    coordinates = zip(df['Y'], df['X'])
    df['gpx_index'] = [
        find_nearest_gpx_index(lat, lon, gpx_points)
        for lat, lon in tqdm(coordinates, total=len(df), desc="Processing places")
    ]
    logging.info("Nearest GPX point calculation complete.")

    # Sort by GPX index. The default quicksort is not stable, so a stable
    # algorithm is requested to keep tied places in their input order.
    logging.info("Sorting places based on GPX track order...")
    df = df.sort_values(by='gpx_index', kind='mergesort').reset_index(drop=True)

    # Save the sorted DataFrame
    logging.info(f"Saving sorted roadbook to: {output_file}")
    df.to_csv(output_file, index=False)
    logging.info("Roadbook saved successfully.")

 # Example Usage
 # Guarded so the example pipeline only runs when this file is executed as a
 # script, not when it is loaded for its functions.
 if __name__ == "__main__":
    # File paths for input GPX and CSV, and output CSV
    gpx_file = 'example_route.gpx'
    csv_file = 'places.csv'
    output_file = 'sorted_places.csv'

    # Load GPX points from the input GPX file
    logging.info(f"Loading GPX file: {gpx_file}")
    with open(gpx_file, 'r') as f:
        gpx = gpxpy.parse(f)
    # Flatten every segment of every track into one ordered list of
    # (latitude, longitude) pairs.
    gpx_points = [
        (point.latitude, point.longitude)
        for track in gpx.tracks
        for segment in track.segments
        for point in segment.points
    ]
    logging.info(f"GPX file loaded with {len(gpx_points)} points.")

    # Process the CSV file and generate the sorted roadbook
    process_csv_with_smart_sorting(csv_file, gpx_points, output_file)
diff --git a/requirements.txt b/requirements.txt
 gpxpy==1.5.0
 pandas==1.5.3
 geopy==2.3.0
 rdp==0.8
 tqdm==4.64.1
Name	Y (Latitude)	X (Longitude)
Gunnison	38.5458	-106.9287
San Francisco	37.7749	-122.4194
Blanding	37.6240	-109.4780
	import gpxpy
	import pandas as pd
	from geopy.distance import geodesic
	from rdp import rdp
	from tqdm import tqdm
	import logging

	# Emit timestamped, level-tagged messages at INFO and above so that
	# progress and results are visible while the script runs.
	logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')

	def simplify_gpx(gpx_points, epsilon=0.001):
	    """
	    Reduce a GPX track to fewer points with the Ramer-Douglas-Peucker algorithm.

	    The simplification itself is delegated to ``rdp``; this wrapper only adds
	    progress logging around that call.

	    Args:
	        gpx_points (list): (latitude, longitude) pairs taken from the GPX track.
	        epsilon (float): Simplification tolerance handed to ``rdp``; smaller
	            values keep more of the original points.

	    Returns:
	        The simplified points, exactly as returned by ``rdp``.
	    """
	    logging.info(f"Starting GPX simplification with epsilon={epsilon}.")
	    reduced_track = rdp(gpx_points, epsilon=epsilon)
	    kept, total = len(reduced_track), len(gpx_points)
	    logging.info(f"GPX simplification complete: {kept} points (from {total}).")
	    return reduced_track

	def find_nearest_gpx_index(lat, lon, gpx_points):
	    """
	    Find the index of the GPX point nearest to a given location.

	    Distances are geodesic distances computed with geopy. When several
	    points are equally close, the index of the first one is returned.

	    Args:
	        lat (float): Latitude of the location.
	        lon (float): Longitude of the location.
	        gpx_points (list): (latitude, longitude) pairs from the GPX track.

	    Returns:
	        int: Index of the nearest GPX point.

	    Raises:
	        ValueError: If gpx_points is empty.
	    """
	    location = (lat, lon)
	    # Scan (index, point) pairs in a single pass instead of building a full
	    # list of distances and searching it again; default=None flags an empty
	    # track without raising the opaque "min() arg is an empty sequence".
	    nearest = min(
	        enumerate(gpx_points),
	        key=lambda indexed_point: geodesic(location, indexed_point[1]).meters,
	        default=None,
	    )
	    if nearest is None:
	        raise ValueError("Cannot find the nearest GPX point: gpx_points is empty.")
	    return nearest[0]

	def process_csv_with_smart_sorting(csv_file, gpx_points, output_file):
	    """
	    Sort the places of a CSV file along a GPX track and save the result.

	    Each place is assigned the index of its nearest point on the simplified
	    track; rows are then ordered by that index and written to ``output_file``
	    together with the new ``gpx_index`` column. Places that share the same
	    nearest track point keep their original relative order.

	    Args:
	        csv_file (str): Path to the input CSV file containing places.
	        gpx_points (list): (latitude, longitude) pairs from the GPX track.
	        output_file (str): Path to save the sorted output CSV file.

	    Raises:
	        ValueError: If the CSV file lacks the 'Y' or 'X' column.
	    """
	    logging.info(f"Reading CSV file: {csv_file}")
	    df = pd.read_csv(csv_file)

	    # Ensure the required columns are present
	    if 'Y' not in df.columns or 'X' not in df.columns:
	        logging.error("CSV file must contain 'Y' (latitude) and 'X' (longitude) columns.")
	        raise ValueError("Missing required columns in CSV file.")

	    logging.info(f"CSV file loaded with {len(df)} rows.")

	    # Simplify GPX points for faster processing
	    gpx_points = simplify_gpx(gpx_points)

	    # Find the nearest GPX point for each place in the CSV. Iterating the two
	    # coordinate columns directly avoids building a Series per row, which is
	    # what iterrows() does.
	    logging.info("Finding nearest GPX point for each place...")
	    coordinates = zip(df['Y'], df['X'])
	    df['gpx_index'] = [
	        find_nearest_gpx_index(lat, lon, gpx_points)
	        for lat, lon in tqdm(coordinates, total=len(df), desc="Processing places")
	    ]
	    logging.info("Nearest GPX point calculation complete.")

	    # Sort by GPX index. The default quicksort is not stable, so a stable
	    # algorithm is requested to keep tied places in their input order.
	    logging.info("Sorting places based on GPX track order...")
	    df = df.sort_values(by='gpx_index', kind='mergesort').reset_index(drop=True)

	    # Save the sorted DataFrame
	    logging.info(f"Saving sorted roadbook to: {output_file}")
	    df.to_csv(output_file, index=False)
	    logging.info("Roadbook saved successfully.")

	# Example Usage
	# Guarded so the example pipeline only runs when this file is executed as a
	# script, not when it is loaded for its functions.
	if __name__ == "__main__":
	    # File paths for input GPX and CSV, and output CSV
	    gpx_file = 'example_route.gpx'
	    csv_file = 'places.csv'
	    output_file = 'sorted_places.csv'

	    # Load GPX points from the input GPX file
	    logging.info(f"Loading GPX file: {gpx_file}")
	    with open(gpx_file, 'r') as f:
	        gpx = gpxpy.parse(f)
	    # Flatten every segment of every track into one ordered list of
	    # (latitude, longitude) pairs.
	    gpx_points = [
	        (point.latitude, point.longitude)
	        for track in gpx.tracks
	        for segment in track.segments
	        for point in segment.points
	    ]
	    logging.info(f"GPX file loaded with {len(gpx_points)} points.")

	    # Process the CSV file and generate the sorted roadbook
	    process_csv_with_smart_sorting(csv_file, gpx_points, output_file)