Spaces:
Build error
Build error
| import requests | |
| import urllib3 | |
| import json | |
| from utils import geoutil | |
| import regex_spatial | |
| from shapely.geometry import Polygon, MultiPoint, LineString, Point, mapping | |
| import re | |
| import geopandas as gpd | |
| from geocoder import geo_level1 | |
| from openai import OpenAI | |
| from utils.config import api_key | |
| import numpy as np | |
| client = OpenAI( | |
| api_key=api_key | |
| ) | |
| model = "gpt-4o" | |
| north = ["north", "N'", "North", "NORTH"] | |
| south = ["south", "S'", "South", "SOUTH"] | |
| east = ["east", "E'", "East", "EAST"] | |
| west = ["west", "W'", "West", "WEST"] | |
| northeast = ["north-east", "NE'", "north east", "NORTH-EAST", "North East", "NORTH EAST"] | |
| southeast = ["south-east", "SE'", "south east", "SOUTH-EAST", "South East", "SOUTH EAST"] | |
| northwest = ["north-west", "NW'", "north west", "NORTH-WEST", "North West", "NORTH WEST"] | |
| southwest = ["south-west", "SW'", "south west", "SOUTH-WEST", "South West", "SOUTH WEST"] | |
| center = ["center","central", "downtown","midtown"] | |
| def to_standard_2d_list(data): | |
| arr = np.array(data) | |
| flat = arr.flatten() | |
| if flat.size % 2 != 0: | |
| raise ValueError("元素个数不是2的倍数,不能 reshape 成 [N, 2] 格式") | |
| return flat.reshape(-1, 2).tolist() | |
| def get_geojson(ent, arr, centroid): | |
| poly_json = {} | |
| poly_json['type'] = 'FeatureCollection' | |
| poly_json['features'] = [] | |
| coordinates= [] | |
| coordinates.append(arr) | |
| poly_json['features'].append({ | |
| 'type':'Feature', | |
| 'id': ent, | |
| 'properties': { | |
| 'centroid': centroid | |
| }, | |
| 'geometry': { | |
| 'type':'Polygon', | |
| 'coordinates': coordinates | |
| } | |
| }) | |
| return poly_json | |
| def get_coordinates(ent): | |
| request_url = 'https://nominatim.openstreetmap.org/search.php?q= ' +ent +'&polygon_geojson=1&accept-language=en&format=jsonv2' | |
| headers = { | |
| "User-Agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/18.3 Safari/605.1.15" | |
| } | |
| page = requests.get(request_url, headers=headers, verify=False) | |
| json_content = json.loads(page.content) | |
| all_coordinates = json_content[0]['geojson']['coordinates'][0] | |
| centroid = (float(json_content[0]['lon']), float(json_content[0]['lat'])) | |
| for p in all_coordinates: | |
| p2 = (p[0], p[1]) | |
| angle = geoutil.calculate_bearing(centroid, p2) | |
| p.append(angle) | |
| geojson = get_geojson(ent, all_coordinates, centroid) | |
| return geojson['features'][0]['geometry']['coordinates'][0], geojson['features'][0]['properties']['centroid'] | |
| def get_coordinates(location): | |
| request_url = f'https://nominatim.openstreetmap.org/search.php?q={location}&polygon_geojson=1&accept-language=en&format=jsonv2' | |
| print(request_url) | |
| headers = {"User-Agent": "Mozilla/5.0"} | |
| response = requests.get(request_url, headers=headers, verify=False) | |
| json_content = json.loads(response.content) | |
| if json_content[0]['geojson']['type'] == 'Polygon': | |
| coordinates = json_content[0]['geojson']['coordinates'][0] | |
| elif json_content[0]['geojson']['type'] == 'Point': | |
| coordinates = json_content[0]['geojson']['coordinates'] | |
| else: | |
| print(json_content[0]['geojson']['type']) | |
| centroid = (float(json_content[0]['lon']), float(json_content[0]['lat'])) | |
| return (coordinates, centroid) | |
| # level3 | |
| def get_directional_coordinates_by_angle(coordinates, centroid, direction, minimum, maximum): | |
| direction_coordinates = [] | |
| for p in coordinates: | |
| angle = geoutil.calculate_bearing(centroid, p) | |
| p2 = (p[0], p[1], angle) | |
| if direction in geo_level1.east: | |
| if angle >= minimum or angle <= maximum: | |
| direction_coordinates.append(p2) | |
| else: | |
| if angle >= minimum and angle <= maximum: | |
| direction_coordinates.append(p2) | |
| return direction_coordinates | |
| def get_level3(level3): | |
| digits = re.findall('[0-9]+', level3)[0] | |
| unit = re.findall('[A-Za-z]+', level3)[0] | |
| return digits, unit | |
| def get_direction_coordinates(coordinates, centroid, level1): | |
| min_max = geo_level1.get_min_max(level1) | |
| if min_max is not None: | |
| coord = get_directional_coordinates_by_angle(coordinates, centroid, level1, min_max[0], min_max[1]) | |
| return coord | |
| return coordinates | |
| def sort_west(poly1, poly2, centroid): | |
| coords1 = mapping(poly1)["features"][0]["geometry"]["coordinates"] | |
| coords2 = mapping(poly2)["features"][0]["geometry"]["coordinates"] | |
| coord1 = [] | |
| coord2 = [] | |
| coord = [] | |
| for c in coords1: | |
| pol = list(c[::-1]) | |
| coord1.extend(pol) | |
| for c in coords2: | |
| pol = list(c[::-1]) | |
| coord2.extend(pol) | |
| coo1 = [] | |
| coo2 = [] | |
| for p in coord1: | |
| angle = geoutil.calculate_bearing(centroid, p) | |
| if angle >= 157 and angle <= 202: | |
| coo1.append((p[0], p[1], angle)) | |
| for p in coord2: | |
| angle = geoutil.calculate_bearing(centroid, p) | |
| if angle >= 157 and angle <= 202: | |
| coo2.append((p[0], p[1], angle)) | |
| coo1.extend(coo2) | |
| return coo1 | |
| def get_level3_coordinates(coordinates, level_3, level1): | |
| distance, unit = get_level3(level_3) | |
| kms = geoutil.get_kilometers(distance, unit) | |
| coord = [] | |
| coords0, center = coordinates | |
| if not isinstance(coords0, list) or len(coords0) < 3: | |
| lat_km = 111.32 | |
| lon_km = 111.32 * np.cos(np.radians(center[1])) | |
| dx = dy = 0 | |
| if level1 is not None: | |
| if level1 in geo_level1.east: | |
| dx = kms / lon_km | |
| elif level1 in geo_level1.west: | |
| dx = -kms / lon_km | |
| elif level1 in geo_level1.north: | |
| dy = kms / lat_km | |
| elif level1 in geo_level1.south: | |
| dy = -kms / lat_km | |
| new_center = (center[0] + dx, center[1] + dy) | |
| r_km = 1 | |
| circle_points = [] | |
| for theta in np.linspace(0, 360, num=100): | |
| theta_rad = np.radians(theta) | |
| d_lat = (np.sin(theta_rad) * r_km) / lat_km | |
| d_lon = (np.cos(theta_rad) * r_km) / lon_km | |
| circle_points.append((new_center[0] + d_lon, new_center[1] + d_lat)) | |
| if circle_points: | |
| center_point = MultiPoint(circle_points).centroid | |
| center = (center_point.x, center_point.y) | |
| else: | |
| center = new_center | |
| return circle_points, center | |
| poly1 = Polygon(coords0) | |
| polygon1 = gpd.GeoSeries(poly1) | |
| poly2 = polygon1.buffer(0.0095 * kms, join_style=2) | |
| poly3 = polygon1.buffer(0.013 * kms, join_style=2) | |
| poly = poly3.difference(poly2) | |
| coords = mapping(poly)["features"][0]["geometry"]["coordinates"] | |
| for c in coords: | |
| pol = list(c[::-1]) | |
| coord.extend(pol) | |
| if level1 is not None: | |
| coord = get_direction_coordinates(coord, coordinates[1], level1) | |
| if level1 in geo_level1.west: | |
| coord = sort_west(poly3, poly2, coordinates[1]) | |
| if coord: | |
| center_point = MultiPoint(coord).centroid | |
| center = (center_point.x, center_point.y) | |
| else: | |
| center = coordinates[1] | |
| return coord, center | |
| # between | |
| def get_between_coordinates(coordinates1, coordinates2): | |
| def is_valid_polygon(coords): | |
| return isinstance(coords, list) and len(coords) >= 3 | |
| coords1, center1 = coordinates1 | |
| coords2, center2 = coordinates2 | |
| if is_valid_polygon(coords1): | |
| poly1 = Polygon(coords1) | |
| area1 = poly1.area | |
| else: | |
| area1 = 0 | |
| if is_valid_polygon(coords2): | |
| poly2 = Polygon(coords2) | |
| area2 = poly2.area | |
| else: | |
| area2 = 0 | |
| midpoint = ( | |
| (center1[0] + center2[0]) / 2, | |
| (center1[1] + center2[1]) / 2 | |
| ) | |
| if area1 == 0 and area2 == 0: | |
| r_km = 2 | |
| else: | |
| avg_area = (area1 + area2) / 2 | |
| r_km = np.sqrt(avg_area / np.pi) * 111.32 # 近似 km 半径 | |
| lat_km = 111.32 | |
| lon_km = 111.32 * np.cos(np.radians(midpoint[1])) | |
| circle_points = [] | |
| for theta in np.linspace(0, 360, num=100): | |
| theta_rad = np.radians(theta) | |
| d_lat = (np.sin(theta_rad) * r_km) / lat_km | |
| d_lon = (np.cos(theta_rad) * r_km) / lon_km | |
| circle_points.append((midpoint[0] + d_lon, midpoint[1] + d_lat)) | |
| return circle_points, midpoint | |
| def llmapi(text): | |
| system_prompt = ( | |
| "You are an experienced geographer. Your task is to determine the correct sequence of positioning functions and their inputs based on a given piece of natural language.\n" | |
| "The positioning functions you can choose from are:\n" | |
| "1. Relative Positioning: Inputs is (location coordinate or location name, direction, and distance). Outputs the coordinates that are in the given 'direction' and 'distance' from the input location.\n" | |
| "2. Between Positioning: Inputs is (location 1 coordinates or location 1 name, location 2 coordinates or location 2 name). Outputs the midpoint coordinate between the two locations.\n" | |
| "You can only use the given functions, and the inputs to the functions must obey the above properties. The given functions can be combined to solve complex situations." | |
| "First, perform chain-of-thought (CoT) reasoning, and finally output your answer in JSON format, wrapped between `<<<JSON>>>` and `<<<END>>>`.\n" | |
| "Make sure all inputs only include: location names (strings), step indices (integers), directions (strings, must be in English), or distances (strings with units). Do not return expressions like 'the coordinate 4 km south of Chatswood'.\n" | |
| "Each step must have an 'id'. If the input of a step is the output of a previous step, use that step’s 'id' as the input.\n" | |
| "All directions must be in English (e.g., south, west, northeast, etc.).\n" | |
| "Example output:\n" | |
| "<<<JSON>>>\n" | |
| "[{\"id\": 1, \"function\": \"Relative\", \"inputs\": [\"Chatswood\", \"south\", \"4 km\"]}," | |
| "{\"id\": 2, \"function\": \"Relative\", \"inputs\": [\"North Sydney\", \"west\", \"2 km\"]}," | |
| "{\"id\": 3, \"function\": \"Between\", \"inputs\": [1, 2]}," | |
| "{\"id\": 4, \"function\": \"Relative\", \"inputs\": [3, \"southwest\", \"5 km\"]}]\n" | |
| "<<<END>>>") | |
| messages = [ | |
| {"role": "system", "content": system_prompt}, | |
| {"role": "user", "content": text}, | |
| ] | |
| chat_completion = client.chat.completions.create( | |
| messages=messages, | |
| model=model, | |
| ) | |
| result = chat_completion.choices[0].message.content | |
| json_match = re.search(r'<<<JSON>>>\n(.*?)\n<<<END>>>', result, re.DOTALL) | |
| if json_match: | |
| return json.loads(json_match.group(1)) | |
| else: | |
| raise ValueError("The LLM output does not contain the expected JSON formatted data. Please try again.") | |
| def execute_steps(steps): | |
| data = {} | |
| locations_history = [] | |
| for step in steps: | |
| step_id = step['id'] | |
| function = step['function'] | |
| inputs = step['inputs'] | |
| resolved_inputs = [] | |
| for inp in inputs: | |
| if isinstance(inp, int): | |
| resolved_inputs.append(data[inp]) | |
| else: | |
| resolved_inputs.append(inp) | |
| if function == "Relative": | |
| location, direction, distance = resolved_inputs | |
| if isinstance(location, str): | |
| location = get_coordinates(location) | |
| locations_history.append(location) | |
| location = [to_standard_2d_list(location[0])] + list(location[1:]) | |
| result = get_level3_coordinates(location, distance, direction) | |
| locations_history.append(result) | |
| data[step_id] = result | |
| elif function == "Between": | |
| location1, location2 = resolved_inputs | |
| if isinstance(location1, str): | |
| location1 = get_coordinates(location1) | |
| locations_history.append(location1) | |
| location1 = [to_standard_2d_list(location1[0])] + list(location1[1:]) | |
| if isinstance(location2, str): | |
| location2 = get_coordinates(location2) | |
| locations_history.append(location2) | |
| location2 = [to_standard_2d_list(location2[0])] + list(location2[1:]) | |
| result = get_between_coordinates(location1, location2) | |
| locations_history.append(result) | |
| data[step_id] = result | |
| return [data, locations_history] | |
| if __name__ == '__main__': | |
| parsed_steps = [] | |
| step_loc = execute_steps(parsed_steps) | |
| result = step_loc[0] | |