pg_orrery/src/gist_tle.c
Ryan Malloy a792e7e083 Extend GiST index to 2-D: altitude + inclination
The 1-D altitude-band index only pruned ~25% of the 22k satellite
catalog (eliminates MEO/GEO/HEO but 75% is LEO).  Adding inclination
as a second indexed dimension prunes an additional ~40% of remaining
candidates — objects in equatorial or low-inclination orbits that
geometrically cannot pass over the observer's latitude.

Key changes:
- tle_alt_range (16 bytes) → tle_orbital_key (32 bytes) with
  inc_low/inc_high fields
- All 8 GiST support functions updated for 2-D bounding boxes
- Penalty uses margin (half-perimeter) not area to avoid degeneracy
  when leaf entries have zero-width inclination ranges
- Picksplit selects split dimension by normalized spread
- && operator now checks altitude AND inclination overlap
- <-> operator remains altitude-only (conjunction screening is
  altitude-dominant)
- SQL operator comments updated for 2-D semantics
- Test adds Equatorial-LEO satellite at ISS altitude but 5° inclination
  to validate inclination-based pruning
2026-02-15 18:10:19 -07:00

573 lines
16 KiB
C

/*
* gist_tle.c -- GiST operator class for 2-D orbital indexing on TLE
*
* Every TLE defines an orbit whose perigee/apogee altitudes and
* inclination form a 2-D bounding box in (altitude, inclination) space.
* Two orbits can only be in proximity if their altitude bands overlap
* AND their inclination ranges overlap -- both necessary but not
* sufficient conditions for conjunction.
*
* The GiST index stores [alt_low, alt_high] x [inc_low, inc_high] keys,
* enabling fast coarse filtering. For leaf entries inc_low == inc_high
* (exact value); internal nodes widen to the bounding box of children.
*
* The && (overlap) operator is always rechecked: real conjunction
* screening requires propagation.
*
* Semi-major axis from Kepler's third law using WGS-72 constants:
* a = (KE / n)^(2/3) [earth radii]
* perigee_km = a*(1-e)*AE - AE
* apogee_km = a*(1+e)*AE - AE
*/
#include "postgres.h"
#include "fmgr.h"
#include "access/gist.h"
#include "access/stratnum.h"
#include "utils/float.h"
#include "norad.h"
#include "types.h"
#include <math.h>
#include <float.h>
PG_FUNCTION_INFO_V1(tle_overlap);
PG_FUNCTION_INFO_V1(tle_alt_distance);
PG_FUNCTION_INFO_V1(gist_tle_compress);
PG_FUNCTION_INFO_V1(gist_tle_decompress);
PG_FUNCTION_INFO_V1(gist_tle_consistent);
PG_FUNCTION_INFO_V1(gist_tle_union);
PG_FUNCTION_INFO_V1(gist_tle_penalty);
PG_FUNCTION_INFO_V1(gist_tle_picksplit);
PG_FUNCTION_INFO_V1(gist_tle_same);
PG_FUNCTION_INFO_V1(gist_tle_distance);
/* Floating-point comparison tolerance (km and radians) */
#define KEY_EPSILON 1.0e-9
/*
* 2-D orbital key extracted from a TLE's mean elements.
* Altitude band (perigee/apogee) plus inclination range.
* This is the GiST internal key -- much cheaper to compare
* than propagating two full state vectors.
*
* For leaf entries: inc_low == inc_high (exact inclination).
* For internal nodes: bounding box over all children.
*/
typedef struct tle_orbital_key
{
double alt_low; /* perigee altitude, km */
double alt_high; /* apogee altitude, km */
double inc_low; /* inclination lower bound, radians */
double inc_high; /* inclination upper bound, radians */
} tle_orbital_key;
/* ----------------------------------------------------------------
* tle_to_orbital_key -- compute [perigee, apogee] x [inc, inc]
*
* Uses WGS-72 KE and AE (the only constants valid for SGP4 elements).
* Degenerate TLEs with n <= 0 map to zero-width ranges at 0.
* Inclination is stored in radians (same as pg_tle).
* ----------------------------------------------------------------
*/
static void
tle_to_orbital_key(const pg_tle *tle, tle_orbital_key *key)
{
double n = tle->mean_motion; /* rad/min */
double e = tle->eccentricity;
double a_er; /* semi-major axis, earth radii */
if (n <= 0.0)
{
key->alt_low = 0.0;
key->alt_high = 0.0;
key->inc_low = 0.0;
key->inc_high = 0.0;
return;
}
a_er = pow(WGS72_KE / n, 2.0 / 3.0);
key->alt_low = a_er * (1.0 - e) * WGS72_AE - WGS72_AE;
key->alt_high = a_er * (1.0 + e) * WGS72_AE - WGS72_AE;
/* Guard against numerical inversion from near-zero eccentricity */
if (key->alt_low > key->alt_high)
{
double tmp = key->alt_low;
key->alt_low = key->alt_high;
key->alt_high = tmp;
}
/* Leaf entry: exact inclination (radians) */
key->inc_low = tle->inclination;
key->inc_high = tle->inclination;
}
/* ----------------------------------------------------------------
* key_overlaps -- do two orbital keys overlap in BOTH dimensions?
*
* Altitude bands AND inclination ranges must both overlap.
* ----------------------------------------------------------------
*/
static inline bool
key_overlaps(const tle_orbital_key *a, const tle_orbital_key *b)
{
return (a->alt_low <= b->alt_high) && (b->alt_low <= a->alt_high)
&& (a->inc_low <= b->inc_high) && (b->inc_low <= a->inc_high);
}
/* ----------------------------------------------------------------
* key_contains -- does outer fully contain inner in both dimensions?
* ----------------------------------------------------------------
*/
static inline bool
key_contains(const tle_orbital_key *outer, const tle_orbital_key *inner)
{
return (outer->alt_low <= inner->alt_low)
&& (inner->alt_high <= outer->alt_high)
&& (outer->inc_low <= inner->inc_low)
&& (inner->inc_high <= outer->inc_high);
}
/* ----------------------------------------------------------------
* key_merge -- expand dst bounding box to encompass src
* ----------------------------------------------------------------
*/
static inline void
key_merge(tle_orbital_key *dst, const tle_orbital_key *src)
{
if (src->alt_low < dst->alt_low)
dst->alt_low = src->alt_low;
if (src->alt_high > dst->alt_high)
dst->alt_high = src->alt_high;
if (src->inc_low < dst->inc_low)
dst->inc_low = src->inc_low;
if (src->inc_high > dst->inc_high)
dst->inc_high = src->inc_high;
}
/* ----------------------------------------------------------------
* alt_separation -- minimum altitude gap between two keys
*
* Returns 0 if the altitude bands overlap.
* Used for KNN distance (altitude-dominant ordering).
* ----------------------------------------------------------------
*/
static inline double
alt_separation(const tle_orbital_key *a, const tle_orbital_key *b)
{
if (a->alt_high < b->alt_low)
return b->alt_low - a->alt_high;
if (b->alt_high < a->alt_low)
return a->alt_low - b->alt_high;
return 0.0;
}
/* ================================================================
* SQL-callable operators
* ================================================================
*/
/*
* tle_overlap(tle, tle) -> bool [the && operator]
*
* True if two TLEs overlap in both altitude AND inclination.
* This is a fast pre-filter: overlapping keys are necessary
* but not sufficient for actual conjunction.
*/
Datum
tle_overlap(PG_FUNCTION_ARGS)
{
pg_tle *a = (pg_tle *) PG_GETARG_POINTER(0);
pg_tle *b = (pg_tle *) PG_GETARG_POINTER(1);
tle_orbital_key ka, kb;
tle_to_orbital_key(a, &ka);
tle_to_orbital_key(b, &kb);
PG_RETURN_BOOL(key_overlaps(&ka, &kb));
}
/*
* tle_alt_distance(tle, tle) -> float8 [the <-> operator]
*
* Minimum altitude-band separation in km. Returns 0 if the bands
* overlap. This is not the physical distance between the objects --
* it is the gap between their orbital shells, useful for ordering
* nearest-neighbor queries without propagation.
*
* Altitude-only: inclination weighting adds complexity without
* meaningful benefit for KNN conjunction screening.
*/
Datum
tle_alt_distance(PG_FUNCTION_ARGS)
{
pg_tle *a = (pg_tle *) PG_GETARG_POINTER(0);
pg_tle *b = (pg_tle *) PG_GETARG_POINTER(1);
tle_orbital_key ka, kb;
tle_to_orbital_key(a, &ka);
tle_to_orbital_key(b, &kb);
PG_RETURN_FLOAT8(alt_separation(&ka, &kb));
}
/* ================================================================
* GiST support functions
* ================================================================
*/
/*
* gist_tle_compress -- extract orbital key from a leaf TLE
*
* Leaf entries carry the full pg_tle; we compress to tle_orbital_key.
* Internal entries are already tle_orbital_key from union operations.
*/
Datum
gist_tle_compress(PG_FUNCTION_ARGS)
{
GISTENTRY *entry = (GISTENTRY *) PG_GETARG_POINTER(0);
GISTENTRY *retval;
if (entry->leafkey)
{
pg_tle *tle = (pg_tle *) DatumGetPointer(entry->key);
tle_orbital_key *key = (tle_orbital_key *) palloc(sizeof(tle_orbital_key));
tle_to_orbital_key(tle, key);
retval = (GISTENTRY *) palloc(sizeof(GISTENTRY));
gistentryinit(*retval, PointerGetDatum(key),
entry->rel, entry->page, entry->offset, false);
}
else
{
/* Internal node: already a tle_orbital_key */
retval = entry;
}
PG_RETURN_POINTER(retval);
}
/*
* gist_tle_decompress -- identity (we operate on compressed keys directly)
*/
Datum
gist_tle_decompress(PG_FUNCTION_ARGS)
{
PG_RETURN_POINTER(PG_GETARG_POINTER(0));
}
/*
* gist_tle_consistent -- can this subtree contain matches for the query?
*
* Checks overlap in both altitude AND inclination dimensions.
* Always sets recheck = true because 2-D overlap is only a necessary
* condition -- the real conjunction test requires propagation.
*/
Datum
gist_tle_consistent(PG_FUNCTION_ARGS)
{
GISTENTRY *entry = (GISTENTRY *) PG_GETARG_POINTER(0);
pg_tle *query = (pg_tle *) PG_GETARG_POINTER(1);
StrategyNumber strategy = (StrategyNumber) PG_GETARG_UINT16(2);
/* arg 3 is the query type OID, unused */
bool *recheck = (bool *) PG_GETARG_POINTER(4);
tle_orbital_key *key = (tle_orbital_key *) DatumGetPointer(entry->key);
tle_orbital_key query_key;
bool result;
tle_to_orbital_key(query, &query_key);
*recheck = true;
switch (strategy)
{
case RTOverlapStrategyNumber: /* && */
result = key_overlaps(key, &query_key);
break;
case RTContainedByStrategyNumber: /* <@ */
if (GIST_LEAF(entry))
result = key_contains(&query_key, key);
else
result = key_overlaps(key, &query_key);
break;
case RTContainsStrategyNumber: /* @> */
if (GIST_LEAF(entry))
result = key_contains(key, &query_key);
else
result = key_overlaps(key, &query_key);
break;
default:
elog(ERROR, "gist_tle_consistent: unrecognized strategy %d",
strategy);
result = false;
break;
}
PG_RETURN_BOOL(result);
}
/*
* gist_tle_union -- compute 2-D bounding box for a set of entries
*
* The union is [min(alt_low), max(alt_high)] x [min(inc_low), max(inc_high)].
*/
Datum
gist_tle_union(PG_FUNCTION_ARGS)
{
GistEntryVector *entryvec = (GistEntryVector *) PG_GETARG_POINTER(0);
int *sizep = (int *) PG_GETARG_POINTER(1);
int i;
tle_orbital_key *result;
tle_orbital_key *cur;
result = (tle_orbital_key *) palloc(sizeof(tle_orbital_key));
cur = (tle_orbital_key *) DatumGetPointer(entryvec->vector[0].key);
*result = *cur;
for (i = 1; i < entryvec->n; i++)
{
cur = (tle_orbital_key *) DatumGetPointer(entryvec->vector[i].key);
key_merge(result, cur);
}
*sizep = sizeof(tle_orbital_key);
PG_RETURN_POINTER(result);
}
/*
* gist_tle_penalty -- cost of inserting a new entry into an existing subtree
*
* Uses margin (half-perimeter) instead of area. Leaf entries have
* inc_low == inc_high, giving zero area -- area-based penalty would
* degenerate to 0 for every insertion, making the tree random.
* Margin remains non-zero for degenerate (zero-width) bounding boxes.
*/
Datum
gist_tle_penalty(PG_FUNCTION_ARGS)
{
GISTENTRY *origentry = (GISTENTRY *) PG_GETARG_POINTER(0);
GISTENTRY *newentry = (GISTENTRY *) PG_GETARG_POINTER(1);
float *penalty = (float *) PG_GETARG_POINTER(2);
tle_orbital_key *orig = (tle_orbital_key *) DatumGetPointer(origentry->key);
tle_orbital_key *add = (tle_orbital_key *) DatumGetPointer(newentry->key);
double orig_margin;
double merged_margin;
orig_margin = (orig->alt_high - orig->alt_low)
+ (orig->inc_high - orig->inc_low);
merged_margin = (fmax(orig->alt_high, add->alt_high) - fmin(orig->alt_low, add->alt_low))
+ (fmax(orig->inc_high, add->inc_high) - fmin(orig->inc_low, add->inc_low));
*penalty = (float)(merged_margin - orig_margin);
PG_RETURN_POINTER(penalty);
}
/*
* Comparison callback for qsort in picksplit.
* Sorts entries by a sort key chosen at call time.
*/
typedef struct
{
int index; /* position in the original entry vector */
double sortval; /* midpoint in the chosen dimension */
} picksplit_item;
static int
picksplit_cmp(const void *a, const void *b)
{
double ma = ((const picksplit_item *) a)->sortval;
double mb = ((const picksplit_item *) b)->sortval;
if (ma < mb)
return -1;
if (ma > mb)
return 1;
return 0;
}
/*
* gist_tle_picksplit -- split an overfull page into two groups
*
* Standard R-tree approach: compute spread in both dimensions, split
* along whichever dimension has the greater spread. This prevents
* the tree from becoming biased toward one dimension.
*/
Datum
gist_tle_picksplit(PG_FUNCTION_ARGS)
{
GistEntryVector *entryvec = (GistEntryVector *) PG_GETARG_POINTER(0);
GIST_SPLITVEC *splitvec = (GIST_SPLITVEC *) PG_GETARG_POINTER(1);
int nentries = entryvec->n;
picksplit_item *items;
tle_orbital_key *left_union;
tle_orbital_key *right_union;
tle_orbital_key *cur;
int split_at;
int i;
double alt_min, alt_max, inc_min, inc_max;
double alt_spread, inc_spread;
bool split_on_alt;
/* First pass: compute spread in both dimensions */
cur = (tle_orbital_key *) DatumGetPointer(entryvec->vector[0].key);
alt_min = (cur->alt_low + cur->alt_high) / 2.0;
alt_max = alt_min;
inc_min = (cur->inc_low + cur->inc_high) / 2.0;
inc_max = inc_min;
for (i = 1; i < nentries; i++)
{
double alt_mid, inc_mid;
cur = (tle_orbital_key *) DatumGetPointer(entryvec->vector[i].key);
alt_mid = (cur->alt_low + cur->alt_high) / 2.0;
inc_mid = (cur->inc_low + cur->inc_high) / 2.0;
if (alt_mid < alt_min) alt_min = alt_mid;
if (alt_mid > alt_max) alt_max = alt_mid;
if (inc_mid < inc_min) inc_min = inc_mid;
if (inc_mid > inc_max) inc_max = inc_mid;
}
/*
* Normalize spreads so they're comparable. Altitude is km above
* surface (range ~0-35786), inclination in radians (range 0-pi).
* Divide each by its domain width to get a 0-1 fraction.
*/
alt_spread = (alt_max - alt_min) / 35786.0; /* GEO altitude above surface */
inc_spread = (inc_max - inc_min) / M_PI;
split_on_alt = (alt_spread >= inc_spread);
/* Second pass: compute sort values in the chosen dimension */
items = (picksplit_item *) palloc(sizeof(picksplit_item) * nentries);
for (i = 0; i < nentries; i++)
{
cur = (tle_orbital_key *) DatumGetPointer(entryvec->vector[i].key);
items[i].index = i;
if (split_on_alt)
items[i].sortval = (cur->alt_low + cur->alt_high) / 2.0;
else
items[i].sortval = (cur->inc_low + cur->inc_high) / 2.0;
}
qsort(items, nentries, sizeof(picksplit_item), picksplit_cmp);
split_at = nentries / 2;
/* Allocate offset arrays (GiST uses OffsetNumber, 1-based) */
splitvec->spl_left = (OffsetNumber *) palloc(sizeof(OffsetNumber) * nentries);
splitvec->spl_right = (OffsetNumber *) palloc(sizeof(OffsetNumber) * nentries);
splitvec->spl_nleft = 0;
splitvec->spl_nright = 0;
/* Compute union keys and assign entries */
left_union = (tle_orbital_key *) palloc(sizeof(tle_orbital_key));
right_union = (tle_orbital_key *) palloc(sizeof(tle_orbital_key));
/* Seed the unions from the first entry in each half */
cur = (tle_orbital_key *) DatumGetPointer(
entryvec->vector[items[0].index].key);
*left_union = *cur;
cur = (tle_orbital_key *) DatumGetPointer(
entryvec->vector[items[split_at].index].key);
*right_union = *cur;
for (i = 0; i < nentries; i++)
{
int idx = items[i].index;
cur = (tle_orbital_key *) DatumGetPointer(
entryvec->vector[idx].key);
if (i < split_at)
{
splitvec->spl_left[splitvec->spl_nleft++] =
(OffsetNumber)(idx + 1); /* 1-based */
key_merge(left_union, cur);
}
else
{
splitvec->spl_right[splitvec->spl_nright++] =
(OffsetNumber)(idx + 1);
key_merge(right_union, cur);
}
}
splitvec->spl_ldatum = PointerGetDatum(left_union);
splitvec->spl_rdatum = PointerGetDatum(right_union);
pfree(items);
PG_RETURN_POINTER(splitvec);
}
/*
* gist_tle_same -- equality test on compressed keys
*
* Two orbital keys are "same" if all four bounds match within
* tolerance. This lets the GiST machinery detect duplicate keys.
*/
Datum
gist_tle_same(PG_FUNCTION_ARGS)
{
tle_orbital_key *a = (tle_orbital_key *) PG_GETARG_POINTER(0);
tle_orbital_key *b = (tle_orbital_key *) PG_GETARG_POINTER(1);
bool *result = (bool *) PG_GETARG_POINTER(2);
*result = (fabs(a->alt_low - b->alt_low) < KEY_EPSILON
&& fabs(a->alt_high - b->alt_high) < KEY_EPSILON
&& fabs(a->inc_low - b->inc_low) < KEY_EPSILON
&& fabs(a->inc_high - b->inc_high) < KEY_EPSILON);
PG_RETURN_POINTER(result);
}
/*
* gist_tle_distance -- GiST distance function for KNN ordering
*
* Returns the minimum altitude-band separation in km.
* For overlapping ranges this is 0, making the entry a candidate.
* The planner uses this to drive ORDER BY <-> queries.
*
* Altitude-only: conjunction screening is altitude-dominant.
* Inclination weighting can be added later if needed.
*/
Datum
gist_tle_distance(PG_FUNCTION_ARGS)
{
GISTENTRY *entry = (GISTENTRY *) PG_GETARG_POINTER(0);
pg_tle *query = (pg_tle *) PG_GETARG_POINTER(1);
/* strategy number at arg 2, unused for single-distance class */
tle_orbital_key *key = (tle_orbital_key *) DatumGetPointer(entry->key);
tle_orbital_key query_key;
tle_to_orbital_key(query, &query_key);
PG_RETURN_FLOAT8(alt_separation(key, &query_key));
}