1 files changed, 98 insertions, 238 deletions
diff --git a/src/backend/optimizer/util/pathnode.c b/src/backend/optimizer/util/pathnode.c
index f1e0f5e3ae3..f3b99f88929 100644
--- a/src/backend/optimizer/util/pathnode.c
+++ b/src/backend/optimizer/util/pathnode.c
@@ -7,7 +7,7 @@
  *
  *
  * IDENTIFICATION
- *	  $Header: /cvsroot/pgsql/src/backend/optimizer/util/pathnode.c,v 1.53 1999/08/06 04:00:17 tgl Exp $
+ *	  $Header: /cvsroot/pgsql/src/backend/optimizer/util/pathnode.c,v 1.54 1999/08/16 02:17:58 tgl Exp $
  *
  *-------------------------------------------------------------------------
  */
@@ -18,16 +18,12 @@
 
 
 #include "optimizer/cost.h"
-#include "optimizer/keys.h"
-#include "optimizer/ordering.h"
 #include "optimizer/pathnode.h"
 #include "optimizer/paths.h"
 #include "optimizer/plancat.h"
 #include "optimizer/restrictinfo.h"
 #include "parser/parsetree.h"
 
-static Path *better_path(Path *new_path, List *unique_paths, bool *is_new);
-
 
 /*****************************************************************************
  *		MISC. PATH UTILITIES
@@ -84,186 +80,104 @@ set_cheapest(RelOptInfo *parent_rel, List *pathlist)
 
 /*
  * add_pathlist
- *	  For each path in the list 'new_paths', add to the list 'unique_paths'
- *	  only those paths that are unique (i.e., unique ordering and ordering
- *	  keys).  Should a conflict arise, the more expensive path is thrown out,
- *	  thereby pruning the plan space.  But we don't prune if xfunc
- *	  told us not to.
+ *	  Construct an output path list by adding to old_paths each path in
+ *	  new_paths that is worth considering --- that is, it has either a
+ *	  better sort order (better pathkeys) or cheaper cost than any of the
+ *	  existing old paths.
  *
- * 'parent_rel' is the relation entry to which these paths correspond.
+ *	  Unless parent_rel->pruneable is false, we also remove from the output
+ *	  pathlist any old paths that are dominated by added path(s) --- that is,
+ *	  some new path is both cheaper and at least as well ordered.
  *
- * Returns the list of unique pathnodes.
+ *	  Note: the list old_paths is destructively modified, and in fact is
+ *	  turned into the output list.
  *
+ * 'parent_rel' is the relation entry to which these paths correspond.
+ * 'old_paths' is the list of previously accepted paths for parent_rel.
+ * 'new_paths' is a list of potential new paths.
+ *
+ * Returns the updated list of interesting pathnodes.
  */
 List *
-add_pathlist(RelOptInfo *parent_rel, List *unique_paths, List *new_paths)
+add_pathlist(RelOptInfo *parent_rel, List *old_paths, List *new_paths)
 {
 	List	   *p1;
 
 	foreach(p1, new_paths)
 	{
 		Path	   *new_path = (Path *) lfirst(p1);
-		Path	   *old_path;
-		bool		is_new;
-
-		/* Is this new path already in unique_paths? */
-		if (member(new_path, unique_paths))
-			continue;
-
-		/* Find best matching path */
-		old_path = better_path(new_path, unique_paths, &is_new);
-
-		if (is_new)
-		{
-			/* This is a brand new path.  */
-			new_path->parent = parent_rel;
-			unique_paths = lcons(new_path, unique_paths);
-		}
-		else if (old_path == NULL)
-		{
-			;					/* do nothing if path is not cheaper */
-		}
-		else if (old_path != NULL)
-		{						/* (IsA(old_path,Path)) { */
-			new_path->parent = parent_rel;
-			if (!parent_rel->pruneable)
-				unique_paths = lcons(new_path, unique_paths);
-			else
-				unique_paths = lcons(new_path,
-									 LispRemove(old_path, unique_paths));
-		}
-	}
-	return unique_paths;
-}
+		bool		accept_new = true; /* unless we find a superior old path */
+		List	   *p2_prev = NIL;
+		List	   *p2;
 
-/*
- * better_path
- *	  Determines whether 'new_path' has the same ordering and keys as some
- *	  path in the list 'unique_paths'.	If there is a redundant path,
- *	  eliminate the more expensive path.
- *
- * Returns:
- *	  The old path - if 'new_path' matches some path in 'unique_paths' and is
- *				cheaper
- *	  nil - if 'new_path' matches but isn't cheaper
- *	  t - if there is no path in the list with the same ordering and keys
- *
- */
-static Path *
-better_path(Path *new_path, List *unique_paths, bool *is_new)
-{
-	Path	   *path = (Path *) NULL;
-	List	   *temp = NIL;
-	int			better_key;
-	int			better_sort;
-
-#ifdef OPTDUP_DEBUG
-	printf("better_path entry\n");
-	printf("new\n");
-	pprint(new_path);
-	printf("unique_paths\n");
-	pprint(unique_paths);
-#endif
-
-	foreach(temp, unique_paths)
-	{
-		path = (Path *) lfirst(temp);
-
-#ifdef OPTDUP_DEBUG
-		if (!pathkeys_match(new_path->pathkeys, path->pathkeys, &better_key) ||
-			better_key != 0)
-		{
-			printf("betterkey = %d\n", better_key);
-			printf("newpath\n");
-			pprint(new_path->pathkeys);
-			printf("oldpath\n");
-			pprint(path->pathkeys);
-			if (path->pathkeys && new_path->pathkeys &&
-				length(lfirst(path->pathkeys)) >= 2		/* &&
-														 * length(lfirst(path->pa
-														 * thkeys)) <
-														 * length(lfirst(new_path
-					->pathkeys)) */ )
-				sleep(0);		/* set breakpoint here */
-		}
-		if (!pathorder_match(new_path->pathorder, path->pathorder,
-							 &better_sort) ||
-			better_sort != 0)
+		/*
+		 * Loop to check proposed new path against old paths.  Note it is
+		 * possible for more than one old path to be tossed out because
+		 * new_path dominates it.
+		 */
+		foreach(p2, old_paths)
 		{
-			printf("neword\n");
-			pprint(new_path->pathorder);
-			printf("oldord\n");
-			pprint(path->pathorder);
-		}
-#endif
+			Path	   *old_path = (Path *) lfirst(p2);
+			bool		remove_old = false;	/* unless new proves superior */
 
-		if (pathkeys_match(new_path->pathkeys, path->pathkeys,
-						   &better_key) &&
-			pathorder_match(new_path->pathorder, path->pathorder,
-							&better_sort))
-		{
+			switch (compare_pathkeys(new_path->pathkeys, old_path->pathkeys))
+			{
+				case PATHKEYS_EQUAL:
+					if (new_path->path_cost < old_path->path_cost)
+						remove_old = true; /* new dominates old */
+					else
+						accept_new = false;	/* old equals or dominates new */
+					break;
+				case PATHKEYS_BETTER1:
+					if (new_path->path_cost <= old_path->path_cost)
+						remove_old = true; /* new dominates old */
+					break;
+				case PATHKEYS_BETTER2:
+					if (new_path->path_cost >= old_path->path_cost)
+						accept_new = false;	/* old dominates new */
+					break;
+				case PATHKEYS_DIFFERENT:
+					/* keep both paths, since they have different ordering */
+					break;
+			}
 
 			/*
-			 * Replace pathkeys that match exactly, {{1,2}}, {{1,2}}
-			 * Replace pathkeys {{1,2}} with {{1,2,3}}} if the latter is
-			 * not more expensive and replace unordered path with ordered
-			 * path if it is not more expensive.  Favor sorted keys over
-			 * unsorted keys in the same way.
+			 * Remove current element from old_list if dominated by new,
+			 * unless xfunc told us not to remove any paths.
 			 */
-			/* same keys, and new is cheaper, use it */
-			if ((better_key == 0 && better_sort == 0 &&
-				 new_path->path_cost < path->path_cost) ||
-
-			/* new is better, and cheaper, use it */
-				(((better_key == 1 && better_sort != 2) ||
-				  (better_key != 2 && better_sort == 1)) &&
-				 new_path->path_cost <= path->path_cost))
+			if (remove_old && parent_rel->pruneable)
 			{
-#ifdef OPTDUP_DEBUG
-				printf("replace with new %p old %p better key %d better sort %d\n", &new_path, &path, better_key, better_sort);
-				printf("new\n");
-				pprint(new_path);
-				printf("old\n");
-				pprint(path);
-#endif
-				*is_new = false;
-				return path;
+				if (p2_prev)
+					lnext(p2_prev) = lnext(p2);
+				else
+					old_paths = lnext(p2);
 			}
+			else
+				p2_prev = p2;
 
-			/* same keys, new is more expensive, stop */
-			if ((better_key == 0 && better_sort == 0 &&
-				 new_path->path_cost >= path->path_cost) ||
+			/*
+			 * If we found an old path that dominates new_path, we can quit
+			 * scanning old_paths; we will not add new_path, and we assume
+			 * new_path cannot dominate any other elements of old_paths.
+			 */
+			if (! accept_new)
+				break;
+		}
 
-			/* old is better, and less expensive, stop */
-				(((better_key == 2 && better_sort != 1) ||
-				  (better_key != 1 && better_sort == 2)) &&
-				 new_path->path_cost >= path->path_cost))
-			{
-#ifdef OPTDUP_DEBUG
-				printf("skip new %p old %p better key %d better sort %d\n", &new_path, &path, better_key, better_sort);
-				printf("new\n");
-				pprint(new_path);
-				printf("old\n");
-				pprint(path);
-#endif
-				*is_new = false;
-				return NULL;
-			}
+		if (accept_new)
+		{
+			/* Accept the path.  Note that it will now be eligible to be
+			 * compared against the additional elements of new_paths...
+			 */
+			new_path->parent = parent_rel; /* not redundant, see prune.c */
+			old_paths = lcons(new_path, old_paths);
 		}
 	}
 
-#ifdef OPTDUP_DEBUG
-	printf("add new %p old %p better key %d better sort %d\n", &new_path, &path, better_key, better_sort);
-	printf("new\n");
-	pprint(new_path);
-#endif
-
-	*is_new = true;
-	return NULL;
+	return old_paths;
 }
 
 
-
 /*****************************************************************************
  *		PATH NODE CREATION ROUTINES
  *****************************************************************************/
@@ -277,19 +191,15 @@ better_path(Path *new_path, List *unique_paths, bool *is_new)
 Path *
 create_seqscan_path(RelOptInfo *rel)
 {
-	int			relid = 0;
-
 	Path	   *pathnode = makeNode(Path);
+	int			relid = 0;
 
 	pathnode->pathtype = T_SeqScan;
 	pathnode->parent = rel;
 	pathnode->path_cost = 0.0;
-	pathnode->pathorder = makeNode(PathOrder);
-	pathnode->pathorder->ordtype = SORTOP_ORDER;
-	pathnode->pathorder->ord.sortop = NULL;
-	pathnode->pathkeys = NIL;
+	pathnode->pathkeys = NIL;	/* seqscan has unordered result */
 
-	if (rel->relids != NULL)
+	if (rel->relids != NIL)		/* can this happen? */
 		relid = lfirsti(rel->relids);
 
 	pathnode->path_cost = cost_seqscan(relid,
@@ -319,12 +229,10 @@ create_index_path(Query *root,
 
 	pathnode->path.pathtype = T_IndexScan;
 	pathnode->path.parent = rel;
-	pathnode->path.pathorder = makeNode(PathOrder);
-	pathnode->path.pathorder->ordtype = SORTOP_ORDER;
-	pathnode->path.pathorder->ord.sortop = index->ordering;
-	pathnode->path.pathkeys = NIL;
+	pathnode->path.pathkeys = build_index_pathkeys(root, rel, index);
 
-	/* Note that we are making a pathnode for a single-scan indexscan;
+	/*
+	 * Note that we are making a pathnode for a single-scan indexscan;
 	 * therefore, both indexid and indexqual should be single-element
 	 * lists.  We initialize indexqual to contain one empty sublist,
 	 * representing a single index traversal with no index restriction
@@ -334,29 +242,7 @@ create_index_path(Query *root,
 	Assert(length(index->relids) == 1);
 	pathnode->indexid = index->relids;
 	pathnode->indexqual = lcons(NIL, NIL);
-
-	pathnode->indexkeys = index->indexkeys;
-
-	/*
-	 * The index must have an ordering for the path to have (ordering)
-	 * keys, and vice versa.
-	 */
-	if (pathnode->path.pathorder->ord.sortop)
-	{
-		pathnode->path.pathkeys = collect_index_pathkeys(index->indexkeys,
-														 rel->targetlist);
-
-		/*
-		 * Check that the keys haven't 'disappeared', since they may no
-		 * longer be in the target list (i.e., index keys that are not
-		 * relevant to the scan are not applied to the scan path node, so
-		 * if no index keys were found, we can't order the path).
-		 */
-		if (pathnode->path.pathkeys == NULL)
-			pathnode->path.pathorder->ord.sortop = NULL;
-	}
-	else
-		pathnode->path.pathkeys = NULL;
+	pathnode->joinrelids = NIL;	/* no join clauses here */
 
 	if (restriction_clauses == NIL)
 	{
@@ -377,7 +263,7 @@ create_index_path(Query *root,
 	{
 		/*
 		 * Compute scan cost for the case when 'index' is used with
-		 * restriction clause(s).
+		 * restriction clause(s).  Also, place indexqual in path node.
 		 */
 		List	   *indexquals;
 		float		npages;
@@ -439,9 +325,9 @@ create_index_path(Query *root,
  *
  * 'joinrel' is the join relation.
  * 'outer_rel' is the outer join relation
- * 'outer_path' is the outer join path.
- * 'inner_path' is the inner join path.
- * 'pathkeys' are the keys of the path
+ * 'outer_path' is the outer path
+ * 'inner_path' is the inner path
+ * 'pathkeys' are the path keys of the new join path
  *
  * Returns the resulting path node.
  *
@@ -461,23 +347,6 @@ create_nestloop_path(RelOptInfo *joinrel,
 	pathnode->innerjoinpath = inner_path;
 	pathnode->pathinfo = joinrel->restrictinfo;
 	pathnode->path.pathkeys = pathkeys;
-	pathnode->path.joinid = NIL;
-	pathnode->path.outerjoincost = (Cost) 0.0;
-	pathnode->path.pathorder = makeNode(PathOrder);
-
-	if (pathkeys)
-	{
-		pathnode->path.pathorder->ordtype = outer_path->pathorder->ordtype;
-		if (outer_path->pathorder->ordtype == SORTOP_ORDER)
-			pathnode->path.pathorder->ord.sortop = outer_path->pathorder->ord.sortop;
-		else
-			pathnode->path.pathorder->ord.merge = outer_path->pathorder->ord.merge;
-	}
-	else
-	{
-		pathnode->path.pathorder->ordtype = SORTOP_ORDER;
-		pathnode->path.pathorder->ord.sortop = NULL;
-	}
 
 	pathnode->path.path_cost = cost_nestloop(outer_path->path_cost,
 											 inner_path->path_cost,
@@ -502,8 +371,7 @@ create_nestloop_path(RelOptInfo *joinrel,
  * 'innerwidth' is the number of bytes per tuple in the inner relation
  * 'outer_path' is the outer path
  * 'inner_path' is the inner path
- * 'pathkeys' are the new keys of the join relation
- * 'order' is the sort order required for the merge
+ * 'pathkeys' are the path keys of the new join path
  * 'mergeclauses' are the applicable join/restriction clauses
  * 'outersortkeys' are the sort varkeys for the outer relation
  * 'innersortkeys' are the sort varkeys for the inner relation
@@ -518,22 +386,29 @@ create_mergejoin_path(RelOptInfo *joinrel,
 					  Path *outer_path,
 					  Path *inner_path,
 					  List *pathkeys,
-					  MergeOrder *order,
 					  List *mergeclauses,
 					  List *outersortkeys,
 					  List *innersortkeys)
 {
 	MergePath  *pathnode = makeNode(MergePath);
 
+	/*
+	 * If the given paths are already well enough ordered, we can skip
+	 * doing an explicit sort.
+	 */
+	if (outersortkeys &&
+		pathkeys_contained_in(outersortkeys, outer_path->pathkeys))
+		outersortkeys = NIL;
+	if (innersortkeys &&
+		pathkeys_contained_in(innersortkeys, inner_path->pathkeys))
+		innersortkeys = NIL;
+
 	pathnode->jpath.path.pathtype = T_MergeJoin;
 	pathnode->jpath.path.parent = joinrel;
 	pathnode->jpath.outerjoinpath = outer_path;
 	pathnode->jpath.innerjoinpath = inner_path;
 	pathnode->jpath.pathinfo = joinrel->restrictinfo;
 	pathnode->jpath.path.pathkeys = pathkeys;
-	pathnode->jpath.path.pathorder = makeNode(PathOrder);
-	pathnode->jpath.path.pathorder->ordtype = MERGE_ORDER;
-	pathnode->jpath.path.pathorder->ord.merge = order;
 	pathnode->path_mergeclauses = mergeclauses;
 	pathnode->outersortkeys = outersortkeys;
 	pathnode->innersortkeys = innersortkeys;
@@ -560,15 +435,11 @@ create_mergejoin_path(RelOptInfo *joinrel,
  * 'innerwidth' is the number of bytes per tuple in the inner relation
  * 'outer_path' is the cheapest outer path
  * 'inner_path' is the cheapest inner path
- * 'pathkeys' are the path keys of the new join path
- * 'operator' is the hashjoin operator
  * 'hashclauses' is a list of the hash join clause (always a 1-element list)
- * 'outerkeys' are the sort varkeys for the outer relation
- * 'innerkeys' are the sort varkeys for the inner relation
  * 'innerdisbursion' is an estimate of the disbursion of the inner hash key
  *
  */
-HashPath   *
+HashPath *
 create_hashjoin_path(RelOptInfo *joinrel,
 					 int outersize,
 					 int innersize,
@@ -576,11 +447,7 @@ create_hashjoin_path(RelOptInfo *joinrel,
 					 int innerwidth,
 					 Path *outer_path,
 					 Path *inner_path,
-					 List *pathkeys,
-					 Oid operator,
 					 List *hashclauses,
-					 List *outerkeys,
-					 List *innerkeys,
 					 Cost innerdisbursion)
 {
 	HashPath   *pathnode = makeNode(HashPath);
@@ -590,16 +457,9 @@ create_hashjoin_path(RelOptInfo *joinrel,
 	pathnode->jpath.outerjoinpath = outer_path;
 	pathnode->jpath.innerjoinpath = inner_path;
 	pathnode->jpath.pathinfo = joinrel->restrictinfo;
-	pathnode->jpath.path.pathkeys = pathkeys;
-	pathnode->jpath.path.pathorder = makeNode(PathOrder);
-	pathnode->jpath.path.pathorder->ordtype = SORTOP_ORDER;
-	pathnode->jpath.path.pathorder->ord.sortop = NULL;
-	pathnode->jpath.path.outerjoincost = (Cost) 0.0;
-	pathnode->jpath.path.joinid = (Relids) NULL;
-	/* pathnode->hashjoinoperator = operator;  */
+	/* A hashjoin never has pathkeys, since its ordering is unpredictable */
+	pathnode->jpath.path.pathkeys = NIL;
 	pathnode->path_hashclauses = hashclauses;
-	pathnode->outerhashkeys = outerkeys;
-	pathnode->innerhashkeys = innerkeys;
 	pathnode->jpath.path.path_cost = cost_hashjoin(outer_path->path_cost,
 												   inner_path->path_cost,
 												   outersize, innersize,