/*     
 *      FILE
 *     	pathnode
 *     
 *      DESCRIPTION
 *     	Routines to manipulate pathlists and create path nodes
 *     
 *      EXPORTS
 *     		path-is-cheaper
 *     		cheaper-path
 *     		set_cheapest
 *     		add_pathlist
 *     		create_seqscan_path
 *     		create_index_path
 *     		create_nestloop_path
 *     		create_mergesort_path
 *     		create_hashjoin_path
 *	$Header: /private/postgres/src/planner/util/RCS/pathnode.c,v 1.25 1992/07/15 00:40:22 joey Exp $
 */
#include <math.h>

#include "planner/internal.h"

#include "nodes/relation.h"
#include "nodes/relation.a.h"
#include "utils/log.h"

#include "planner/pathnode.h"
#include "planner/clauseinfo.h"
#include "planner/cfi.h"
#include "planner/costsize.h"
#include "planner/keys.h"
#include "planner/xfunc.h"

extern int testFlag;

/*    	====================
 *    	MISC. PATH UTILITIES
 *    	====================
 */

/*    
 *    	path-is-cheaper
 *    
 *    	Returns t iff 'path1' is cheaper than 'path2'.
 *    
 */

/*  .. best-innerjoin, better_path, cheaper-path, match-unsorted-outer
 *  .. set_cheapest
 */
bool
path_is_cheaper (path1,path2)
     Path path1,path2 ;
{
    Cost cost1 = get_path_cost (path1);
    Cost cost2 = get_path_cost (path2);

    return((bool)(cost1 < cost2));
}

/*    
 *    	cheaper-path
 *    
 *    	Returns the cheaper of 'path1' and 'path2'.
 *    
 */
Path
cheaper_path (path1,path2)
     Path path1,path2 ;
{
    if ( null(path1) || null (path2) ) {
	elog (WARN,"cheaper-path: bad path");
    } 
    if ( path_is_cheaper (path1,path2) ) {
	return(path1);
    } 
    else {
	return(path2);
    } 
}

/*    
 *    	set_cheapest
 *    
 *    	Finds the minimum cost path from among a relation's paths.  
 *    
 *    	'parent-rel' is the parent relation
 *    	'pathlist' is a list of path nodes corresponding to 'parent-rel'
 *    
 *    	Returns	and sets the relation entry field with the pathnode that 
 *    	is minimum.
 *    
 */

/*  .. prune-rel-path, set_cheapest, sort-relation-paths
 */

Path
set_cheapest (parent_rel,pathlist)
     Rel parent_rel;
     List pathlist ;
{
     List temp_path;
     Path cheapest_so_far;

     Assert(consp(pathlist));
     Assert(IsA(parent_rel,Rel));

     cheapest_so_far = (Path)CAR(pathlist);

     foreach (temp_path,CDR(pathlist)) {
	 Path path = (Path)CAR(temp_path);
	 cheapest_so_far = cheaper_path(path,cheapest_so_far);
     }

     set_cheapestpath (parent_rel,(PathPtr)cheapest_so_far);

     return(cheapest_so_far);
}

/*    
 *    	add_pathlist
 *    
 *    	For each path in the list 'new-paths', add to the list 'unique-paths' 
 *    	only those paths that are unique (i.e., unique ordering and ordering 
 *    	keys).  Should a conflict arise, the more expensive path is thrown out,
 *    	thereby pruning the plan space.
 *    
 *    	'parent-rel' is the relation entry to which these paths correspond.
 *    
 *    	Returns the list of unique pathnodes.
 *    
 */

/*  .. find-all-join-paths, find-rel-paths, prune-joinrel
 */
LispValue
add_pathlist (parent_rel,unique_paths,new_paths)
     Rel parent_rel;
     List unique_paths,new_paths ;
{
     LispValue x;
     Path new_path;
     LispValue old_path;
     foreach (x, new_paths) {
	 new_path = (Path)CAR(x);
	 if (member((LispValue)new_path, unique_paths)) 
	     continue;
	 old_path = better_path (new_path,unique_paths);
	 if (old_path == LispTrue) {
	     /*  Is a brand new path.  */
	     set_parent (new_path,parent_rel);
	     unique_paths = lispCons ((LispValue)new_path,unique_paths);
	
	 }
	 else if (null(old_path))
	   ;  /* do nothing if path is not cheaper */
	 else if (IsA(old_path,Path)) {
	     set_parent (new_path,parent_rel);
	     if (testFlag) {
	         unique_paths = lispCons((LispValue)new_path, unique_paths);
		}
	     else
	         unique_paths = lispCons((LispValue)new_path,
				         LispRemove(old_path,unique_paths));
	 }
     }
     return(unique_paths);
 }

/*    
 *    	better_path
 *    
 *    	Determines whether 'new-path' has the same ordering and keys as some 
 *    	path in the list 'unique-paths'.  If there is a redundant path,
 *    	eliminate the more expensive path.
 *    
 *    	Returns:
 *    	The old path - if 'new-path' matches some path in 'unique-paths' and is
 *    		cheaper
 *    	nil - if 'new-path' matches but isn't cheaper
 *    	t - if there is no path in the list with the same ordering and keys
 *    
 */

/*  .. add_pathlist    */

LispValue
better_path (new_path,unique_paths)
     Path new_path;
     List unique_paths ;
{
     Path old_path = (Path)NULL;
     Path path = (Path)NULL;
     LispValue temp = LispNil;
     LispValue retval = LispNil;

     /* XXX - added the following two lines which weren't int
	the lisp planner, but otherwise, doesn't seem to work
	for the case where new_path is 'nil */
     
     foreach (temp,unique_paths) {
	 path = (Path) CAR(temp);
	 if ((equal_path_path_ordering (get_p_ordering (new_path),
					get_p_ordering(path)) &&
	      samekeys (get_keys (new_path),get_keys (path)))) {
	     old_path = path;
	     break;
	 }
     }
     if ( null(old_path)) {
	 retval = LispTrue;
     } 
     else 
       if (path_is_cheaper (new_path,old_path) || testFlag) {
	   retval = (LispValue)old_path;
       } 
       else
	 retval = LispNil;
     
     return(retval);
}



/*    	===========================
 *    	PATH NODE CREATION ROUTINES
 *    	===========================
 */

/*    
 *    	create_seqscan_path
 *    
 *    	Creates a path corresponding to a sequential scan, returning the
 *    	pathnode.
 *    
 */

/*  .. find-rel-paths
 */
Path
create_seqscan_path (rel)
     Rel rel ;
{
    LispValue relid;

    Path pathnode = RMakePath();

    set_pathtype (pathnode,T_SeqScan); 
    set_parent (pathnode,rel);
    set_path_cost (pathnode,0.0);
    set_p_ordering (pathnode,LispNil);
    set_pathsortkey (pathnode,(SortKey)NULL);
    set_keys (pathnode,LispNil);
    /* copy clauseinfo list into path for expensive function processing 
        -- JMH, 7/7/92 */
    set_locclauseinfo(pathnode,
		      (List)CopyObject(get_clauseinfo(rel)));

    relid = get_relids(rel);
    if (!null(relid))
      relid = CAR(relid);

    set_path_cost (pathnode,cost_seqscan (relid,
					  get_pages (rel),get_tuples (rel)));
    /* add in expensive functions cost!  -- JMH, 7/7/92 */
    set_path_cost(pathnode, 
		  (get_path_cost(pathnode) + xfunc_get_path_cost(pathnode)));
    return(pathnode);
}

/*    
 *    	create_index_path
 *    
 *    	Creates a single path node for an index scan.
 *    
 *    	'rel' is the parent rel
 *    	'index' is the pathnode for the index on 'rel'
 *    	'restriction-clauses' is a list of restriction clause nodes.
 *    	'is-join-scan' is a flag indicating whether or not the index is being
 *    		considered because of its sort order.
 *    
 *    	Returns the new path node.
 *    
 */


/*  .. create-index-paths, find-index-paths
 */

#ifdef __STDC__
IndexPath
create_index_path (
     Rel	rel,
     Rel	index,
     LispValue	restriction_clauses,
     bool	is_join_scan
     )
#else /* #ifdef __STDC__ */
IndexPath
create_index_path (rel,index,restriction_clauses,is_join_scan)
     Rel rel,index;
     LispValue restriction_clauses;
     bool is_join_scan;
#endif /* #ifdef __STDC__ */
{
    IndexPath pathnode = RMakeIndexPath();
    
    set_pathtype ((Path)pathnode,T_IndexScan);
    set_parent ((Path)pathnode,rel);
    set_indexid (pathnode,get_relids (index));
    set_p_ordering ((Path)pathnode,get_ordering (index));
    set_keys ((Path)pathnode,get_indexkeys (index));
    set_pathsortkey((Path)pathnode, (SortKey)NULL);
    set_indexqual(pathnode, LispNil);
    /* copy clauseinfo list into path for expensive function processing 
       -- JMH, 7/7/92 */
    set_locclauseinfo(pathnode,
		      set_difference(CopyObject(get_clauseinfo(rel)),
				     restriction_clauses )); /* 22 dec 1992, garry@maak.msk.su */
/*				     restriction_clauses,
 *				     LispNil)); /* 22 dec 1992, garry@maak.msk.su */

    /*    The index must have an ordering for the
	  path to have (ordering) keys, 
	  and vice versa. */
     
    if ( get_p_ordering ((Path)pathnode)) {
	set_keys ((Path)pathnode,collect_index_pathkeys( get_indexkeys (index),
							 get_targetlist (rel)));
	   /*    Check that the keys haven't 'disappeared', since they may 
		 no longer be in the target list (i.e.,
		 index keys that are not 
		 relevant to the scan are not applied to the scan path node,
		 so if no index keys were found, we can't order the path). */

	   if ( null (get_keys ((Path)pathnode))) {
	       set_p_ordering ((Path)pathnode,LispNil);
	   }
    }
    if(is_join_scan || null (restriction_clauses)) {
	/*    Indices used for joins or sorting result nodes don't
	      restrict the result at all, they simply order it,
	      so compute the scan cost 
	      accordingly -- use a selectivity of 1.0. */
	set_path_cost ( (Path)pathnode,
			cost_index (CInteger(CAR(get_relids(index))),
				    get_pages (index),1.0,
				    get_pages (rel),
				    get_tuples (rel),
				    get_pages (index),
				    get_tuples(index), false));
	/* add in expensive functions cost!  -- JMH, 7/7/92 */
	set_path_cost(pathnode, 
		      (get_path_cost(pathnode) + xfunc_get_path_cost(pathnode)));
    } 
    else  {
	/*    Compute scan cost for the case when 'index' is used with a 
	      restriction clause. */
	LispValue relattvals = get_relattvals (restriction_clauses);
	/* pagesel is '(Cost Cost) */
	List pagesel = index_selectivity (CInteger(CAR(get_relids(index))),
					  get_classlist (index),
					  get_opnos (restriction_clauses),
					  CInteger(getrelid (CInteger
							(CAR(get_relids (rel))),
						    _query_range_table_)),
					  nth (0,relattvals),
					  nth (1,relattvals),
					  nth (2,relattvals),
					  length (restriction_clauses));
	/*   each clause gets an equal selectivity */
	Cost clausesel = 
	  pow (CDouble(CADR (pagesel)),
	       (double)(1/length(restriction_clauses)));
	 
	Count temp1 = (Count)CDouble(CAR(pagesel));
	Cost temp2 = (Cost)CDouble(CADR(pagesel));

	set_indexqual (pathnode,restriction_clauses);
	set_path_cost ( (Path)pathnode,
			cost_index (CInteger(CAR(get_relids(index))),
 				    temp1,
				    temp2,
				    get_pages (rel),
				    get_tuples (rel),get_pages (index),
				    get_tuples (index), false));
	/* add in expensive functions cost!  -- JMH, 7/7/92 */
	set_path_cost(pathnode, 
		      (get_path_cost(pathnode) + xfunc_get_path_cost(pathnode)));

	/*    Set selectivities of clauses used with index to 
	      the selectivity of this index, subdividing the 
	      selectivity equally over each of 
	      the clauses. 
	      */
	/*    XXX Can this divide the selectivities in a better way? */
	
	set_clause_selectivities (restriction_clauses,clausesel);
    }
    return(pathnode);
}

/*    
 *    	create_nestloop_path
 *    
 *    	Creates a pathnode corresponding to a nestloop join between two 
 *    	relations.
 *    
 *    	'joinrel' is the join relation.
 *    	'outer_rel' is the outer join relation
 *    	'outer_path' is the outer join path.
 *    	'inner_path' is the inner join path.
 *    	'keys' are the keys of the path
 *    	
 *    	Returns the resulting path node.
 *    
 */

/*  .. match-unsorted-outer
 */
JoinPath
create_nestloop_path (joinrel,outer_rel,outer_path,inner_path,keys)
     Rel joinrel,outer_rel;
     Path outer_path,inner_path;
     List keys ;
{
     JoinPath pathnode = RMakeJoinPath();
     
     set_pathtype((Path)pathnode,T_NestLoop);
     set_parent ((Path)pathnode,joinrel);
     set_outerjoinpath (pathnode,(pathPtr)outer_path);
     set_innerjoinpath (pathnode,(pathPtr)inner_path);
     set_pathclauseinfo (pathnode,get_clauseinfo (joinrel));
     set_keys ((Path)pathnode,keys);
     set_pathsortkey ((Path)pathnode,(SortKey)NULL);
     set_joinid((Path)pathnode,LispNil);
     set_outerjoincost((Path)pathnode,(Cost)0);
     set_p_ordering((Path)pathnode,LispNil);
     set_locclauseinfo((Path)pathnode,LispNil);

     if /*when */ ( keys) {
	  set_p_ordering ((Path)pathnode,get_p_ordering (outer_path));
     }
     set_path_cost ((Path)pathnode,
		    cost_nestloop (get_path_cost (outer_path),
				   get_path_cost (inner_path),
				   get_size( outer_rel),
				   get_size( get_parent(inner_path)),
				   page_size( get_size(outer_rel),
					      get_width(outer_rel)),
				   IsA(inner_path,IndexPath)));
     /* add in expensive function costs -- JMH 7/7/92 */
     set_path_cost(pathnode, 
		   (get_path_cost(pathnode) + xfunc_get_path_cost(pathnode)));
     return(pathnode);
}

/*    
 *    	create_mergesort_path
 *    
 *    	Creates a pathnode corresponding to a mergesort join between
 *    	two relations
 *    
 *    	'joinrel' is the join relation
 *    	'outersize' is the number of tuples in the outer relation
 *    	'innersize' is the number of tuples in the inner relation
 *    	'outerwidth' is the number of bytes per tuple in the outer relation
 *    	'innerwidth' is the number of bytes per tuple in the inner relation
 *    	'outer_path' is the outer path
 *    	'inner_path' is the inner path
 *    	'keys' are the new keys of the join relation
 *    	'order' is the sort order required for the merge
 *    	'mergeclauses' are the applicable join/restriction clauses
 *    	'outersortkeys' are the sort varkeys for the outer relation
 *    	'innersortkeys' are the sort varkeys for the inner relation
 *    
 */

/*  .. match-unsorted-inner, match-unsorted-outer, sort-inner-and-outer
 */

MergePath
create_mergesort_path (joinrel,outersize,innersize,outerwidth,
		       innerwidth,outer_path,inner_path,keys,order,
		       mergeclauses,outersortkeys,innersortkeys)
     Rel joinrel;
     Count outersize,innersize,outerwidth,innerwidth;
     Path outer_path,inner_path;
     LispValue keys,order,mergeclauses,outersortkeys,innersortkeys ;
{
     MergePath pathnode = RMakeMergePath();

     set_pathtype ((Path)pathnode,T_MergeJoin);
     set_parent ((Path)pathnode,joinrel);
     set_outerjoinpath ((JoinPath)pathnode,(pathPtr)outer_path);
     set_innerjoinpath ((JoinPath)pathnode,(pathPtr)inner_path);
     set_pathclauseinfo ((JoinPath)pathnode,get_clauseinfo (joinrel));
     set_keys ((Path)pathnode,keys);
     set_p_ordering ((Path)pathnode,order);
     set_path_mergeclauses (pathnode,mergeclauses);
     set_locclauseinfo((Path)pathnode,LispNil);
     set_outersortkeys (pathnode,outersortkeys);
     set_innersortkeys (pathnode,innersortkeys);
     set_path_cost ((Path)pathnode, cost_mergesort( get_path_cost (outer_path),
						    get_path_cost (inner_path),
						    outersortkeys,
						    innersortkeys,
						    outersize,
						    innersize,
						    outerwidth,
						    innerwidth));
     /* add in expensive function costs -- JMH 7/7/92 */
     set_path_cost(pathnode, 
		   (get_path_cost(pathnode) + xfunc_get_path_cost(pathnode)));
     return(pathnode);
}

/*    
 *    	create_hashjoin_path
 *    
 *    	XXX HASH
 *    
 *    	Creates a pathnode corresponding to a hash join between two relations.
 *    
 *    	'joinrel' is the join relation
 *    	'outersize' is the number of tuples in the outer relation
 *    	'innersize' is the number of tuples in the inner relation
 *    	'outerwidth' is the number of bytes per tuple in the outer relation
 *    	'innerwidth' is the number of bytes per tuple in the inner relation
 *    	'outer_path' is the outer path
 *    	'inner_path' is the inner path
 *    	'keys' are the new keys of the join relation
 *    	'operator' is the hashjoin operator
 *    	'hashclauses' are the applicable join/restriction clauses
 *    	'outerkeys' are the sort varkeys for the outer relation
 *    	'innerkeys' are the sort varkeys for the inner relation
 *    
 */

/*  .. hash-inner-and-outer
 */

HashPath
create_hashjoin_path (joinrel,outersize,innersize,outerwidth,
		      innerwidth,outer_path,inner_path,keys,operator,
		      hashclauses,outerkeys,innerkeys)
     Rel joinrel;
     Count outersize,innersize,outerwidth,innerwidth;
     Path outer_path,inner_path;
     LispValue keys,hashclauses,outerkeys,innerkeys ;
     ObjectId operator;
{
    HashPath pathnode = RMakeHashPath();

    set_pathtype ((Path)pathnode,T_HashJoin); 
    set_parent ((Path)pathnode,joinrel);
    set_outerjoinpath ((JoinPath)pathnode,(pathPtr)outer_path);
    set_innerjoinpath ((JoinPath)pathnode,(pathPtr)inner_path);
    set_pathclauseinfo ((JoinPath)pathnode,get_clauseinfo (joinrel));
    set_locclauseinfo((Path)pathnode,LispNil);
    set_keys ((Path)pathnode,keys);
    set_pathsortkey ((Path)pathnode,(SortKey)NULL);
    set_p_ordering((Path)pathnode,LispNil);
    set_outerjoincost((Path)pathnode,(Cost)0);
    set_joinid((Path)pathnode, (Relid)NULL);
/*    set_hashjoinoperator (pathnode,operator);  */ 
    set_path_hashclauses (pathnode,hashclauses);
    set_outerhashkeys (pathnode,outerkeys);
    set_innerhashkeys (pathnode,innerkeys);
    set_path_cost ((Path)pathnode,cost_hashjoin( get_path_cost (outer_path),
						 get_path_cost (inner_path),
						 outerkeys,
						 innerkeys,
						 outersize,innersize,
						 outerwidth,innerwidth));
    /* add in expensive function costs -- JMH 7/7/92 */
    set_path_cost(pathnode, 
		  (get_path_cost(pathnode) + xfunc_get_path_cost(pathnode)));
    return(pathnode);
}

