/*
 * (C) Copyright Transarc Corporation 1990
 * Licensed Materials - Property of Transarc
 * All Rights Reserved.
 */

/*------------------------------------------------------------------------
 * xstat_cm.c
 *
 * Description:
 *	Implementation of the client side of the AFS Cache Manager
 *	extended statistics facility.
 *
 *------------------------------------------------------------------------*/

#include <afs/param.h>
#include "xstat_cm.h"			/*Interface for this module*/
#include <lwp.h>			/*Lightweight process package*/

#define LWP_STACK_SIZE	(16 * 1024)

/*
 * Routines we need that don't have explicit include file definitions.
 */
extern char *hostutil_GetNameByINet();	/*Host parsing utility*/

/*
 * Exported variables.
 */
int xstat_cm_numServers;			/*Num connected servers*/
struct xstat_cm_ConnectionInfo
    *xstat_cm_ConnInfo;				/*Ptr to connection array*/
int numCollections;				/*Number of data collections*/
struct xstat_cm_ProbeResults xstat_cm_Results;	/*Latest probe results*/
char terminationEvent;				/*One-shot termination event*/

afs_int32 xstat_cmData[AFSCB_MAX_XSTAT_LONGS];		/*Buffer for collected data*/

/*
 * Private globals.
 */
static int xstat_cm_ProbeFreqInSecs;		/*Probe freq. in seconds*/
static int xstat_cm_initflag = 0;		/*Was init routine called?*/
static int xstat_cm_debug = 0;			/*Debugging output enabled?*/
static int xstat_cm_oneShot = 0;		/*One-shot operation?*/
static int (*xstat_cm_Handler)();		/*Probe handler routine*/
static PROCESS probeLWP_ID;			/*Probe LWP process ID*/
static int xstat_cm_numCollections;		/*Number of desired collections*/
static afs_int32 *xstat_cm_collIDP;			/*Ptr to collection IDs desired*/


/*------------------------------------------------------------------------
 * [private] xstat_cm_CleanupInit
 *
 * Description:
 *	Set up for recovery after an error in initialization (i.e.,
 *	during a call to xstat_cm_Init.
 *
 * Arguments:
 *	None.
 *
 * Returns:
 *	0 on success,
 *	Error value otherwise.
 *
 * Environment:
 *	This routine is private to the module.
 *
 * Side Effects:
 *	Zeros out basic data structures.
 *------------------------------------------------------------------------*/

static int xstat_cm_CleanupInit()

{ /*xstat_cm_CleanupInit*/

    xstat_cm_ConnInfo = (struct xstat_cm_ConnectionInfo *)0;
    xstat_cm_Results.probeNum = 0;
    xstat_cm_Results.probeTime = 0;
    xstat_cm_Results.connP = (struct xstat_cm_ConnectionInfo *)0;
    xstat_cm_Results.collectionNumber = 0;
    xstat_cm_Results.data.AFSCB_CollData_len = AFSCB_MAX_XSTAT_LONGS;
    xstat_cm_Results.data.AFSCB_CollData_val = (afs_int32 *)xstat_cmData;
    xstat_cm_Results.probeOK = 0;

    return(0);

} /*xstat_cm_CleanupInit*/


/*------------------------------------------------------------------------
 * [exported] xstat_cm_Cleanup
 *
 * Description:
 *	Clean up our memory and connection state.
 *
 * Arguments:
 *	int a_releaseMem : Should we free up malloc'ed areas?
 *
 * Returns:
 *	0 on total success,
 *	-1 if the module was never initialized, or there was a problem
 *		with the xstat_cm connection array.
 *
 * Environment:
 *	xstat_cm_numServers should be properly set.  We don't do anything
 *	unless xstat_cm_Init() has already been called.
 *
 * Side Effects:
 *	Shuts down Rx connections gracefully, frees allocated space
 *	(if so directed).
 *------------------------------------------------------------------------*/

int xstat_cm_Cleanup(a_releaseMem)
    int a_releaseMem;

{ /*xstat_cm_Cleanup*/

    static char rn[] = "xstat_cm_Cleanup";	/*Routine name*/
    int code;					/*Return code*/
    int conn_idx;				/*Current connection index*/
    struct xstat_cm_ConnectionInfo *curr_conn;	/*Ptr to xstat_cm connection*/

    /*
     * Assume the best, but check the worst.
     */
    if (!xstat_cm_initflag) {
	fprintf(stderr, "[%s] Refused; module not initialized\n", rn);
	return(-1);
    }
    else
	code = 0;

    /*
     * Take care of all Rx connections first.  Check to see that the
     * server count is a legal value.
     */
    if (xstat_cm_numServers <= 0) {
	fprintf(stderr,
		"[%s] Illegal number of servers (xstat_cm_numServers = %d)\n",
		rn, xstat_cm_numServers);
	code = -1;
    }
    else {
	if (xstat_cm_ConnInfo != (struct xstat_cm_ConnectionInfo *)0) {
	    /*
	     * The xstat_cm connection structure array exists.  Go through
	     * it and close up any Rx connections it holds.
	     */
	    curr_conn = xstat_cm_ConnInfo;
	    for (conn_idx = 0; conn_idx < xstat_cm_numServers; conn_idx++) {
		if (curr_conn->rxconn != (struct rx_connection *)0) {
		    rx_DestroyConnection(curr_conn->rxconn);
		    curr_conn->rxconn = (struct rx_connection *)0;
		}
		curr_conn++;
	    } /*for each xstat_cm connection*/
	} /*xstat_cm connection structure exists*/
    } /*Legal number of servers*/

    /*
     * If asked to, release the space we've allocated.
     */
    if (a_releaseMem) {
	if (xstat_cm_ConnInfo != (struct xstat_cm_ConnectionInfo *)0)
	    free(xstat_cm_ConnInfo);
    }

    /*
     * Return the news, whatever it is.
     */
    return(code);

} /*xstat_cm_Cleanup*/


/*------------------------------------------------------------------------
 * [private] xstat_cm_LWP
 *
 * Description:
 *	This LWP iterates over the server connections and gathers up
 *	the desired statistics from each one on a regular basis, for
 *	all known data collections.  The associated handler function
 *	is called each time a new data collection is received.
 *
 * Arguments:
 *	None.
 *
 * Returns:
 *	Nothing.
 *
 * Environment:
 *	Started by xstat_cm_Init(), uses global structures and the
 *	global private xstat_cm_oneShot variable.
 *
 * Side Effects:
 *	As advertised.
 *------------------------------------------------------------------------*/

static void xstat_cm_LWP()

{ /*xstat_cm_LWP*/

    static char rn[] = "xstat_cm_LWP";		/*Routine name*/
    register afs_int32 code;				/*Results of calls*/
    int oneShotCode;				/*Result of one-shot signal*/
    struct timeval tv;				/*Time structure*/
    int conn_idx;				/*Connection index*/
    struct xstat_cm_ConnectionInfo *curr_conn;	/*Current connection*/
    afs_int32 srvVersionNumber;			/*Xstat version #*/
    afs_int32 clientVersionNumber;			/*Client xstat version*/
    afs_int32 numColls;				/*Number of collections to get*/
    afs_int32 *currCollIDP;				/*Curr collection ID desired*/

    /*
     * Set up some numbers we'll need.
     */
    clientVersionNumber = AFSCB_XSTAT_VERSION;

    while (1) { /*Service loop*/
	/*
	 * Iterate through the server connections, gathering data.
	 * Don't forget to bump the probe count and zero the statistics
	 * areas before calling the servers.
	 */
	if (xstat_cm_debug)
	    printf("[%s] Waking up, getting data from %d server(s)\n",
		   rn, xstat_cm_numServers);
	curr_conn = xstat_cm_ConnInfo;
	xstat_cm_Results.probeNum++;

	for (conn_idx = 0; conn_idx < xstat_cm_numServers; conn_idx++) {
	    /*
	     * Grab the statistics for the current Cache Manager, if the
	     * connection is valid.
	     */
	    if (xstat_cm_debug)
		printf("[%s] Getting collections from Cache Manager '%s'\n",
		       rn, curr_conn->hostName);
	    if (curr_conn->rxconn != (struct rx_connection *)0) {
		if (xstat_cm_debug)
		    printf("[%s] Connection OK, calling RXAFSCB_GetXStats\n",
			   rn);

		/*
		 * Probe the given CM for each desired collection.
		 */
		currCollIDP = xstat_cm_collIDP;
		for (numColls = 0;
		     numColls < xstat_cm_numCollections;
		     numColls++, currCollIDP++) {
		    /*
		     * Initialize the per-probe values.
		     */
		    if (xstat_cm_debug)
			printf("[%s] Asking for data collection %d\n",
			       rn, *currCollIDP);
		    xstat_cm_Results.collectionNumber = *currCollIDP;
		    xstat_cm_Results.data.AFSCB_CollData_len =
			AFSCB_MAX_XSTAT_LONGS;
		    bzero(xstat_cm_Results.data.AFSCB_CollData_val,
			  AFSCB_MAX_XSTAT_LONGS * 4);

		    xstat_cm_Results.connP = curr_conn;

		    if (xstat_cm_debug) {
			printf("%s: Calling RXAFSCB_GetXStats, conn=0x%x, clientVersionNumber=%d, collectionNumber=%d, srvVersionNumberP=0x%x, timeP=0x%x, dataP=0x%x\n",
			       rn, curr_conn->rxconn,
			       clientVersionNumber,
			       *currCollIDP,
			       &srvVersionNumber,
			       &(xstat_cm_Results.probeTime),
			       &(xstat_cm_Results.data));
			printf("%s: [bufflen=%d, buffer at 0x%x]\n",
			       rn,
			       xstat_cm_Results.data.AFSCB_CollData_len,
			       xstat_cm_Results.data.AFSCB_CollData_val);
		    }

		    xstat_cm_Results.probeOK =
			RXAFSCB_GetXStats(curr_conn->rxconn,
					  clientVersionNumber,
					  *currCollIDP,
					  &srvVersionNumber,
					  &(xstat_cm_Results.probeTime),
					  &(xstat_cm_Results.data));
		    
		    /*
		     * Now that we (may) have the data for this connection,
		     * call the associated handler function.  The handler
		     * does not take any explicit parameters, but rather
		     * gets to the goodies via some of the objects exported
		     * by this module.
		     */
		    if (xstat_cm_debug)
			printf("[%s] Calling handler routine.\n",
			       rn);
		    code = xstat_cm_Handler();
		    if (code)
			fprintf(stderr,
				"[%s] Handler routine got error code %d\n",
				rn, code);
		} /*For each collection*/
	    } /*Valid Rx connection*/
	    
	    /*
	     * Advance the xstat_cm connection pointer.
	     */
	    curr_conn++;

	} /*For each xstat_cm connection*/

	/*
	 * All (valid) connections have been probed.  Fall asleep for the
	 * prescribed number of seconds, unless we're a one-shot.  In
	 * that case, we need to signal our caller that we're done.
	 */
	if (xstat_cm_debug)
	    printf("[%s] Polling complete for probe round %d.\n",
		   rn, xstat_cm_Results.probeNum);

	if (xstat_cm_oneShot) {
	    /*
	     * One-shot execution desired.  Signal our main procedure
	     * that we've finished our collection round.
	     */
	    if (xstat_cm_debug)
		printf("[%s] Signalling main process at 0x%x\n",
		       rn, &terminationEvent);
	    oneShotCode = LWP_SignalProcess(&terminationEvent);
	    if (oneShotCode)
		fprintf(stderr,
			"[%s] Error %d from LWP_SignalProcess()",
			rn, oneShotCode);
	    break; /*from the perpetual while loop*/
	} /*One-shot execution*/
	else {
	    /*
	     * Continuous execution desired.  Sleep for the required
	     * number of seconds.
	     */
	    tv.tv_sec  = xstat_cm_ProbeFreqInSecs;
	    tv.tv_usec = 0;
	    if (xstat_cm_debug)
		printf("[%s] Falling asleep for %d seconds\n",
		       rn, xstat_cm_ProbeFreqInSecs);
	    code = IOMGR_Select(0,	/*Num fids*/
				0,	/*Descs ready for reading*/
				0,	/*Descs ready for writing*/
				0,	/*Descs w/exceptional conditions*/
				&tv);	/*Ptr to timeout structure*/
	    if (code)
		fprintf(stderr,
			"[%s] IOMGR_Select returned code %d\n",
			rn, code);
	} /*Continuous execution*/
    } /*Service loop*/

} /*xstat_cm_LWP*/


/*------------------------------------------------------------------------
 * [exported] xstat_cm_Init
 *
 * Description:
 *	Initialize the xstat_cm module: set up Rx connections to the
 *	given set of Cache Managers, start up the probe LWP, and
 *	associate the routine to be called when a probe completes.
 *	Also, let it know which collections you're interested in.
 *
 * Arguments:
 *	int a_numServers		  : Num. servers to connect to.
 *	struct sockaddr_in *a_socketArray : Array of server sockets.
 *	int a_ProbeFreqInSecs		  : Probe frequency in seconds.
 *	int (*a_ProbeHandler)()		  : Ptr to probe handler fcn.
 *	int a_flags;			  : Various flags.
 *	int a_numCollections		  : Number of collections desired.
 *	afs_int32 *a_collIDP			  : Ptr to collection IDs.
 *
 * Returns:
 *	0 on success,
 *	-2 for (at least one) connection error,
 *	LWP process creation code, if it failed,
 *	-1 for other fatal errors.
 *
 * Environment:
 *	*** MUST BE THE FIRST ROUTINE CALLED FROM THIS PACKAGE ***
 *
 * Side Effects:
 *	Sets up just about everything.
 *------------------------------------------------------------------------*/

int xstat_cm_Init(a_numServers, a_socketArray, a_ProbeFreqInSecs,
		  a_ProbeHandler, a_flags, a_numCollections, a_collIDP)
    int a_numServers;
    struct sockaddr_in *a_socketArray;
    int a_ProbeFreqInSecs;
    int (*a_ProbeHandler)();
    int a_flags;
    int a_numCollections;
    afs_int32 *a_collIDP;

{ /*xstat_cm_Init*/

    static char rn[] = "xstat_cm_Init";		/*Routine name*/
    register afs_int32 code;				/*Return value*/
    struct rx_securityClass *secobj;		/*Client security object*/
    int arg_errfound;				/*Argument error found?*/
    int curr_srv;				/*Current server idx*/
    struct xstat_cm_ConnectionInfo *curr_conn;	/*Ptr to current conn*/
    char *hostNameFound;			/*Ptr to returned host name*/
    int conn_err;				/*Connection error?*/
    int collIDBytes;				/*Num bytes in coll ID array*/

    /*
     * If we've already been called, snicker at the bozo, gently
     * remind him of his doubtful heritage, and return success.
     */
    if (xstat_cm_initflag) {
	fprintf(stderr, "[%s] Called multiple times!\n", rn);
	return(0);
    }
    else
	xstat_cm_initflag = 1; 

    /*
     * Check the parameters for bogosities.
     */
    arg_errfound = 0;
    if (a_numServers <= 0) {
	fprintf(stderr, "[%s] Illegal number of servers: %d\n",
		rn, a_numServers);
	arg_errfound = 1;
    }
    if (a_socketArray == (struct sockaddr_in *)0) {
	fprintf(stderr, "[%s] Null server socket array argument\n", rn);
	arg_errfound = 1;
    }
    if (a_ProbeFreqInSecs <= 0) {
	fprintf(stderr, "[%s] Illegal probe frequency: %d\n",
		rn, a_ProbeFreqInSecs);
	arg_errfound = 1;
    }
    if (a_ProbeHandler == (int (*)())0) {
	fprintf(stderr, "[%s] Null probe handler function argument\n",
		rn);
	arg_errfound = 1;
    }
    if (a_numCollections <= 0) {
	fprintf(stderr, "[%s] Illegal collection count argument: %d\n",
		rn, a_numServers);
	arg_errfound = 1;
    }
    if (a_collIDP == (afs_int32 *)0) {
	fprintf(stderr, "[%s] Null collection ID array argument\n", rn);
	arg_errfound = 1;
    }
    if (arg_errfound)
	return(-1);

    /*
     * Record our passed-in info.
     */
    xstat_cm_debug	     = (a_flags & XSTAT_CM_INITFLAG_DEBUGGING);
    xstat_cm_oneShot	     = (a_flags & XSTAT_CM_INITFLAG_ONE_SHOT);
    xstat_cm_numServers      = a_numServers;
    xstat_cm_Handler	     = a_ProbeHandler;
    xstat_cm_ProbeFreqInSecs = a_ProbeFreqInSecs;
    xstat_cm_numCollections  = a_numCollections;
    collIDBytes = xstat_cm_numCollections * sizeof(afs_int32);
    xstat_cm_collIDP	     = (afs_int32 *)(malloc(collIDBytes));
    bcopy(a_collIDP, xstat_cm_collIDP, collIDBytes);
    if (xstat_cm_debug) {
	printf("[%s] Asking for %d collection(s): ", rn, xstat_cm_numCollections);
	for (curr_srv = 0; curr_srv < xstat_cm_numCollections; curr_srv++)
	    printf("%d ", *(xstat_cm_collIDP+curr_srv));
	printf("\n");
    }

    /*
     * Get ready in case we have to do a cleanup - basically, zero
     * everything out.
     */
    code = xstat_cm_CleanupInit();
    if (code)
	return(code);

    /*
     * Allocate the necessary data structures and initialize everything
     * else.
     */
    xstat_cm_ConnInfo =
	(struct xstat_cm_ConnectionInfo *)
	    malloc(a_numServers * sizeof(struct xstat_cm_ConnectionInfo));
    if (xstat_cm_ConnInfo == (struct xstat_cm_ConnectionInfo *)0) {
	fprintf(stderr,
		"[%s] Can't allocate %d connection info structs (%d bytes)\n",
		rn, a_numServers,
		(a_numServers * sizeof(struct xstat_cm_ConnectionInfo)));
	return(-1);	/*No cleanup needs to be done yet*/
    }

    /*
     * Initialize the Rx subsystem, just in case nobody's done it.
     */
    if (xstat_cm_debug)
	printf("[%s] Initializing Rx on port 0\n", rn);
    code = rx_Init(htons(0));
    if (code) {
	fprintf(stderr, "[%s] Fatal error in rx_Init(), error=%d\n",
		rn, code);
	return(-1);
    }

    if (xstat_cm_debug)
	printf("[%s] Rx initialized on port 0\n", rn);

    /*
     * Create a null Rx client security object, to be used by the
     * probe LWP.
     */
    secobj = (struct rx_securityClass *) rxnull_NewClientSecurityObject();
    if (secobj == (struct rx_securityClass *)0) {
	fprintf(stderr,
		"[%s] Can't create probe LWP client security object.\n",
		rn);
	xstat_cm_Cleanup(1); /*Delete already-malloc'ed areas*/
	return(-1);
    }
    if (xstat_cm_debug)
	printf("[%s] Probe LWP client security object created\n",
	       rn);

    curr_conn = xstat_cm_ConnInfo;
    conn_err = 0;
    for (curr_srv = 0; curr_srv < a_numServers; curr_srv++) {
	/*
	 * Copy in the socket info for the current server, resolve its
	 * printable name if possible.
	 */
	if (xstat_cm_debug) {
	    printf("[%s] Copying in the following socket info:\n",
		   rn);
	    printf("[%s] IP addr 0x%lx, port %d\n", rn,
		   (a_socketArray + curr_srv)->sin_addr.s_addr,
		   (a_socketArray + curr_srv)->sin_port);
	}
	bcopy(a_socketArray + curr_srv,
	      &(curr_conn->skt),
	      sizeof(struct sockaddr_in));
	
	hostNameFound =
	    hostutil_GetNameByINet(curr_conn->skt.sin_addr.s_addr);
	if (hostNameFound == (char *)0) {
	    fprintf(stderr,
		    "[%s] Can't map Internet address %lu to a string name\n",
		    rn, curr_conn->skt.sin_addr.s_addr);
	    curr_conn->hostName[0] = '\0';
	}
	else {
	    strcpy(curr_conn->hostName, hostNameFound);
	    if (xstat_cm_debug)
		printf("[%s] Host name for server index %d is %s\n",
		       rn, curr_srv, curr_conn->hostName);
	}
	
	/*
	 * Make an Rx connection to the current server.
	 */
	if (xstat_cm_debug)
	    printf("[%s] Connecting to srv idx %d, IP addr 0x%lx, port %d, service 1\n",
		   rn, curr_srv, curr_conn->skt.sin_addr.s_addr,
		   curr_conn->skt.sin_port);
	curr_conn->rxconn =
	    rx_NewConnection(curr_conn->skt.sin_addr.s_addr, /*Server addr*/
			     curr_conn->skt.sin_port,	     /*Server port*/
			     1,				     /*AFS service #*/
			     secobj,			     /*Security obj*/
			     0);			     /*# of above*/
	if (curr_conn->rxconn == (struct rx_connection *)0) {
	    fprintf(stderr,
		    "[%s] Can't create Rx connection to server '%s' (%lu)\n",
		    rn, curr_conn->hostName, curr_conn->skt.sin_addr.s_addr);
	    conn_err = 1;
	}
	if (xstat_cm_debug)
	    printf("[%s] New connection at 0x%lx\n",
		   rn, curr_conn->rxconn);

	/*
	 * Bump the current xstat_cm connection to set up.
	 */
	curr_conn++;

    } /*for curr_srv*/

    /*
     * Start up the probe LWP.
     */
    if (xstat_cm_debug)
	printf("[%s] Creating the probe LWP\n", rn);
    code =
	LWP_CreateProcess(xstat_cm_LWP,		/*Function to start up*/
			  LWP_STACK_SIZE,	/*Stack size in bytes*/
			  1,			/*Priority*/
			  0,			/*Parameters*/
			  "xstat_cm Worker",	/*Name to use*/
			  &probeLWP_ID);	/*Returned LWP process ID*/
    if (code) {
	fprintf(stderr,
		"[%s] Can't create xstat_cm LWP!  Error is %d\n",
		rn, code);
	xstat_cm_Cleanup(1); /*Delete already-malloc'ed areas*/
	return(code);
    }
    if (xstat_cm_debug)
	printf("[%s] Probe LWP process structure located at 0x%x\n",
	       rn, probeLWP_ID);

    /*
     * Return the final results.
     */
    if (conn_err)
	return(-2);
    else
	return(0);

} /*xstat_cm_Init*/


/*------------------------------------------------------------------------
 * [exported] xstat_cm_ForceProbeNow
 *
 * Description:
 *	Wake up the probe LWP, forcing it to execute a probe immediately.
 *
 * Arguments:
 *	None.
 *
 * Returns:
 *	0 on success,
 *	Error value otherwise.
 *
 * Environment:
 *	The module must have been initialized.
 *
 * Side Effects:
 *	As advertised.
 *------------------------------------------------------------------------*/

int xstat_cm_ForceProbeNow()

{ /*xstat_cm_ForceProbeNow*/

    static char rn[] = "xstat_cm_ForceProbeNow";	/*Routine name*/

    /*
     * There isn't a prayer unless we've been initialized.
     */
    if (!xstat_cm_initflag) {
	fprintf(stderr, "[%s] Must call xstat_cm_Init first!\n", rn);
	return(-1);
    }

    /*
     * Kick the sucker in the side.
     */
    IOMGR_Cancel(probeLWP_ID);

    /*
     * We did it, so report the happy news.
     */
    return(0);

} /*xstat_cm_ForceProbeNow*/
