// @(#)root/proof:$Name: $:$Id: TCondor.cxx,v 1.2 2003/07/05 18:18:46 brun Exp $
// Author: Maarten Ballintijn 06/12/03
/*************************************************************************
* Copyright (C) 1995-2001, Rene Brun and Fons Rademakers. *
* All rights reserved. *
* *
* For the licensing terms see $ROOTSYS/LICENSE. *
* For the list of contributors see $ROOTSYS/README/CREDITS. *
*************************************************************************/
//////////////////////////////////////////////////////////////////////////
// //
// TCondor //
// //
// Interface to the Condor system. TCondor provides a (partial) API for //
// querying and controlling the Condor system, including experimental //
// extensions like COD (computing on demand) //
// //
//////////////////////////////////////////////////////////////////////////
#include "TCondor.h"
#include "TList.h"
#include "TSystem.h"
#include "TObjString.h"
#include "TRegexp.h"
ClassImp(TCondorSlave)
ClassImp(TCondor)
//______________________________________________________________________________
TCondor::TCondor(const char *pool) : fPool(pool), fState(kFree)
{
// Create Condor interface object. Uses Condor apps since there is no
// API yet.
fClaims = new TList;
// hack our path :-/
TString path = gSystem->Getenv("PATH");
path = "/opt/vdt/bin:" + path;
gSystem->Setenv("PATH",path);
gSystem->Setenv("CONDOR_CONFIG","/opt/vdt/etc/condor_config");
}
//______________________________________________________________________________
TCondor::~TCondor()
{
// Cleanup Condor interface.
Info("~TCondor","fState %d", fState );
if (fState != kFree) {
Release();
}
delete fClaims;
}
//______________________________________________________________________________
void TCondor::Print(Option_t *) const
{
}
//______________________________________________________________________________
TCondorSlave *TCondor::ClaimVM(const char *vm, const char *cmd, Int_t &port)
{
// Claim a VirtualMachine for PROOF usage.
TString claimCmd = Form("condor_cod request -name %s -timeout 10", vm );
Info("ClaimVM","command: %s", claimCmd.Data());
FILE *pipe = gSystem->OpenPipe(claimCmd, "r");
if (!pipe) {
SysError("ClaimVM","cannot run command: %s", claimCmd.Data());
return 0;
}
char buf[1024];
TString claimId;
while (!feof(pipe) && !ferror(pipe)) {
TString line;
do {
if (fgets(buf, sizeof(buf), pipe) == 0) break;
line += buf;
} while (!ferror(pipe) && !feof(pipe) && strchr(buf,'n') == 0);
if (line.EndsWith("n")) line.Chop();
// Info("ClaimVM","Claim: line = %s", line.Data());
if (line.BeginsWith("ClaimId = "")) {
line.Remove(0, line.Index(""")+1);
line.Chop(); // remove trailing "
claimId = line;
Info("ClaimVM","claim = '%s'", claimId.Data());
// for the moment hard coded by caller
// TRegexp r("[0-9]*$");
// TString num = line(r);
// port = 37000 + atoi(num.Data());
}
}
Int_t r = gSystem->ClosePipe(pipe);
Info("ClaimVM","command: %s returned %d", claimCmd.Data(), r);
TString host = claimId(TRegexp("<.*>"));
TString activateCmd = Form("condor_cod activate -addr '%s' -id '%s' -keyword COD_PROOF_%d",
host.Data(), claimId.Data(), port );
pipe = gSystem->OpenPipe(activateCmd, "r");
if (!pipe) {
SysError("ClaimVM","cannot run command: %s", activateCmd.Data());
return 0;
}
while (!feof(pipe) && !ferror(pipe)) {
TString line;
do {
if (fgets(buf, sizeof(buf), pipe) == 0) break;
line += buf;
} while (!ferror(pipe) && !feof(pipe) && strchr(buf,'n') == 0);
if (line.EndsWith("n")) line.Chop();
Info("ClaimVM","Activate: line = %s", line.Data());
}
r = gSystem->ClosePipe(pipe);
Info("ClaimVM","command: %s returned %d", activateCmd.Data(), r);
// TODO: get info at the start for all nodes ...
TCondorSlave *claim = new TCondorSlave;
claim->fClaimID = claimId;
TString node(vm);
node = node.Remove(0, node.Index("@")+1);
claim->fHostname = node;
claim->fPort = port;
GetVmInfo(vm, claim->fImage, claim->fPerfIdx);
return claim;
}
//______________________________________________________________________________
TList *TCondor::GetVirtualMachines() const
{
// Get the names of the virtual machines in the pool.
// Return a TList of TObjString or 0 in case of failure
TString poolopt = fPool ? "" : Form("-pool %s", fPool.Data());
TString cmd = Form("condor_status %s -format "%%s\n" Name", poolopt.Data());
Info("GetVirtualMachines","command: %s", cmd.Data());
FILE *pipe = gSystem->OpenPipe(cmd, "r");
if (!pipe) {
SysError("GetVirtualMachines","cannot run command: %s", cmd.Data());
return 0;
}
char buf[1024];
TList *l = new TList;
while (!feof(pipe) && !ferror(pipe)) {
TString line;
do {
if (fgets(buf, sizeof(buf), pipe) == 0) break;
line += buf;
} while (!ferror(pipe) && !feof(pipe) && strchr(buf,'n') == 0);
if (line.EndsWith("n")) line.Chop();
if (line != "") l->Add(new TObjString(line));
}
Int_t r = gSystem->ClosePipe(pipe);
Info("GetVirtualMachines","command: %s returned %d", cmd.Data(), r);
return l;
}
//______________________________________________________________________________
TList *TCondor::Claim(Int_t n, const char *cmd)
{
if (fState != kFree) {
Error("Claim","not in state Free");
return 0;
}
TList *vms = GetVirtualMachines();
TIter next(vms);
TObjString *vm;
for(Int_t i=0; i < n && (vm = (TObjString*) next()) != 0; i++ ) {
Int_t port = 17000+i; // hard code port for the moment
TCondorSlave *claim = ClaimVM(vm->GetName(), cmd, port);
if (claim != 0) {
fClaims->Add(claim);
}
}
fState = kActive;
return fClaims;
}
//______________________________________________________________________________
Bool_t TCondor::SetState(EState state)
{
TIter next(fClaims);
TCondorSlave *claim;
while((claim = (TCondorSlave*) next()) != 0) {
TString host = claim->fClaimID(TRegexp("<.*>"));
TString cmd = Form("condor_cod %s -addr '%s' -id '%s'",
state == kSuspended ? "suspend" : "resume",
host.Data(), claim->fClaimID.Data());
FILE *pipe = gSystem->OpenPipe(cmd, "r");
if (!pipe) {
SysError("SetState","cannot run command: %s", cmd.Data());
return kFALSE;
}
char buf[1024];
while (!feof(pipe) && !ferror(pipe)) {
TString line;
do {
if (fgets(buf, sizeof(buf), pipe) == 0) break;
line += buf;
} while (!ferror(pipe) && !feof(pipe) && strchr(buf,'n') == 0);
if (line.EndsWith("n")) line.Chop();
Info("SetState","line = %s", line.Data());
}
Int_t r = gSystem->ClosePipe(pipe);
Info("SetState","command: %s returned %d", cmd.Data(), r);
}
fState = state;
return kTRUE;
}
//______________________________________________________________________________
Bool_t TCondor::Suspend()
{
if (fState != kActive) {
Error("Suspend","not in state Active");
return kFALSE;
}
return SetState(kSuspended);
}
//______________________________________________________________________________
Bool_t TCondor::Resume()
{
if (fState != kSuspended) {
Error("Suspend","not in state Suspended");
return kFALSE;
}
return SetState(kActive);
}
//______________________________________________________________________________
Bool_t TCondor::Release()
{
if (fState == kFree) {
Error("Suspend","not in state Active or Suspended");
return kFALSE;
}
TCondorSlave *claim;
while((claim = (TCondorSlave*) fClaims->First()) != 0) {
TString host = claim->fClaimID(TRegexp("<.*>"));
TString cmd = Form("condor_cod release -addr '%s' -id '%s'", host.Data(), claim->fClaimID.Data());
FILE *pipe = gSystem->OpenPipe(cmd, "r");
if (!pipe) {
SysError("Release","cannot run command: %s", cmd.Data());
return kFALSE;
}
char buf[1024];
while (!feof(pipe) && !ferror(pipe)) {
TString line;
do {
if (fgets(buf, sizeof(buf), pipe) == 0) break;
line += buf;
} while (!ferror(pipe) && !feof(pipe) && strchr(buf,'n') == 0);
if (line.EndsWith("n")) line.Chop();
Info("Release","line = %s", line.Data());
}
Int_t r = gSystem->ClosePipe(pipe);
Info("Release","command: %s returned %d", cmd.Data(), r);
fClaims->Remove(claim);
delete claim;
}
fState = kFree;
return kTRUE;
}
//______________________________________________________________________________
Bool_t TCondor::GetVmInfo(const char *vm, TString &image, Int_t &perfidx) const
{
TString cmd = Form("condor_status -format "%%d:" Mips -format "%%s\n" FileSystemDomain "
"-const 'Name=="%s"'", vm);
Info("GetVmInfo","command: %s", cmd.Data());
FILE *pipe = gSystem->OpenPipe(cmd, "r");
if (!pipe) {
SysError("GetVmInfo","cannot run command: %s", cmd.Data());
return 0;
}
char buf[1024];
while (!feof(pipe) && !ferror(pipe)) {
TString line;
do {
if (fgets(buf, sizeof(buf), pipe) == 0) break;
line += buf;
} while (!ferror(pipe) && !feof(pipe) && strchr(buf,'n') == 0);
if (line.EndsWith("n")) line.Chop();
if (line != "") {
Info("GetVmInfo","line = %s", line.Data());
TString amips = line(TRegexp("^[0-9]*"));
perfidx = atoi(amips);
image = line(TRegexp("[^:]+$"));
break;
}
}
Int_t r = gSystem->ClosePipe(pipe);
Info("GetVmInfo","command: %s returned %d", cmd.Data(), r);
return kTRUE;
}
//______________________________________________________________________________
TString TCondor::GetImage(const char *host) const
{
TString cmd = Form("condor_status -direct %s -format "Image:%%s\n" "
"FileSystemDomain", host);
Info("GetImage","command: %s", cmd.Data());
FILE *pipe = gSystem->OpenPipe(cmd, "r");
if (!pipe) {
SysError("GetImage","cannot run command: %s", cmd.Data());
return 0;
}
char buf[1024];
TString image;
while (!feof(pipe) && !ferror(pipe)) {
TString line;
do {
if (fgets(buf, sizeof(buf), pipe) == 0) break;
line += buf;
} while (!ferror(pipe) && !feof(pipe) && strchr(buf,'n') == 0);
if (line.EndsWith("n")) line.Chop();
if (line != "") {
Info("GetVmInfo","line = %s", line.Data());
image = line(TRegexp("[^:]+$"));
break;
}
}
Int_t r = gSystem->ClosePipe(pipe);
Info("GetVmInfo","command: %s returned %d", cmd.Data(), r);
return image;
}
ROOT page - Class index - Top of the page
This page has been automatically generated. If you have any comments or suggestions about the page layout send a mail to ROOT support, or contact the developers with any questions or problems regarding ROOT.