On Fri, 2005-04-08 at 09:59, Dennis Hsu wrote:
After installing, I modified three attributes in condor_config as follows:
DAEMON_LIST = MASTER, STARTD, SCHEDD, NEGOTIATOR, COLLECTOR
In condor_config:
DAEMON_LIST = MASTER, STARTD, SCHEDD
and in the local configuration file of the master, define this:
DAEMON_LIST = MASTER, COLLECTOR, NEGOTIATOR, STARTD, SCHEDD
NUM_CPUS=1
NUM_CPUS = 1 (you have to define this in the local configuration file of each machine, although it is not required to change it)
MEMORY=256
MEMORY = 128 (you have to define this in the local configuration file of each machine)
Then stop the condor_master and start it again.
Well, actually you only have to start the startd daemon, but to avoid confusion you had better stop and then start the condor_master on all the servers, then submit the job and see what it says.
I have submitted loop.cmd and io.cmd, but they are in idle status.
Then I run condor_q -analyze and find that they do not meet some requirements.
What does that mean?
I need your help.
Thank you!
------------------------------------------------------------------------------------------------------
[condor@grid examples]$ condor_status
Name OpSys Arch State Activity LoadAv Mem ActvtyTime
cluster_101.a LINUX INTEL Owner Idle 0.000 256 0+00:49:45
cluster_102.a LINUX INTEL Owner Idle 0.000 256[?????]
cluster_103.a LINUX INTEL Owner Idle 0.000 256 0+00:49:44
vm1@xxxxxxxxx LINUX INTEL Owner Idle 0.000 128 0+01:20:10
vm2@xxxxxxxxx LINUX INTEL Owner Idle 0.000 128 0+01:20:11
Machines Owner Claimed Unclaimed Matched Preempting
INTEL/LINUX 5 5 0 0 0 0
Total 5 5 0 0 0 0
------------------------------------------------------------------------------------------------------
[root@grid hosts]# condor_q
-- Submitter: grid.ancad.com : <192.168.10.244:32853> : grid.ancad.com
ID OWNER SUBMITTED RUN_TIME ST PRI SIZE CMD
2.0 condor 4/8 11:36 0+00:00:00 I 0 11.7 loop.remote 200
2.1 condor 4/8 11:36 0+00:00:00 I 0 11.7 loop.remote 200
2.2 condor 4/8 11:36 0+00:00:00 I 0 11.7 loop.remote 300
2.3 condor 4/8 11:36 0+00:00:00 I 0 11.7 loop.remote 300
2.4 condor 4/8 11:36 0+00:00:00 I 0 11.7 loop.remote 500
4.0 condor 4/8 11:47 0+00:00:00 I 0 11.7 io.remote 200
6 jobs; 6 idle, 0 running, 0 held
------------------------------------------------------------------------------------------------------
[condor@grid examples]$ condor_q -analyze 2.0
-- Submitter: grid.ancad.com : <192.168.10.244:32853> : grid.ancad.com
ID OWNER SUBMITTED RUN_TIME ST PRI SIZE CMD
---
002.000: Run analysis summary. Of 5 machines,
0 are rejected by your job's requirements
5 reject your job because of their own requirements
0 match, but are serving users with a better priority in the pool
0 match, match, but reject the job for unknown reasons
0 match, but will not currently preempt their existing job
0 are available to run your job
WARNING: Be advised: Request 2.0 did not match any resource's constraints
------------------------------------------------------------------------------------------------------
[condor@grid examples]$ condor_status -l grid.ancad.com
MyType = "Machine"
TargetType = "Job"
Name = "vm1@xxxxxxxxxxxxxx"
Machine = "grid.ancad.com"
Rank = 0.000000
CpuBusy = ((LoadAvg - CondorLoadAvg) >= 0.500000)
COLLECTOR_HOST_STRING = "grid.ancad.com"
CondorVersion = "$CondorVersion: 6.6.9 Mar 10 2005 $"
CondorPlatform = "$CondorPlatform: I386-LINUX_RH9 $"
VirtualMachineID = 1
VirtualMemory = 0
Disk = 16146864
CondorLoadAvg = 0.000000
LoadAvg = 0.000000
KeyboardIdle = 0
ConsoleIdle = 0
Memory = 128
Cpus = 1
StartdIpAddr = "<192.168.10.244:33004>"
Arch = "INTEL"
OpSys = "LINUX"
UidDomain = "grid.ancad.com"
FileSystemDomain = "grid.ancad.com"
Subnet = "192.168.10"
HasIOProxy = TRUE
TotalVirtualMemory = 0
TotalDisk = 32293728
KFlops = 762963
Mips = 1581
LastBenchmark = 1112929477
TotalLoadAvg = 0.000000
TotalCondorLoadAvg = 0.000000
ClockMin = 699
ClockDay = 5
TotalVirtualMachines = 2
HasFileTransfer = TRUE
HasMPI = TRUE
HasJICLocalConfig = TRUE
HasJICLocalStdin = TRUE
JavaVendor = "Sun Microsystems Inc."
JavaVersion = "1.4.2_07"
JavaMFlops = 182.734146
HasJava = TRUE
HasPVM = TRUE
HasRemoteSyscalls = TRUE
HasCheckpointing = TRUE
StarterAbilityList = "HasFileTransfer,HasMPI,HasJICLocalConfig,HasJICLocalStdin,HasJava,HasPVM,HasRemoteSyscalls,HasCheckpointing"
CpuBusyTime = 0
CpuIsBusy = FALSE
State = "Owner"
EnteredCurrentState = 1112929471
Activity = "Idle"
EnteredCurrentActivity = 1112929471
Start = ((KeyboardIdle > 15 * 60) && (((LoadAvg - CondorLoadAvg) <= 0.300000) || (State != "Unclaimed" && State != "Owner")))
Requirements = START
CurrentRank = 0.000000
DaemonStartTime = 1112929470
UpdateSequenceNumber = 7
MyAddress = "<192.168.10.244:33004>"
LastHeardFrom = 1112931581
UpdatesTotal = 8
UpdatesSequenced = 7
UpdatesLost = 0
UpdatesHistory = "0x00000000000000000000000000000000"
MyType = "Machine"
TargetType = "Job"
Name = "vm2@xxxxxxxxxxxxxx"
Machine = "grid.ancad.com"
Rank = 0.000000
CpuBusy = ((LoadAvg - CondorLoadAvg) >= 0.500000)
COLLECTOR_HOST_STRING = "grid.ancad.com"
CondorVersion = "$CondorVersion: 6.6.9 Mar 10 2005 $"
CondorPlatform = "$CondorPlatform: I386-LINUX_RH9 $"
VirtualMachineID = 2
VirtualMemory = 0
Disk = 16146864
CondorLoadAvg = 0.000000
LoadAvg = 0.000000
KeyboardIdle = 0
ConsoleIdle = 0
Memory = 128
Cpus = 1
StartdIpAddr = "<192.168.10.244:33004>"
Arch = "INTEL"
OpSys = "LINUX"
UidDomain = "grid.ancad.com"
FileSystemDomain = "grid.ancad.com"
Subnet = "192.168.10"
HasIOProxy = TRUE
TotalVirtualMemory = 0
TotalDisk = 32293728
KFlops = 762963
Mips = 1581
LastBenchmark = 1112929477
TotalLoadAvg = 0.000000
TotalCondorLoadAvg = 0.000000
ClockMin = 699
ClockDay = 5
TotalVirtualMachines = 2
HasFileTransfer = TRUE
HasMPI = TRUE
HasJICLocalConfig = TRUE
HasJICLocalStdin = TRUE
JavaVendor = "Sun Microsystems Inc."
JavaVersion = "1.4.2_07"
JavaMFlops = 182.734146
HasJava = TRUE
HasPVM = TRUE
HasRemoteSyscalls = TRUE
HasCheckpointing = TRUE
StarterAbilityList = "HasFileTransfer,HasMPI,HasJICLocalConfig,HasJICLocalStdin,HasJava,HasPVM,HasRemoteSyscalls,HasCheckpointing"
CpuBusyTime = 0
CpuIsBusy = FALSE
State = "Owner"
EnteredCurrentState = 1112929471
Activity = "Idle"
EnteredCurrentActivity = 1112929471
Start = ((KeyboardIdle > 15 * 60) && (((LoadAvg - CondorLoadAvg) <= 0.300000) || (State != "Unclaimed" && State != "Owner")))
Requirements = START
CurrentRank = 0.000000
DaemonStartTime = 1112929470
UpdateSequenceNumber = 7
MyAddress = "<192.168.10.244:33004>"
LastHeardFrom = 1112931582
UpdatesTotal = 8
UpdatesSequenced = 7
UpdatesLost = 0
UpdatesHistory = "0x00000000000000000000000000000000"
------------------------------------------------------------------------------------------------------
Best Regards,
Dennis Hsu
--------------------------
AnCAD Inc.
5F, No. 67, Sec. 1, Yonghe Rd.,
Yonghe City, Taipei County, 234
Taiwan
_______________________________________________
Condor-users mailing list
Condor-users@xxxxxxxxxxx
https://lists.cs.wisc.edu/mailman/listinfo/condor-users
|