[torqueusers] Not Running: Not enough memory available
Carlos López
natorro at fisica.unam.mx
Thu Aug 28 12:20:07 MDT 2008
Hi! :-) I can't seem to find out how to solve the following problem...
I have a 10-node cluster with 2 GB of RAM and 2 processors in each node.
I configured the following queues:
------
create queue medium
set queue medium queue_type = Execution
set queue medium max_user_queuable = 20
set queue medium max_running = 20
set queue medium acl_hosts =
ollin+ollin-1+ollin-2+ollin-3+ollin-4+ollin-5+ollin-6+ollin-7+ollin-8+ollin-9+ollin-10
set queue medium resources_max.cput = 240:00:00
set queue medium resources_max.mem = 20000mb
set queue medium resources_default.cput = 240:00:00
set queue medium resources_default.walltime = 240:00:00
set queue medium max_user_run = 20
set queue medium enabled = True
set queue medium started = True
create queue prueba
set queue prueba queue_type = Execution
set queue prueba max_user_queuable = 20
set queue prueba max_running = 20
set queue prueba acl_hosts =
ollin+ollin-1+ollin-2+ollin-3+ollin-4+ollin-5+ollin-6+ollin-7+ollin-8+ollin-9+ollin-10
set queue prueba resources_max.cput = 02:00:00
set queue prueba resources_max.mem = 20000mb
set queue prueba resources_default.cput = 02:00:00
set queue prueba resources_default.walltime = 02:00:00
set queue prueba max_user_run = 20
set queue prueba enabled = True
set queue prueba started = True
create queue long
set queue long queue_type = Execution
set queue long max_user_queuable = 20
set queue long max_running = 20
set queue long acl_hosts =
ollin+ollin-1+ollin-2+ollin-3+ollin-4+ollin-5+ollin-6+ollin-7+ollin-8+ollin-9+ollin-10
set queue long resources_max.cput = 720:00:00
set queue long resources_max.mem = 20000mb
set queue long resources_default.cput = 720:00:00
set queue long resources_default.walltime = 720:00:00
set queue long max_user_run = 20
set queue long enabled = True
set queue long started = True
create queue short
set queue short queue_type = Execution
set queue short max_user_queuable = 20
set queue short max_running = 20
set queue short acl_hosts =
ollin+ollin-1+ollin-2+ollin-3+ollin-4+ollin-5+ollin-6+ollin-7+ollin-8+ollin-9+ollin-10
set queue short resources_max.cput = 48:00:00
set queue short resources_max.mem = 20000mb
set queue short resources_default.cput = 48:00:00
set queue short resources_default.walltime = 48:00:00
set queue short max_user_run = 20
set queue short enabled = True
set queue short started = True
set server scheduling = True
set server max_running = 40
set server operators = root at ollin.fisica.unam.mx
set server default_queue = medium
set server log_events = 511
set server mail_from = adm
set server query_other_jobs = True
set server resources_available.ncpus = 22
set server resources_available.nodect = 11
set server resources_available.nodes = 11
set server resources_default.nodes = 1
set server scheduler_iteration = 60
set server node_check_rate = 150
set server tcp_timeout = 6
set server node_pack = False
set server log_level = 1
set server pbs_version = 2.2.1
------------
I submitted a job script with qsub, which was:
--------
#!/bin/tcsh
#PBS -q long
cd /home/abl/2009-1/mp1
w2web
runsp_lapw -ec 0.0001 -i 100 -NI
--------
Now I am trying to submit one more, which is:
-------
#!/bin/tcsh
#PBS -q
long
cd /home/abl/2009-1/delta_012/mp1
w2web
runsp_lapw -ec 0.0001 -i 100 -NI
---------
and when I check it with qstat -f it says:
comment = Not Running: Not enough memory available
As far as I know, this program uses at most 400 MB of RAM, so why is it
not working? :-( Can anybody give me a hand with this?
Thank you very much
Carlos
--
This message has been scanned for viruses and
dangerous content by MailScanner, and is
believed to be clean.
More information about the torqueusers
mailing list