Differences

This shows you the differences between two versions of the page.

--- condor:installation:configuration [2011/07/14 13:53] – created, configuration files added garrettheath4
+++ condor:installation:configuration [2011/07/28 19:14] – garrettheath4
@@ Line 1: / Line 1: @@
-====== Post-Install Configuration ======
+======Condor Configuration Files======
+This page contains copies of the configuration files we use on our system.  Use the table of contents to the right to jump to a specific configuration file.
-===== Global Configuration File =====
+=====Global Configuration File=====
-<file autoconf condor_config>######################################################################
+<file autoconf condor_config_global>######################################################################
 ##
 ##  condor_config
@@ Line 55: / Line 56: @@
 ##  Pathnames:
 ##--------------------------------------------------------------------
+##  Where are all of the Condor-related files stored for the entire
+##  Condor system?
+CondorDir		= /mnt/config
 ##  Where have you installed the bin, sbin and lib condor directories?
-RELEASE_DIR		= /usr/local/condor
+RELEASE_DIR		= $(CondorDir)/release/x86_64_rhap_5
 ##  Where is the local condor directory for each host?
 ##  This is where the local config file(s), logs and
 ##  spool/execute directories are located
-LOCAL_DIR		= $(TILDE)
+LOCAL_DIR		= $(CondorDir)/hosts/$(FULL_HOSTNAME)
-#LOCAL_DIR		= $(RELEASE_DIR)/hosts/$(HOSTNAME)
 ##  Where is the machine-specific local config file for each host?
-LOCAL_CONFIG_FILE = /var/lib/condor/condor_config.local
+#LOCAL_CONFIG_FILE = $(LOCAL_DIR)/condor_config.local
+# If this computer is the Condor Central Manager, load the central
+# manager/master config file.  Otherwise, load the worker config file.
+#LOCAL_CONFIG_FILE = ifThenElse($(FULL_HOSTNAME)=?=$(CondorHost_RealName),$(CondorDir)/hosts/condor_config_manager.local,$(CondorDir)/hosts/condor_config_worker.local)
 ##  Where are optional machine-specific local config files located?
 ##  Config files are included in lexicographic order.
 LOCAL_CONFIG_DIR	= $(LOCAL_DIR)/config
-#LOCAL_CONFIG_DIR	= $(LOCAL_DIR)/config
 ## Blacklist for file processing in the LOCAL_CONFIG_DIR
@@ Line 78: / Line 85: @@
 ## WARNING: This is a potential security issue.
 ## If not specified, the default is True
-#REQUIRE_LOCAL_CONFIG_FILE = TRUE
+REQUIRE_LOCAL_CONFIG_FILE = TRUE
 ##--------------------------------------------------------------------
@@ Line 105: / Line 112: @@
 ##  to specify that each machine has its own file system.
 FILESYSTEM_DOMAIN	= cs.wlu.edu
+## What machine is your central manager?
+CONDOR_HOST = john.cs.wlu.edu
+# "condor.cs.wlu.edu" is just an alias.  What does the central
+# manager call itself?  That is, what does `hostname` return?
+CondorHost_RealName = $(CONDOR_HOST)
 ##  This macro is used to specify a short description of your pool.
@@ Line 131: / Line 144: @@
 ##  (this can also be specified in the environment)
 ##  Note: the CONDOR_IDS setting is ignored on Win32 platforms
-#CONDOR_IDS=x.x
+# NOTE: CONDOR_IDS is defined in the machine-specific configuration files
+#CONDOR_IDS=1344.1610
 ##--------------------------------------------------------------------
@@ Line 142: / Line 156: @@
 ##
 ##  To flock to others, define FLOCK_TO.
+## Join the W&L CS Pool (Orion)
+# Designate which machines are members of this pool.
+# NOTE: In order to make it easy to automatically change this variable when
+#       running the installation script, the "PoolMembers" variable and its
+#       value should all be on one line (no line breaks).
+PoolMembers = john.cs.wlu.edu, carl.cs.wlu.edu, fred.cs.wlu.edu, babbage.cs.wlu.edu
 ##  FLOCK_FROM defines the machines where you would like to grant
 ##  people access to your pool via flocking. (i.e. you are granting
 ##  access to these machines to join your pool).
-FLOCK_FROM = *.cs.wlu.edu
+FLOCK_FROM = $(PoolMembers)
 ##  An example of this is:
 #FLOCK_FROM = somehost.friendly.domain, anotherhost.friendly.domain
@@ Line 154: / Line 175: @@
 ##  want your jobs to be negotiated at -- thereby specifying the
 ##  pools they will run in.)
-FLOCK_TO =
+FLOCK_TO = $(CONDOR_HOST)
 ##  An example of this is:
 #FLOCK_TO = central_manager.friendly.domain, condor.cs.wisc.edu
@@ Line 176: / Line 197: @@
 ##  Please see the administrator's manual for details on these
 ##  settings, what they're for, and how to use them.
+# Define fully-qualified usernames for users' right definitions
+CondorUsers = condor@$(UID_DOMAIN)/john.cs.wlu.edu, \
+              condor@$(UID_DOMAIN)/carl.cs.wlu.edu, \
+              condor@$(UID_DOMAIN)/fred.cs.wlu.edu
+AdminUsers = koller@$(UID_DOMAIN)/$(CONDOR_HOST)
+RootUsers = root@$(UID_DOMAIN)/john.cs.wlu.edu, \
+            root@$(UID_DOMAIN)/carl.cs.wlu.edu, \
+            root@$(UID_DOMAIN)/fred.cs.wlu.edu
 ##  What machines have administrative rights for your pool?  This
@@ Line 182: / Line 212: @@
 ##  (assuming you trust all the users who log into that/those
 ##  machine(s), since this is machine-wide access you're granting).
-ALLOW_ADMINISTRATOR = $(CONDOR_HOST)
+ALLOW_ADMINISTRATOR = $(AdminUsers)
 ##  If there are no machines that should have administrative access
@@ Line 208: / Line 238: @@
 ##  you install, configure or debug your Condor installation.
 ##  It is important to have this defined.
-ALLOW_READ = *.cs.wlu.edu
+ALLOW_READ = $(AdminUsers), $(CondorUsers), *@cs.wlu.edu/*.cs.wlu.edu, \
+             *.cs.wisc.edu
 #ALLOW_READ = *.your.domain, *.cs.wisc.edu
 #DENY_READ = *.bad.subnet, bad-machine.your.domain, 144.77.88.*
@@ Line 224: / Line 255: @@
 ##  machines to your pool and is a serious security risk.
-ALLOW_WRITE = $(FULL_HOSTNAME), $(IP_ADDRESS)
+ALLOW_WRITE = $(AdminUsers), $(CondorUsers), \
+              *@cs.wlu.edu/*.cs.wlu.edu
 #ALLOW_WRITE = *.your.domain, your-friend's-machine.other.domain
 #DENY_WRITE = bad-machine.your.domain
@@ Line 241: / Line 273: @@
 ##  Negotiator access.  Machines listed here are trusted central
 ##  managers.  You should normally not have to change this.
+#ALLOW_NEGOTIATOR = condor@$(CONDOR_HOST)/$(CONDOR_HOST)
 ALLOW_NEGOTIATOR = $(CONDOR_HOST)
 ##  Now, with flocking we need to let the SCHEDD trust the other
@@ Line 251: / Line 284: @@
 ##  access should only be granted with extreme caution.  By default,
 ##  config access is denied from all hosts.
-#ALLOW_CONFIG = trusted-host.your.domain
+ALLOW_CONFIG = $(AdminUsers)
+## Daemon Access added by Garrett Koller (not in default config file)
+##  Daemon access.  Machines listed here are allowed to communicate
+##  with the daemons of "this" machine.  Requests from the following
+##  machines will be acknowledged and appropriate responses will be sent.
+#ALLOW_DAEMON = $(CondorUsers), $(FULL_HOSTNAME), $(RootUsers)
+ALLOW_DAEMON = $(PoolMembers)
+## Client Access added by Garrett Koller (not in default config file)
+##  Client access.  "When I am acting as a client, these are the servers
+##  I allow or deny."
+ALLOW_CLIENT = $(PoolMembers)
 ##  Flocking Configs.  These are the real things that Condor looks at,
@@ Line 260: / Line 305: @@
 ALLOW_READ_COLLECTOR  = $(ALLOW_READ), $(FLOCK_FROM)
 ALLOW_READ_STARTD     = $(ALLOW_READ), $(FLOCK_FROM)
+# Clear out any old-style HOSTALLOW settings:
+HOSTALLOW_READ =
+HOSTALLOW_WRITE =
+HOSTALLOW_DAEMON =
+HOSTALLOW_NEGOTIATOR =
+HOSTALLOW_ADMINISTRATOR =
+HOSTALLOW_OWNER =
+##--------------------------------------------------------------------
+##  Authentication
+##--------------------------------------------------------------------
+## Authentication added by Garrett Koller (not in default config file)
+##  These parameters define how Condor will know whether or not a
+##  machine that attempts to communicate with it is who it says it is.
+##  Refer to Section 3.6.3 "Authentication" of the Condor
+##  documentation for more information
+# A client process (run by a normal user on a machine that may or
+# may not have Condor installed, such as condor_submit) or another
+# Condor daemon (either running locally or remotely) will offer these
+# authentication methods when trying to communicate with the Condor
+# system daemons.
+SEC_CLIENT_AUTHENTICATION = PREFERRED
+SEC_CLIENT_AUTHENTICATION_METHODS = PASSWORD, FS, FS_REMOTE
+SEC_CLIENT_INTEGRITY = OPTIONAL
+# A daemon will accept these forms of authentication when
+# communicating
+SEC_DEFAULT_AUTHENTICATION = PREFERRED
+SEC_DEFAULT_AUTHENTICATION_METHODS = PASSWORD, FS, FS_REMOTE
+SEC_DEFAULT_INTEGRITY = OPTIONAL
+# Password authentication
+# Note: TILDE refers to the 'condor' user's home directory.
+SEC_PASSWORD_FILE = $(TILDE)/pool_password
+FS_REMOTE_DIR = $(CondorDir)/scratch
+SEC_ADMINISTRATOR_AUTHENTICATION = REQUIRED
+SEC_CONFIG_AUTHENTICATION = REQUIRED
+SEC_READ_AUTHENTICATION = OPTIONAL
@@ Line 277: / Line 363: @@
 ## uncomment the following setting and change the value to "True".
 ## Note: changing this requires a restart not just a reconfig.
-#ENABLE_RUNTIME_CONFIG = False
+ENABLE_RUNTIME_CONFIG = True
 ## Do you want to allow condor_config_val -set to work at all?
@@ Line 283: / Line 369: @@
 ## uncomment the following setting and change the value to "True".
 ## Note: changing this requires a restart not just a reconfig.
-#ENABLE_PERSISTENT_CONFIG = False
+ENABLE_PERSISTENT_CONFIG = False
 ## Directory where daemons should write persistent config files (used
@@ Line 297: / Line 383: @@
 ##  prior to version 6.3.3.  If you don't need this behavior, you
 ##  should leave this commented out.
-#SETTABLE_ATTRS_CONFIG = *
+SETTABLE_ATTRS_CONFIG = *
 ##  Attributes that can be set by hosts with "ADMINISTRATOR"
@@ Line 326: / Line 412: @@
 ##  Do you want to use NFS for file access instead of remote system
 ##  calls?
-#USE_NFS		= False
+USE_NFS		= True
 ##  Do you want to use AFS for file access instead of remote system
@@ Line 339: / Line 425: @@
 ##  False, checkpoints will be written to the local SPOOL directory on
 ##  the submission machine.
-#USE_CKPT_SERVER	= True
+USE_CKPT_SERVER	= False
 ##  What's the hostname of this machine's nearest checkpoint server?
@@ Line 369: / Line 455: @@
 ## Assume we can use up to 80% of memory and estimate shadow private data
 ## size of 800k.
-#MAX_SHADOWS_MEM	= ceiling($(DETECTED_MEMORY)*0.8*1024/800)
+MAX_SHADOWS_MEM	= ceiling($(DETECTED_MEMORY)*0.8*1024/800)
 ## Assume we can use ~21,000 ephemeral ports (avg ~2.1 per shadow).
 ## Under Linux, the range is set in /proc/sys/net/ipv4/ip_local_port_range.
-#MAX_SHADOWS_PORTS	= 10000
+MAX_SHADOWS_PORTS	= 10000
 ## Under windows, things are much less scalable, currently.
 ## Note that this can probably be safely increased a bit under 64-bit windows.
-#MAX_SHADOWS_OPSYS	= ifThenElse(regexp("WIN.*","$(OPSYS)"),200,100000)
+MAX_SHADOWS_OPSYS	= ifThenElse(regexp("WIN.*","$(OPSYS)"),200,100000)
 ## Now build up the expression for MAX_JOBS_RUNNING.  This is complicated
 ## due to lack of a min() function.
-#MAX_JOBS_RUNNING	= $(MAX_SHADOWS_MEM)
+MAX_JOBS_RUNNING	= $(MAX_SHADOWS_MEM)
-#MAX_JOBS_RUNNING	= \
+MAX_JOBS_RUNNING	= \
-#  ifThenElse( $(MAX_SHADOWS_PORTS) < $(MAX_JOBS_RUNNING), \
+  ifThenElse( $(MAX_SHADOWS_PORTS) < $(MAX_JOBS_RUNNING), \
-#              $(MAX_SHADOWS_PORTS), \
+              $(MAX_SHADOWS_PORTS), \
-#              $(MAX_JOBS_RUNNING) )
+              $(MAX_JOBS_RUNNING) )
-#MAX_JOBS_RUNNING	= \
+MAX_JOBS_RUNNING	= \
-#  ifThenElse( $(MAX_SHADOWS_OPSYS) < $(MAX_JOBS_RUNNING), \
+  ifThenElse( $(MAX_SHADOWS_OPSYS) < $(MAX_JOBS_RUNNING), \
-#              $(MAX_SHADOWS_OPSYS), \
+              $(MAX_SHADOWS_OPSYS), \
-#              $(MAX_JOBS_RUNNING) )
+              $(MAX_JOBS_RUNNING) )
@@ Line 411: / Line 497: @@
 ##  you've set in the CONDOR_IDS environment variable.  See the Admin
 ##  manual for details on this.
-LOCK		= $(LOG)
+LOCK		= /tmp/condor-lock
 ##  If you don't use a fully qualified name in your /etc/hosts file
@@ Line 429: / Line 515: @@
 ##  your top-level config file for this mode of operation to work
 ##  properly.
-#NO_DNS = True
+NO_DNS = False
 ##  Condor can be told whether or not you want the Condor daemons to
@@ Line 477: / Line 563: @@
 ##  default for this setting is False, since it is more secure this
 ##  way.
-#TRUST_UID_DOMAIN = False
+TRUST_UID_DOMAIN = False
 ## If you would like to be informed in near real-time via condor_q when
@@ Line 496: / Line 582: @@
 ## it being defined to False. Set it to True to allow the shadow to execute
 ## arbitrary shell code from the user job.
-#SHADOW_ALLOW_UNSAFE_REMOTE_EXEC = False
+SHADOW_ALLOW_UNSAFE_REMOTE_EXEC = False
 ## KEEP_OUTPUT_SANDBOX is an optional feature to tell Condor-G to not
@@ Line 546: / Line 632: @@
 ## The allowed values are case insensitive.
 ## The default of this parameter if not specified is: stm_use_schedd_only
-#SANDBOX_TRANSFER_METHOD = stm_use_schedd_only
+SANDBOX_TRANSFER_METHOD = stm_use_schedd_only
 ## This setting specifies an IP address that depends on the setting of
@@ Line 557: / Line 643: @@
 ## interface if one is available. If it cannot decide which of two interfaces
 ## to choose from, it will pick the first one.
-#NETWORK_INTERFACE =
+#BIND_ALL_INTERFACES = True
+#NETWORK_INTERFACE = eth0
 ##--------------------------------------------------------------------
@@ Line 567: / Line 654: @@
 ##
-ALL_DEBUG               =
+#TODO
+ALL_DEBUG               = D_SECURITY
 MAX_COLLECTOR_LOG	= 1000000
@@ Line 593: / Line 681: @@
 MASTER_DEBUG		=
 ##  When the master starts up, should it truncate its log file?
-#TRUNC_MASTER_LOG_ON_OPEN        = False
+TRUNC_MASTER_LOG_ON_OPEN        = False
 MAX_JOB_ROUTER_LOG      = 1000000
@@ Line 621: / Line 709: @@
 ## instance of a daemon stopped running. This parameter controls how often
 ## the daemons touch the file (in seconds).
-#TOUCH_LOG_INTERVAL = 60
+TOUCH_LOG_INTERVAL = 300
 ######################################################################
@@ Line 679: / Line 767: @@
 JustCPU			= ($(CPUBusy) && ($(KeyboardBusy) == False))
 MachineBusy		= ($(CPUBusy) || $(KeyboardBusy))
+##  If job submitter user is listed here, give the job a high priority.
+GreedyUserRank =  (Owner == "stoughj") \
+                     + (Owner == "stough" * 10) \
+                     + (Owner == "koller") \
+                     + (Owner == "gkoller") \
+                     + (Owner == "nguyenp") \
+                     + (Owner == "davisl")
+IsGreedyUser   =  ($(GreedyUserRank) > 0)
 ##  The RANK expression controls which jobs this machine prefers to
@@ Line 687: / Line 785: @@
 ##  By default, RANK is always 0, meaning that all jobs have an equal
 ##  ranking.
-#RANK			= 0
+RANK			= $(GreedyUserRank) + ((TotalSlots > 1) * (SlotID / TotalSlots)) + ((KeyboardIdle > 15 * 60) * (5)) + (1 - LoadAvg)
@@ Line 705: / Line 803: @@
 # When should we only consider SUSPEND instead of PREEMPT?
-WANT_SUSPEND 		= $(UWCS_WANT_SUSPEND)
+#WANT_SUSPEND 		= $(UWCS_WANT_SUSPEND)
+WANT_SUSPEND 		= ( $(SmallJob) || $(KeyboardNotBusy) \
+                            || $(IsVanilla) ) \
+                          && ( $(SUSPEND) )
 # When should we preempt gracefully instead of hard-killing?
-WANT_VACATE		= $(UWCS_WANT_VACATE)
+#WANT_VACATE 		= $(UWCS_VACATE)
+WANT_VACATE		= ( $(ActivationTimer) > 10 * $(MINUTE) \
+                            || $(IsVanilla) )
 ##  When is this machine willing to start a job?
-START			= $(UWCS_START)
+#Note: START is redefined in the local config file of 'babbage.cs.wlu.edu'
+#START			= ($(UWCS_START) || $(IsGreedyUser))
+START			= ( $(CPUIdle) || \
+                            (State != "Unclaimed" && State != "Owner"))
 ##  When should a local universe job be allowed to start?
@@ Line 720: / Line 826: @@
 ##  When to suspend a job?
-SUSPEND			= $(UWCS_SUSPEND)
+#SUSPEND			= ($(UWCS_SUSPEND) && ($(IsGreedyUser) == False))
+SUSPEND			= ( (CpuBusyTime > 2 * $(MINUTE)) \
+                            && $(ActivationTimer) > 90 )
 ##  When to resume a suspended job?
-CONTINUE		= $(UWCS_CONTINUE)
+#CONTINUE		= ($(UWCS_CONTINUE) || $(IsGreedyUser))
+CONTINUE		= ( $(CPUIdle) && ($(ActivityTimer) > 5) )
 ##  When to nicely stop a job?
 ##  (as opposed to killing it instantaneously)
-PREEMPT			= $(UWCS_PREEMPT)
+#PREEMPT			= ($(UWCS_PREEMPT) && ($(IsGreedyUser) == False))
+PREEMPT			= ( ((Activity == "Suspended") && \
+                  ($(ActivityTimer) > $(MaxSuspendTime))) \
+		 || (SUSPEND && (WANT_SUSPEND == False)) )
 ##  When to instantaneously kill a preempting job
@@ Line 931: / Line 1043: @@
 LOG		= $(LOCAL_DIR)/log
 SPOOL		= $(LOCAL_DIR)/spool
-EXECUTE		= $(LOCAL_DIR)/execute
+#EXECUTE		= $(LOCAL_DIR)/execute
+# Note: TILDE refers to the 'condor' user's home directory.
+EXECUTE		= $(TILDE)/execute
 BIN		= $(RELEASE_DIR)/bin
 LIB		= $(RELEASE_DIR)/lib
@@ Line 971: / Line 1085: @@
 ## This attribute only takes effect on restart of the daemons or at the next
 ## update time.
-# LOCK_FILE_UPDATE_INTERVAL = 28800
+ LOCK_FILE_UPDATE_INTERVAL = 28800
 ##  This setting primarily allows you to change the port that the
@@ Line 989: / Line 1103: @@
 ##  How long are you willing to let daemons try their graceful
 ##  shutdown methods before they do a hard shutdown? (30 minutes)
-#SHUTDOWN_GRACEFUL_TIMEOUT	= 1800
+SHUTDOWN_GRACEFUL_TIMEOUT	= 1800
 ##  How much disk space would you like reserved from Condor?  In
@@ Line 995: / Line 1109: @@
 ##  partitions, it subtracts the amount it really finds by this
 ##  many megabytes.  (If undefined, defaults to 0).
-RESERVED_DISK		= 5
+RESERVED_DISK		= 50
 ##  If your machine is running AFS and the AFS cache lives on the same
@@ Line 1017: / Line 1131: @@
 ##  set to your domain, not $(FULL_HOSTNAME), and 2) email to
 ##  user@UID_DOMAIN won't work.
-#EMAIL_DOMAIN = $(FULL_HOSTNAME)
+EMAIL_DOMAIN = mail.wlu.edu
 ##  Should Condor daemons create a UDP command socket (for incoming
@@ Line 1056: / Line 1170: @@
 ## different port ranges for incoming and outgoing connections by
 ## using IN_HIGHPORT/IN_LOWPORT and OUT_HIGHPORT/OUT_LOWPORT.
-#HIGHPORT = 9700
+HIGHPORT = 9700
-#LOWPORT = 9600
+LOWPORT = 9600
 ##  If a daemon doesn't respond for too long, do you want to generate
@@ Line 1073: / Line 1187: @@
 ##--------------------------------------------------------------------
 ##  Daemons you want the master to keep running for you:
-DAEMON_LIST			= MASTER, STARTD, SCHEDD
+# NOTE: DAEMON_LIST is defined in the local configuration files
+#DAEMON_LIST			= MASTER, STARTD, KBDD
 ##  Which daemons use the Condor DaemonCore library (i.e., not the
@@ Line 1118: / Line 1233: @@
 ##  If a daemon dies an unnatural death, do you want email about it?
-#PUBLISH_OBITUARIES		= True
+PUBLISH_OBITUARIES		= True
 ##  If you're getting obituaries, how many lines of the end of that
 ##  daemon's log file do you want included in the obituary?
-#OBITUARY_LOG_LENGTH		= 20
+OBITUARY_LOG_LENGTH		= 30
 ##  Should the master run?
-#START_MASTER			= True
+START_MASTER			= True
 ##  Should the master start up the daemons you want it to?
-#START_DAEMONS			= True
+START_DAEMONS			= True
 ##  How often do you want the master to send an update to the central
 ##  manager?
-#MASTER_UPDATE_INTERVAL		= 300
+MASTER_UPDATE_INTERVAL		= 300
 ##  How often do you want the master to check the timestamps of the
 ##  daemons it's running?  If any daemons have been modified, the
 ##  master restarts them.
-#MASTER_CHECK_NEW_EXEC_INTERVAL	= 300
+MASTER_CHECK_NEW_EXEC_INTERVAL	= 1800
 ##  Once you notice new binaries, how long should you wait before you
 ##  try to execute them?
-#MASTER_NEW_BINARY_DELAY	= 120
+MASTER_NEW_BINARY_DELAY	= 120
 ##  What's the maximum amount of time you're willing to give the
 ##  daemons to quickly shutdown before you just kill them outright?
-#SHUTDOWN_FAST_TIMEOUT		= 120
+SHUTDOWN_FAST_TIMEOUT		= 120
 ######
@@ Line 1154: / Line 1269: @@
 ##  the exponent used to determine how long to wait before starting
 ##  the daemon again:
-#MASTER_BACKOFF_FACTOR		= 2.0
+MASTER_BACKOFF_FACTOR		= 2.0
 ##  What's the maximum amount of time you want the master to wait
 ##  between attempts to start a given daemon?  (With 2.0 as the
 ##  MASTER_BACKOFF_FACTOR, you'd hit 1 hour in 12 restarts...)
-#MASTER_BACKOFF_CEILING		= 3600
+MASTER_BACKOFF_CEILING		= 3600
 ##  How long should a daemon run without crashing before we consider
 ##  it "recovered".  Once a daemon has recovered, we reset the number
 ##  of restarts so the exponential backoff stuff goes back to normal.
-#MASTER_RECOVER_FACTOR		= 300
+MASTER_RECOVER_FACTOR		= 300
@@ Line 1172: / Line 1287: @@
 ## Address to which Condor will send a weekly e-mail with output of
 ## condor_status.
+# NOTE: CONDOR_DEVELOPERS is defined in the local configuration files
 #CONDOR_DEVELOPERS = condor-admin@cs.wisc.edu
@@ Line 1184: / Line 1300: @@
 ## Determine if the Negotiator will honor SlotWeight attributes, which
 ## may be used to give a slot greater weight when calculating usage.
-#NEGOTIATOR_USE_SLOT_WEIGHTS = True
+NEGOTIATOR_USE_SLOT_WEIGHTS = True
 ## How often the Negotiator starts a negotiation cycle, defined in
 ## seconds.
-#NEGOTIATOR_INTERVAL = 60
+NEGOTIATOR_INTERVAL = 60
 ## Should the Negotiator publish an update to the Collector after
 ## every negotiation cycle. It is useful to have this set to True
 ## to get immediate updates on LastNegotiationCycle statistics.
-#NEGOTIATOR_UPDATE_AFTER_CYCLE = False
+NEGOTIATOR_UPDATE_AFTER_CYCLE = False
@@ Line 1214: / Line 1330: @@
 ##  When a machine is claimed, how often should we poll the state of
 ##  the machine to see if we need to evict/suspend the job, etc?
-#POLLING_INTERVAL        = 5
+POLLING_INTERVAL        = 10
 ##  How often should the startd send updates to the central manager?
-#UPDATE_INTERVAL         = 300
+UPDATE_INTERVAL         = 300
 ##  How long is the startd willing to stay in the "matched" state?
-#MATCH_TIMEOUT		= 300
+MATCH_TIMEOUT		= 600
 ##  How long is the startd willing to stay in the preempting/killing
 ##  state before it just kills the starter directly?
-#KILLING_TIMEOUT	= 30
+KILLING_TIMEOUT	= 60
 ##  When a machine unclaimed, when should it run benchmarks?
@@ Line 1244: / Line 1360: @@
 ##  What's the max "load" of all running benchmarks?  With the default
 ##  (1.01), the startd will run the benchmarks serially.
-benchmarks_max_job_load = 1.0
+benchmarks_max_job_load = 1.01
 #  MIPS (Dhrystone 2.1) benchmark: load 1.0
@@ Line 1271: / Line 1387: @@
 ##  names of devices you want considered the console, without the
 ##  "/dev/" portion of the pathname.
-CONSOLE_DEVICES = mouse, console
+CONSOLE_DEVICES = console
@@ Line 1432: / Line 1548: @@
 ##  be "connected" to the keyboard (for remote tty activity, as well
 ##  as console activity).  Defaults to 1.
-#SLOTS_CONNECTED_TO_KEYBOARD = 1
+SLOTS_CONNECTED_TO_KEYBOARD = 1
 ##  If there are slots that aren't connected to the
@@ Line 1447: / Line 1563: @@
 ##  but you still want jobs to start right away on some of your SMP
 ##  nodes, just increase this parameter.
-#DISCONNECTED_KEYBOARD_IDLE_BOOST = 1200
+DISCONNECTED_KEYBOARD_IDLE_BOOST = 1200
 ######
@@ Line 1509: / Line 1625: @@
 ##  How often should the schedd send an update to the central manager?
-#SCHEDD_INTERVAL	= 300
+SCHEDD_INTERVAL	= 300
 ##  How long should the schedd wait between spawning each shadow?
-#JOB_START_DELAY	= 2
+JOB_START_DELAY	= 2
 ##  How many concurrent sub-processes should the schedd spawn to handle
 ##  queries?  (Unix only)
-#SCHEDD_QUERY_WORKERS   = 3
+SCHEDD_QUERY_WORKERS   = 10
 ##  How often should the schedd send a keep alive message to any
 ##  startds it has claimed?  (5 minutes)
-#ALIVE_INTERVAL		= 300
+ALIVE_INTERVAL		= 300
 ##  This setting controls the maximum number of times that a
@@ Line 1526: / Line 1642: @@
 ##  the condor_schedd will simply relinquish the match associated with
 ##  the dying shadow.
-#MAX_SHADOW_EXCEPTIONS	= 5
+MAX_SHADOW_EXCEPTIONS	= 5
 ##  Estimated virtual memory size of each condor_shadow process.
@@ Line 1535: / Line 1651: @@
 ##  submit machines.  How "nice" do you want the shadows? (1-19).
 ##  The higher the number, the lower priority the shadows have.
-# SHADOW_RENICE_INCREMENT	= 0
+SHADOW_RENICE_INCREMENT	= 1
 ## The condor_schedd can renice scheduler universe processes
@@ Line 1557: / Line 1673: @@
 ##  but it will ensure that all jobs that can be started will be
 ##  started.
-#NEGOTIATE_ALL_JOBS_IN_CLUSTER = False
+NEGOTIATE_ALL_JOBS_IN_CLUSTER = True
 ## This setting controls how often, in seconds, the schedd considers
@@ Line 1580: / Line 1696: @@
 ##  queue?  (These users will be able to remove other user's jobs).
 ##  By default, this only includes root.
-QUEUE_SUPER_USERS	= root, condor
+#
+# NOTE: QUEUE_SUPER_USERS is defined in the local configuration files
+#QUEUE_SUPER_USERS	= root, condor
@@ Line 1591: / Line 1709: @@
 ##  the job is started from scratch.  Defaults to 1 hour.  This
 ##  setting is only used if USE_CKPT_SERVER (from above) is True.
-#MAX_DISCARDED_RUN_TIME = 3600
+MAX_DISCARDED_RUN_TIME = 3600
 ##  Should periodic checkpoints be compressed?
-#COMPRESS_PERIODIC_CKPT = False
+COMPRESS_PERIODIC_CKPT = False
 ##  Should vacate checkpoints be compressed?
-#COMPRESS_VACATE_CKPT = False
+COMPRESS_VACATE_CKPT = False
 ##  Should we commit the application's dirty memory pages to swap
@@ Line 1610: / Line 1728: @@
 ##  How often should the shadow update the job queue with job
 ##  attributes that periodically change?  Specified in seconds.
-#SHADOW_QUEUE_UPDATE_INTERVAL = 15 * 60
+SHADOW_QUEUE_UPDATE_INTERVAL = 10 * 60
 ##  Should the shadow wait to update certain job attributes for the
@@ Line 1616: / Line 1734: @@
 ##  attributes as they change?  Due to performance concerns of
 ##  aggressive updates to a busy condor_schedd, the default is True.
-#SHADOW_LAZY_QUEUE_UPDATE = TRUE
+SHADOW_LAZY_QUEUE_UPDATE = TRUE
@@ Line 1630: / Line 1748: @@
 ##  zero (i.e. the job must be reniced) or the mechanism that
 ##  monitors CPU load on Win32 systems will give erratic results.
-#JOB_RENICE_INCREMENT	= 10
+JOB_RENICE_INCREMENT	= 4
 ##  Should the starter do local logging to its own log file, or send
 ##  debug information back to the condor_shadow where it will end up
 ##  in the ShadowLog?
-#STARTER_LOCAL_LOGGING	= TRUE
+STARTER_LOCAL_LOGGING	= FALSE
 ##  If the UID_DOMAIN settings match on both the execute and submit
@@ Line 1642: / Line 1760: @@
 ##  exit with an error.  Do you want the starter to just start up the
 ##  job with the specified UID, even if it's not in the passwd file?
-#SOFT_UID_DOMAIN	= FALSE
+SOFT_UID_DOMAIN	= FALSE
 ##  honor the run_as_owner option from the condor submit file.
 ##
-#STARTER_ALLOW_RUNAS_OWNER = TRUE
+STARTER_ALLOW_RUNAS_OWNER = TRUE
 ##  Tell the Starter/Startd what program to use to remove a directory
@@ Line 1703: / Line 1821: @@
 ##  site, uncomment these entries.
 #APPEND_REQUIREMENTS	= (expression to append job requirements)
-#APPEND_RANK		= (expression to append job rank)
+#APPEND_RANK		=
 ##  If you want expressions only appended for either standard or
@@ Line 1716: / Line 1834: @@
 ##  This can be used to define a default value for the rank expression
 ##  if one is not specified in the submit file.
-#DEFAULT_RANK	        = (default rank expression for all jobs)
+DEFAULT_RANK	        = 0
 ##  If you want universe-specific defaults, you can use the following
@@ Line 1748: / Line 1866: @@
 ##--------------------------------------------------------------------
 ##  Who should condor_preen send email to?
-#PREEN_ADMIN		= $(CONDOR_ADMIN)
+PREEN_ADMIN		= $(CONDOR_ADMIN)
 ##  What files should condor_preen leave in the spool directory?
@@ Line 1769: / Line 1887: @@
 JAVA = /usr/bin/java
+JAVA_MAXHEAP_ARGUMENT = -Xmx1024m
 ## JAVA_CLASSPATH_DEFAULT gives the default set of paths in which
@@ Line 2031: / Line 2150: @@
 ## Index file path of saved credentials.
 ## This file will be automatically created if it does not exist.
-#CRED_INDEX_FILE = $(CRED_STORE_DIR/cred-index
+CRED_INDEX_FILE = $(CRED_STORE_DIR)/cred-index
 ## condor_credd  will attempt to refresh credentials when their
@@ Line 2120: / Line 2239: @@
 # If this is set to true, then the rest of the QUILL arguments must be defined
-# for quill to function. If it is Fase or left undefined, then quill will not
+# for quill to function. If it is False or left undefined, then quill will not
 # be consulted by either the scheduler or the tools, but in the case of a
 # remote quill query where the local client has quill turned off, but the
 # remote client has quill turned on, things will still function normally.
-#QUILL_ENABLED = TRUE
+QUILL_ENABLED = FALSE
 #
@@ Line 2523: / Line 2642: @@
 ## name node (see HDFS_SERVICES) then the specified port will be used
 ## to run name node.
-HDFS_NAMENODE = hdfs://example.com:9000
+#HDFS_NAMENODE = hdfs://example.com:9000
-HDFS_NAMENODE_WEB = example.com:8000
+#HDFS_NAMENODE_WEB = example.com:8000
-HDFS_BACKUPNODE = hdfs://example.com:50100
+#HDFS_BACKUPNODE = hdfs://example.com:50100
-HDFS_BACKUPNODE_WEB = example.com:50105
+#HDFS_BACKUPNODE_WEB = example.com:50105
 ## You need to pick one machine as name node by setting this parameter
@@ Line 2585: / Line 2704: @@
-===== Condor Master Local Configuration File =====
+=====Central Manager Shared Configuration File=====
-<file autoconf condor_config.local>##  What machine is your central manager?
+<file autoconf condor_config_manager.shared># Which daemons should run?  This essentially defines
-CONDOR_HOST = john.cs.wlu.edu
+# the machine's role in the Condor system.
-##  Where is the local condor directory for each host?
-##  This is where the local config file(s), logs and
-##  spool/execute directories are located
-LOCAL_DIR = /var/lib/condor
-##  Mail parameters:
-##  When something goes wrong with condor at your site, who should get
-##  the email?
-CONDOR_ADMIN = kollerg14@mail.wlu.edu
-##  Full path to a mail delivery program that understands that "-s"
-##  means you want to specify a subject:
-MAIL = /bin/mailx
-##  Network domain parameters:
-##  Internet domain of machines sharing a common UID space.  If your
-##  machines don't share a common UID space, set it to
-##  UID_DOMAIN = $(FULL_HOSTNAME)
-##  to specify that each machine has its own UID space.
-UID_DOMAIN = cs.wlu.edu
-##  Internet domain of machines sharing a common file system.
-##  If your machines don't use a network file system, set it to
-##  FILESYSTEM_DOMAIN = $(FULL_HOSTNAME)
-##  to specify that each machine has its own file system.
-FILESYSTEM_DOMAIN = cs.wlu.edu
-##  The user/group ID <uid>.<gid> of the "Condor" user.
-##  (this can also be specified in the environment)
-##  Note: the CONDOR_IDS setting is ignored on Win32 platforms
-CONDOR_IDS = 201.481
-##  Condor needs to create a few lock files to synchronize access to
-##  various log files.  Because of problems we've had with network
-##  filesystems and file locking over the years, we HIGHLY recommend
-##  that you put these lock files on a local partition on each
-##  machine.  If you don't have your LOCAL_DIR on a local partition,
-##  be sure to change this entry.  Whatever user (or group) condor is
-##  running as needs to have write access to this directory.  If
-##  you're not running as root, this is whatever user you started up
-##  the condor_master as.  If you are running as root, and there's a
-##  condor account, it's probably condor.  Otherwise, it's whatever
-##  you've set in the CONDOR_IDS environment variable.  See the Admin
-##  manual for details on this.
-LOCK = /tmp/condor-lock.$(HOSTNAME)0.0934767702865464
 DAEMON_LIST = COLLECTOR, MASTER, NEGOTIATOR, SCHEDD, STARTD, KBDD
-##  Java parameters:
+##--------------------------------------------------------------------
-##  If you would like this machine to be able to run Java jobs,
+##  condor_collector
-##  then set JAVA to the path of your JVM binary.  If you are not
+##--------------------------------------------------------------------
-##  interested in Java, there is no harm in leaving this entry
+## Address to which Condor will send a weekly e-mail with output of
-##  empty or incorrect.
+## condor_status.
-JAVA = /usr/bin/java
+CONDOR_DEVELOPERS = condor-admin@cs.wisc.edu</file>
-JAVA_MAXHEAP_ARGUMENT = -Xmx1024m
-# Designate which machines are members of this pool.
-PoolMembers = carl.cs.wlu.edu, fred.cs.wlu.edu
-# Allow machines to check the status of Condor
-ALLOW_READ = $(ALLOW_READ), $(PoolMembers)
-# Allow machines to join this pool
-ALLOW_WRITE = $(ALLOW_WRITE), $(PoolMembers)
-FLOCK_FROM = $(PoolMembers)
-# Enable debugging of Class Ads
-LeaseManager.DEBUG_ADS = True</file>
-===== Worker Local Configuration File =====
-<file autoconf condor_config.local>PoolMaster = john.cs.wlu.edu
-CONDOR_DEVELOPERS = NONE
-CONDOR_HOST = $(PoolMaster)
-COLLECTOR_NAME = Orion
-# If job submitter user is listed here, start the job regardless of
-# who might be using the computer at the time.
-IsGreedyUser =  (Owner == "stoughj" \
-                     || Owner == "stough" \
-                     || Owner == "koller" \
-                     || Owner == "gkoller" \
-                     || Owner == "nguyenp" \
-                     || Owner == "davisl")
-START = ( ( (KeyboardIdle > $(StartIdleTime)) \
-                    && ( $(CPUIdle) || \
-                         (State != "Unclaimed" && State != "Owner")) ) \
-              || $(IsGreedyUser) )
-SUSPEND = FALSE
-PREEMPT = FALSE
-KILL = FALSE
+=====Worker Shared Configuration File=====
+<file autoconf condor_config_worker.shared># Which daemons should run?  This essentially defines
+# the machine's role in the Condor system.
 DAEMON_LIST = MASTER, STARTD, KBDD
-NEGOTIATOR_INTERVAL = 20
-TRUST_UID_DOMAIN = TRUE
-# Join the W&L CS Pool (Orion)
+##--------------------------------------------------------------------
-FLOCK_TO = john.cs.wlu.edu
+##  condor_collector
-ALLOW_WRITE = $(ALLOW_WRITE), $(PoolMaster)
+##--------------------------------------------------------------------
+## Address to which Condor will send a weekly e-mail with output of
-# Enable debugging of Class Ads
+## condor_status.
-LeaseManager.DEBUG_ADS = True</file>
+# Don't send weekly statistics emails.
+# The central manager will do that.
+CONDOR_DEVELOPERS = NONE</file>