##########################################################################
# Sample configuration file that enables the HA mechanism on the
# machines running the collector and the negotiator, i.e. the central
# managers.
# Use a different file to configure submission and execution machines.
##########################################################################

# Both of these macros are deprecated, so they are cleared here.
NEGOTIATOR_HOST=
CONDOR_HOST=

#########################################################################
## EVERY PARAMETER IN THE FOLLOWING SECTION MUST BE IDENTICAL ON ALL
## CENTRAL MANAGERS!
#########################################################################

## To keep things simple, one variable is defined per central manager in
## the pool. Only two central managers are defined here, but up to 5 were
## tested, and in theory the number is not bounded.
## Please substitute the hostnames of the central managers in your pool.
CENTRAL_MANAGER1 = cm1.cs.technion.ac.il
CENTRAL_MANAGER2 = cm2.cs.technion.ac.il

## List of all central managers in the pool.
## The hosts above are examples only; change them to the hostnames of
## the central managers in your pool.
COLLECTOR_HOST = $(CENTRAL_MANAGER1),$(CENTRAL_MANAGER2)

## Port number on which condor_had listens on this machine. It should
## match the port number specified for this HAD in HAD_LIST.
## The number itself is arbitrary (just make sure it does not collide
## with other applications); the value below is only a sample.
HAD_PORT = 51450
HAD_ARGS = -p $(HAD_PORT)

## The list below must contain the same addresses, in the same order, as
## COLLECTOR_HOST. In addition, for each hostname it should specify the
## port number of the condor_had daemon running on that host.
## When HAD_USE_PRIMARY is set to true, the first machine in the list is
## the PRIMARY central manager machine.
HAD_LIST = $(CENTRAL_MANAGER1):$(HAD_PORT),$(CENTRAL_MANAGER2):$(HAD_PORT)

## HAD connection time: the period of time it usually takes to establish
## a TCP connection between your central managers. Suggested values:
##    2 - your central managers are on the same subnet
##    5 - you have Condor security enabled
##   10 - your network is very slow, or you want to reduce the
##        sensitivity of the HA daemons to network failures
HAD_CONNECTION_TIMEOUT = 2

## With HAD_USE_PRIMARY=true, the first central manager in HAD_LIST is
## the primary one.
HAD_USE_PRIMARY = true

##--------------------------------------------------------------------
##  Host/IP access levels
##--------------------------------------------------------------------
## See the administrator's manual for details on these settings: what
## they are for and how to use them.

## Which machines have administrative rights for your pool? This
## defaults to your central manager. Set it to the machine(s) where the
## condor administrator(s) work (assuming you trust every user who logs
## into those machine(s), because the access granted is machine-wide).
HOSTALLOW_ADMINISTRATOR = $(COLLECTOR_HOST)

## Negotiator access. The machines listed here are trusted central
## managers. Normally there is no need to change this.
HOSTALLOW_NEGOTIATOR = $(COLLECTOR_HOST)

## With flocking (and HA), the SCHEDD must also trust the other
## negotiators we are flocking with. Normally there is no need to
## change this.
HOSTALLOW_NEGOTIATOR_SCHEDD = $(COLLECTOR_HOST)

###################################################################
## THE PARAMETERS BELOW ARE ALLOWED TO DIFFER FROM ONE CENTRAL
## MANAGER TO ANOTHER
###################################################################

## Location of the HAD executable file
HAD = $(SBIN)/condor_had

## The master should start at least these four daemons
DAEMON_LIST = MASTER, COLLECTOR, NEGOTIATOR, HAD

## DC_DAEMON_LIST should contain at least these four as well
DC_DAEMON_LIST = MASTER, COLLECTOR, NEGOTIATOR, HAD

## Size of the HAD log file
MAX_HAD_LOG = 640000

## HAD debug level
HAD_DEBUG = D_COMMAND

## HAD log file
HAD_LOG = $(LOG)/HADLog