[Swift-commit] cog r3821

swift at ci.uchicago.edu swift at ci.uchicago.edu
Mon Oct 28 14:40:03 CDT 2013


------------------------------------------------------------------------
r3821 | yadunand | 2013-10-28 14:36:24 -0500 (Mon, 28 Oct 2013) | 4 lines


Adding scripts to start coasters and a README for the
tcl examples for starting and using a persistent coaster service

------------------------------------------------------------------------
Index: modules/provider-coaster-c-client/tests/coasters/coaster-service.conf
===================================================================
--- modules/provider-coaster-c-client/tests/coasters/coaster-service.conf	(revision 0)
+++ modules/provider-coaster-c-client/tests/coasters/coaster-service.conf	(revision 3821)
@@ -0,0 +1,43 @@
+# Keep all interesting settings in one place
+# User should modify this to fit environment
+
+# Location of SWIFT. If empty, PATH is referenced
+export SWIFT=/homes/yadunand/swift-trunk/cog/modules/swift/dist/swift-svn/bin/swift
+
+# Where to place/launch worker.pl on the remote machine
+export WORKER_LOCATION=/homes/$USER
+
+# How to launch workers: local, ssh, futuregrid, or cobalt
+export WORKER_MODE=ssh
+export WORKER_USERNAME=$USER
+
+# Worker host names for ssh
+export WORKER_HOSTS="crush.mcs.anl.gov grind.mcs.anl.gov"
+
+# Directory for log files, relative to the working directory from which start-coaster-service is launched
+export LOG_DIR=logs
+
+# Manually define ports. If not specified, ports will be automatically generated
+export LOCAL_PORT=
+export SERVICE_PORT=
+
+# start-coaster-service tries to automatically detect the IP address.
+# Specify it here if auto-detection is not working correctly
+export IPADDR=140.221.8.81
+
+# Gensites values
+export WORK=/sandbox/$USER
+
+# If SHARED_FILESYSTEM is set to no, provider staging will be turned on
+export SHARED_FILESYSTEM=no
+
+# If running outside of the MCS network, set WORKER_RELAY_HOST below
+# export WORKER_RELAY_HOST="login.mcs.anl.gov"
+
+export WORKER_LOGGING_LEVEL=DEBUG
+export WORKER_LOG_DIR="/homes/$USER/logs"
+export JOBSPERNODE="4"
+export JOBTHROTTLE=100
+
+# Set applications here
+#app cat=/bin/cat
Index: modules/provider-coaster-c-client/tests/coasters/sites.xml
===================================================================
--- modules/provider-coaster-c-client/tests/coasters/sites.xml	(revision 0)
+++ modules/provider-coaster-c-client/tests/coasters/sites.xml	(revision 3821)
@@ -0,0 +1,12 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<config xmlns="http://www.ci.uchicago.edu/swift/SwiftSites">
+  <pool handle="persistent-coasters">
+    <execution provider="coaster-persistent" url="http://140.221.8.81:58318" jobmanager="local:local"/>
+    <profile namespace="globus" key="workerManager">passive</profile>
+    <profile namespace="globus" key="jobsPerNode">4</profile>
+    <profile key="jobThrottle" namespace="karajan">100</profile>
+    <profile namespace="karajan" key="initialScore">10000</profile>
+    <filesystem provider="local" url="none" />
+    <workdirectory>/sandbox/yadunand</workdirectory>
+  </pool>
+</config>
Index: modules/provider-coaster-c-client/tests/coasters/start-coaster-service.log
===================================================================
--- modules/provider-coaster-c-client/tests/coasters/start-coaster-service.log	(revision 0)
+++ modules/provider-coaster-c-client/tests/coasters/start-coaster-service.log	(revision 3821)
@@ -0,0 +1,91 @@
+Running /homes/yadunand/swift-trunk/cog/modules/swift/dist/swift-svn/bin/coaster-service -nosec -portfile /tmp/tmp.KmXG9rMorq -localportfile /tmp/tmp.D9N8ytVG6b -passive
+Switching log to: cps-2013-10-28_14-31-16.log
+2013-10-28 14:31:16,524-0500 WARN  CoasterPersistentService Switching log to: cps-2013-10-28_14-31-16.log
+Local contacts: [http://140.221.8.81:56573]
+2013-10-28 14:31:16,602-0500 INFO  Settings Local contacts: [http://140.221.8.81:56573]
+Starting... id=1028-3102160
+2013-10-28 14:31:16,615-0500 INFO  BlockQueueProcessor Starting... id=1028-3102160
+Started local service: http://140.221.8.81:56573
+2013-10-28 14:31:16,615-0500 INFO  CoasterService Started local service: http://140.221.8.81:56573
+Started coaster service: http://140.221.8.81:58318
+2013-10-28 14:31:16,615-0500 INFO  CoasterService Started coaster service: http://140.221.8.81:58318
+Started coaster service: http://140.221.8.81:58318
+Worker connection URL: http://140.221.8.81:56573
+Running ssh yadunand at crush.mcs.anl.gov mkdir -p /homes/yadunand
+Running scp /homes/yadunand/swift-trunk/cog/modules/swift/dist/swift-svn/bin/worker.pl yadunand at crush.mcs.anl.gov:/homes/yadunand
+Running ssh yadunand at crush.mcs.anl.gov WORKER_LOGGING_LEVEL=DEBUG /homes/yadunand/worker.pl http://140.221.8.81:56573 crush.mcs.anl.gov /homes/yadunand/logs
+Running ssh yadunand at grind.mcs.anl.gov mkdir -p /homes/yadunand
+Timeout check started for TCPChannel [type: server, contact: unknown]
+2013-10-28 14:31:18,748-0500 INFO  AbstractCoasterChannel Timeout check started for TCPChannel [type: server, contact: unknown]
+Channel started: TCPChannel [type: server, contact: 140.221.8.62:34285]
+2013-10-28 14:31:18,753-0500 INFO  AbstractTCPChannel Channel started: TCPChannel [type: server, contact: 140.221.8.62:34285]
+Received registration: blockid = crush.mcs.anl.gov, url = crush
+2013-10-28 14:31:18,758-0500 INFO  LocalTCPService Received registration: blockid = crush.mcs.anl.gov, url = crush
+MetaChannel [context: worker-1, boundTo: null] binding to TCPChannel [type: server, contact: 140.221.8.62:34285]
+2013-10-28 14:31:18,780-0500 INFO  MetaChannel MetaChannel [context: worker-1, boundTo: null] binding to TCPChannel [type: server, contact: 140.221.8.62:34285]
+Running scp /homes/yadunand/swift-trunk/cog/modules/swift/dist/swift-svn/bin/worker.pl yadunand at grind.mcs.anl.gov:/homes/yadunand
+2013-10-28 14:31:18,784-0500 DEBUG Cpu worker started: block=crush.mcs.anl.gov host=crush id=0
+2013-10-28 14:31:18,784-0500 DEBUG Cpu ready for work: block=crush.mcs.anl.gov id=0
+Started CPU 0:1382988678s
+2013-10-28 14:31:18,786-0500 INFO  Block Started CPU 0:1382988678s
+Started worker crush.mcs.anl.gov:000000
+2013-10-28 14:31:18,786-0500 INFO  Block Started worker crush.mcs.anl.gov:000000
+2013-10-28 14:31:18,786-0500 DEBUG Cpu requesting work: block=crush.mcs.anl.gov id=0 Cpus sleeping: 1
+Using NIO sender for TCPChannel [type: server, contact: crush.mcs.anl.gov-000000]
+2013-10-28 14:31:18,786-0500 INFO  AbstractStreamCoasterChannel Using NIO sender for TCPChannel [type: server, contact: crush.mcs.anl.gov-000000]
+2013-10-28 14:31:18,787-0500 DEBUG Cpu crush.mcs.anl.gov:0 sleeping
+Handler(tag: 9512, REGISTER) unregistering (send)
+2013-10-28 14:31:18,791-0500 INFO  RequestHandler Handler(tag: 9512, REGISTER) unregistering (send)
+Running ssh yadunand at grind.mcs.anl.gov WORKER_LOGGING_LEVEL=DEBUG /homes/yadunand/worker.pl http://140.221.8.81:56573 grind.mcs.anl.gov /homes/yadunand/logs
+Adjusting buffer size to 8650752 for 2 sockets
+2013-10-28 14:31:19,639-0500 INFO  TCPBufferManager Adjusting buffer size to 8650752 for 2 sockets
+Timeout check started for TCPChannel [type: server, contact: unknown]
+2013-10-28 14:31:19,639-0500 INFO  AbstractCoasterChannel Timeout check started for TCPChannel [type: server, contact: unknown]
+Channel started: TCPChannel [type: server, contact: 140.221.8.74:39025]
+2013-10-28 14:31:19,639-0500 INFO  AbstractTCPChannel Channel started: TCPChannel [type: server, contact: 140.221.8.74:39025]
+Received registration: blockid = grind.mcs.anl.gov, url = grind
+2013-10-28 14:31:19,639-0500 INFO  LocalTCPService Received registration: blockid = grind.mcs.anl.gov, url = grind
+MetaChannel [context: worker-2, boundTo: null] binding to TCPChannel [type: server, contact: 140.221.8.74:39025]
+2013-10-28 14:31:19,640-0500 INFO  MetaChannel MetaChannel [context: worker-2, boundTo: null] binding to TCPChannel [type: server, contact: 140.221.8.74:39025]
+2013-10-28 14:31:19,640-0500 DEBUG Cpu worker started: block=grind.mcs.anl.gov host=grind id=0
+2013-10-28 14:31:19,640-0500 DEBUG Cpu ready for work: block=grind.mcs.anl.gov id=0
+Started CPU 0:1382988679s
+2013-10-28 14:31:19,640-0500 INFO  Block Started CPU 0:1382988679s
+2013-10-28 14:31:19,640-0500 DEBUG Cpu requesting work: block=grind.mcs.anl.gov id=0 Cpus sleeping: 2
+Started worker grind.mcs.anl.gov:000000
+2013-10-28 14:31:19,640-0500 INFO  Block Started worker grind.mcs.anl.gov:000000
+2013-10-28 14:31:19,640-0500 DEBUG Cpu grind.mcs.anl.gov:0 sleeping
+Handler(tag: 932, REGISTER) unregistering (send)
+2013-10-28 14:31:19,640-0500 INFO  RequestHandler Handler(tag: 932, REGISTER) unregistering (send)
+TCPChannel [type: server, contact: crush.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+2013-10-28 14:31:58,230-0500 INFO  HeartBeatCommand TCPChannel [type: server, contact: crush.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+TCPChannel [type: server, contact: grind.mcs.anl.gov-000000] up latency: 0ms, rtt: 2ms
+2013-10-28 14:31:58,540-0500 INFO  HeartBeatCommand TCPChannel [type: server, contact: grind.mcs.anl.gov-000000] up latency: 0ms, rtt: 2ms
+TCPChannel [type: server, contact: crush.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+2013-10-28 14:32:29,185-0500 INFO  HeartBeatCommand TCPChannel [type: server, contact: crush.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+TCPChannel [type: server, contact: grind.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+2013-10-28 14:32:36,733-0500 INFO  HeartBeatCommand TCPChannel [type: server, contact: grind.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+TCPChannel [type: server, contact: crush.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+2013-10-28 14:33:00,143-0500 INFO  HeartBeatCommand TCPChannel [type: server, contact: crush.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+TCPChannel [type: server, contact: grind.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+2013-10-28 14:33:14,927-0500 INFO  HeartBeatCommand TCPChannel [type: server, contact: grind.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+TCPChannel [type: server, contact: crush.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+2013-10-28 14:33:31,101-0500 INFO  HeartBeatCommand TCPChannel [type: server, contact: crush.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+TCPChannel [type: server, contact: grind.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+2013-10-28 14:33:53,121-0500 INFO  HeartBeatCommand TCPChannel [type: server, contact: grind.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+TCPChannel [type: server, contact: crush.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+2013-10-28 14:34:02,059-0500 INFO  HeartBeatCommand TCPChannel [type: server, contact: crush.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+TCPChannel [type: server, contact: grind.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+2013-10-28 14:34:31,315-0500 INFO  HeartBeatCommand TCPChannel [type: server, contact: grind.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+TCPChannel [type: server, contact: crush.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+2013-10-28 14:34:33,017-0500 INFO  HeartBeatCommand TCPChannel [type: server, contact: crush.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+TCPChannel [type: server, contact: crush.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+2013-10-28 14:35:03,976-0500 INFO  HeartBeatCommand TCPChannel [type: server, contact: crush.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+TCPChannel [type: server, contact: grind.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+2013-10-28 14:35:09,509-0500 INFO  HeartBeatCommand TCPChannel [type: server, contact: grind.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+TCPChannel [type: server, contact: crush.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+2013-10-28 14:35:34,933-0500 INFO  HeartBeatCommand TCPChannel [type: server, contact: crush.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+TCPChannel [type: server, contact: grind.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+2013-10-28 14:35:47,703-0500 INFO  HeartBeatCommand TCPChannel [type: server, contact: grind.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+TCPChannel [type: server, contact: crush.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
+2013-10-28 14:36:05,891-0500 INFO  HeartBeatCommand TCPChannel [type: server, contact: crush.mcs.anl.gov-000000] up latency: 0ms, rtt: 1ms
Index: modules/provider-coaster-c-client/tests/coasters/tc.data
===================================================================
--- modules/provider-coaster-c-client/tests/coasters/tc.data	(revision 0)
+++ modules/provider-coaster-c-client/tests/coasters/tc.data	(revision 3821)
@@ -0,0 +1 @@
+persistent-coasters cat /bin/cat null null null
Index: modules/provider-coaster-c-client/tests/tcl/README
===================================================================
--- modules/provider-coaster-c-client/tests/tcl/README	(revision 0)
+++ modules/provider-coaster-c-client/tests/tcl/README	(revision 3821)
@@ -0,0 +1,5 @@
+Run start-coaster-service in the coasters folder to start a coaster service.
+The configuration for coasters is in coaster-service.conf.
+
+In the tcl examples, use the url from the generated sites.xml to connect to
+the coaster service.
\ No newline at end of file



More information about the Swift-commit mailing list