LinuxApplication: making single deploy.sh script out of http_sources.sh, build.sh...

[nepi.git] / src / nepi / resources / linux / application.py
diff --git a/src/nepi/resources/linux/application.py b/src/nepi/resources/linux/application.py

index 080c3a4..506285a 100644 (file)
--- a/src/nepi/resources/linux/application.py
+++ b/src/nepi/resources/linux/application.py
@@ -19,28 +19,82 @@
  
  from nepi.execution.attribute import Attribute, Flags, Types
  from nepi.execution.trace import Trace, TraceAttr
-from nepi.execution.resource import ResourceManager, clsinit, ResourceState
+from nepi.execution.resource import ResourceManager, clsinit, ResourceState, \
+    reschedule_delay
  from nepi.resources.linux.node import LinuxNode
-from nepi.util import sshfuncs 
-from nepi.util.timefuncs import strfnow, strfdiff
+from nepi.util.sshfuncs import ProcStatus
+from nepi.util.timefuncs import tnow, tdiffsec
  
  import os
-
-reschedule_delay = "0.5s"
-state_check_delay = 1
+import subprocess
  
  # TODO: Resolve wildcards in commands!!
-# TODO: If command is not set give a warning but do not generate an error!
+# TODO: During provisioning, everything that is not scp could be
+#       uploaded to a same script, http_sources download, etc...
+#       and like that require performing less ssh connections!!!
+# TODO: Make stdin be a symlink to the original file in ${SHARE}
+#       - later use md5sum to check whether the file needs to be re-uploaded
+
  
  @clsinit
  class LinuxApplication(ResourceManager):
+    """
+    .. class:: Class Args :
+      
+        :param ec: The Experiment controller
+        :type ec: ExperimentController
+        :param guid: guid of the RM
+        :type guid: int
+
+    .. note::
+
+    A LinuxApplication RM represents a process that can be executed in
+    a remote Linux host using SSH.
+
+    The LinuxApplication RM takes care of uploading sources and any files
+    needed to run the experiment, to the remote host. 
+    It also allows to provide source compilation (build) and installation 
+    instructions, and takes care of automating the sources build and 
+    installation tasks for the user.
+
+    It is important to note that files uploaded to the remote host have
+    two possible scopes: single-experiment or multi-experiment.
+    Single experiment files are those that will not be re-used by other 
+    experiments. Multi-experiment files are those that will.
+    Sources and shared files are always made available to all experiments.
+
+    Directory structure:
+
+    The directory structure used by LinuxApplication RM at the Linux
+    host is the following:
+
+        ${HOME}/nepi-usr --> Base directory for multi-experiment files
+                      |
+        ${LIB}        |- /lib --> Base directory for libraries
+        ${BIN}        |- /bin --> Base directory for binary files
+        ${SRC}        |- /src --> Base directory for sources
+        ${SHARE}      |- /share --> Base directory for other files
+
+        ${HOME}/nepi-exp --> Base directory for single-experiment files
+                      |
+        ${EXP_HOME}   |- /<exp-id>  --> Base directory for experiment exp-id
+                          |
+        ${APP_HOME}       |- /<app-guid> --> Base directory for application 
+                               |     specific files (e.g. command.sh, input)
+                               | 
+        ${RUN_HOME}            |- /<run-id> --> Base directory for run specific
+
+    """
+
      _rtype = "LinuxApplication"
  
      @classmethod
      def _register_attributes(cls):
-        command = Attribute("command", "Command to execute", 
+        command = Attribute("command", "Command to execute at application start. "
+                "Note that commands will be executed in the ${RUN_HOME} directory, "
+                "make sure to take this into account when using relative paths. ", 
                  flags = Flags.ExecReadOnly)
-        forward_x11 = Attribute("forwardX11", " Enables X11 forwarding for SSH connections", 
+        forward_x11 = Attribute("forwardX11", "Enables X11 forwarding for SSH connections", 
                  flags = Flags.ExecReadOnly)
          env = Attribute("env", "Environment variables string for command execution",
                  flags = Flags.ExecReadOnly)
@@ -50,40 +104,48 @@ class LinuxApplication(ResourceManager):
                  "Space-separated list of packages required to run the application",
                  flags = Flags.ExecReadOnly)
          sources = Attribute("sources", 
-                "Space-separated list of regular files to be deployed in the working "
-                "path prior to building. Archives won't be expanded automatically.",
+                "Space-separated list of regular files to be uploaded to ${SRC} "
+                "directory prior to building. Archives won't be expanded automatically. "
+                "Sources are globally available for all experiments unless "
+                "cleanHome is set to True (This will delete all sources). ",
+                flags = Flags.ExecReadOnly)
+        files = Attribute("files", 
+                "Space-separated list of regular miscellaneous files to be uploaded "
+                "to ${SHARE} directory. "
+                "Files are globally available for all experiments unless "
+                "cleanHome is set to True (This will delete all files). ",
+                flags = Flags.ExecReadOnly)
+        libs = Attribute("libs", 
+                "Space-separated list of libraries (e.g. .so files) to be uploaded "
+                "to ${LIB} directory. "
+                "Libraries are globally available for all experiments unless "
+                "cleanHome is set to True (This will delete all files). ",
+                flags = Flags.ExecReadOnly)
+        bins = Attribute("bins", 
+                "Space-separated list of binary files to be uploaded "
+                "to ${BIN} directory. "
+                "Binaries are globally available for all experiments unless "
+                "cleanHome is set to True (This will delete all files). ",
                  flags = Flags.ExecReadOnly)
          code = Attribute("code", 
-                "Plain text source code to be uploaded to the server. It will be stored "
-                "under ${SOURCES}/code",
+                "Plain text source code to be uploaded to the ${APP_HOME} directory. ",
                  flags = Flags.ExecReadOnly)
          build = Attribute("build", 
                  "Build commands to execute after deploying the sources. "
-                "Sources will be in the ${SOURCES} folder. "
-                "Example: tar xzf ${SOURCES}/my-app.tgz && cd my-app && ./configure && make && make clean.\n"
-                "Try to make the commands return with a nonzero exit code on error.\n"
-                "Also, do not install any programs here, use the 'install' attribute. This will "
-                "help keep the built files constrained to the build folder (which may "
-                "not be the home folder), and will result in faster deployment. Also, "
-                "make sure to clean up temporary files, to reduce bandwidth usage between "
-                "nodes when transferring built packages.",
+                "Sources are uploaded to the ${SRC} directory and code "
+                "is uploaded to the ${APP_HOME} directory. \n"
+                "Usage example: tar xzf ${SRC}/my-app.tgz && cd my-app && "
+                "./configure && make && make clean.\n"
+                "Make sure to make the build commands return with a nonzero exit "
+                "code on error.",
                  flags = Flags.ReadOnly)
          install = Attribute("install", 
                  "Commands to transfer built files to their final destinations. "
-                "Sources will be in the initial working folder, and a special "
-                "tag ${SOURCES} can be used to reference the experiment's "
-                "home folder (where the application commands will run).\n"
-                "ALL sources and targets needed for execution must be copied there, "
-                "if building has been enabled.\n"
-                "That is, 'slave' nodes will not automatically get any source files. "
-                "'slave' nodes don't get build dependencies either, so if you need "
-                "make and other tools to install, be sure to provide them as "
-                "actual dependencies instead.",
+                "Install commands are executed after build commands. ",
                  flags = Flags.ReadOnly)
-        stdin = Attribute("stdin", "Standard input", flags = Flags.ExecReadOnly)
-        stdout = Attribute("stdout", "Standard output", flags = Flags.ExecReadOnly)
-        stderr = Attribute("stderr", "Standard error", flags = Flags.ExecReadOnly)
-        tear_down = Attribute("tearDown", "Bash script to be executed before "
+        stdin = Attribute("stdin", "Standard input for the 'command'", 
+                flags = Flags.ExecReadOnly)
+        tear_down = Attribute("tearDown", "Command to be executed just before " 
                  "releasing the resource", 
                  flags = Flags.ReadOnly)
  
@@ -94,32 +156,36 @@ class LinuxApplication(ResourceManager):
          cls._register_attribute(depends)
          cls._register_attribute(sources)
          cls._register_attribute(code)
+        cls._register_attribute(files)
+        cls._register_attribute(bins)
+        cls._register_attribute(libs)
          cls._register_attribute(build)
          cls._register_attribute(install)
          cls._register_attribute(stdin)
-        cls._register_attribute(stdout)
-        cls._register_attribute(stderr)
          cls._register_attribute(tear_down)
  
      @classmethod
      def _register_traces(cls):
          stdout = Trace("stdout", "Standard output stream")
          stderr = Trace("stderr", "Standard error stream")
-        buildlog = Trace("buildlog", "Output of the build process")
  
          cls._register_trace(stdout)
          cls._register_trace(stderr)
-        cls._register_trace(buildlog)
  
      def __init__(self, ec, guid):
          super(LinuxApplication, self).__init__(ec, guid)
          self._pid = None
          self._ppid = None
          self._home = "app-%s" % self.guid
+        self._in_foreground = False
+
+        # keep a reference to the running process handler when 
+        # the command is not executed as remote daemon in background
+        self._proc = None
  
          # timestamp of last state check of the application
-        self._last_state_check = strfnow()
-    
+        self._last_state_check = tnow()
+
      def log_message(self, msg):
          return " guid %d - host %s - %s " % (self.guid, 
                  self.node.get("hostname"), msg)
@@ -135,12 +201,8 @@ class LinuxApplication(ResourceManager):
          return os.path.join(self.node.exp_home, self._home)
  
      @property
-    def src_dir(self):
-        return os.path.join(self.app_home, 'src')
-
-    @property
-    def build_dir(self):
-        return os.path.join(self.app_home, 'build')
+    def run_home(self):
+        return os.path.join(self.app_home, self.ec.run_id)
  
      @property
      def pid(self):
@@ -150,10 +212,23 @@ class LinuxApplication(ResourceManager):
      def ppid(self):
          return self._ppid
  
+    @property
+    def in_foreground(self):
+        """ Returns True if the command needs to be executed in foreground.
+        This means that command will be executed using 'execute' instead of
+        'run' ('run' executes a command in background and detached from the 
+        terminal)
+        
+        When using X11 forwarding option, the command can not run in background
+        and detached from a terminal, since we need to keep the terminal attached 
+        to interact with it.
+        """
+        return self.get("forwardX11") or self._in_foreground
+
      def trace(self, name, attr = TraceAttr.ALL, block = 512, offset = 0):
          self.info("Retrieving '%s' trace %s " % (name, attr))
  
-        path = os.path.join(self.app_home, name)
+        path = os.path.join(self.run_home, name)
          
          command = "(test -f %s && echo 'success') || echo 'error'" % path
          (out, err), proc = self.node.execute(command)
@@ -167,7 +242,7 @@ class LinuxApplication(ResourceManager):
              return path
  
          if attr == TraceAttr.ALL:
-            (out, err), proc = self.node.check_output(self.app_home, name)
+            (out, err), proc = self.node.check_output(self.run_home, name)
              
              if err and proc.poll():
                  msg = " Couldn't read trace %s " % name
@@ -194,135 +269,193 @@ class LinuxApplication(ResourceManager):
          return out
              
      def provision(self):
-        # create home dir for application
-        self.node.mkdir(self.app_home)
-
-        # upload sources
-        self.upload_sources()
-
-        # upload code
-        self.upload_code()
-
-        # upload stdin
-        self.upload_stdin()
+        # create run dir for application
+        self.node.mkdir(self.run_home)
+   
+        # List of all the provision methods to invoke
+        steps = [
+            # upload sources
+            self.upload_sources,
+            # upload files
+            self.upload_files,
+            # upload binaries
+            self.upload_binaries,
+            # upload libraries
+            self.upload_libraries,
+            # upload code
+            self.upload_code,
+            # upload stdin
+            self.upload_stdin,
+            # install dependencies
+            self.install_dependencies,
+            # build
+            self.build,
+            # Install
+            self.install]
+
+        command = []
+
+        # Since provisioning takes a long time, before
+        # each step we check that the EC is still running
+        for step in steps:
+            if self.ec.finished:
+                raise RuntimeError, "EC finished"
+            
+            ret = step()
+            if ret:
+                command.append(ret)
  
-        # install dependencies
-        self.install_dependencies()
+        # upload deploy script
+        deploy_command = ";".join(command)
+        self.execute_deploy_command(deploy_command)
  
-        # build
-        self.build()
+        # upload start script
+        self.upload_start_command()
+       
+        self.info("Provisioning finished")
  
-        # Install
-        self.install()
+        super(LinuxApplication, self).provision()
  
+    def upload_start_command(self):
+        # Upload command to remote bash script
+        # - only if command can be executed in background and detached
          command = self.get("command")
-        x11 = self.get("forwardX11")
-        if not x11 and command:
-            self.info("Uploading command '%s'" % command)
-
-            # Export environment
-            environ = ""
-            if self.get("env"):
-                for var in self.get("env").split(" "):
-                    environ += 'export %s\n' % var
  
-            command = environ + command
+        if command and not self.in_foreground:
+            self.info("Uploading command '%s'" % command)
  
-            # If the command runs asynchronous, pre upload the command 
-            # to the app.sh file in the remote host
-            dst = os.path.join(self.app_home, "app.sh")
+            # replace application specific paths in the command
              command = self.replace_paths(command)
-            self.node.upload(command, dst, text = True)
-
-        super(LinuxApplication, self).provision()
+            
+            # replace application specific paths in the environment
+            env = self.get("env")
+            env = env and self.replace_paths(env)
+
+            shfile = os.path.join(self.app_home, "start.sh")
+
+            self.node.upload_command(command, 
+                    shfile = shfile,
+                    env = env)
+
+    def execute_deploy_command(self, command):
+        if command:
+            # Upload the command to a bash script and run it
+            # in background ( but wait until the command has
+            # finished to continue )
+            shfile = os.path.join(self.app_home, "deploy.sh")
+            self.node.run_and_wait(command, self.run_home,
+                    shfile = shfile, 
+                    overwrite = False,
+                    pidfile = "deploy_pidfile", 
+                    ecodefile = "deploy_exitcode", 
+                    stdout = "deploy_stdout", 
+                    stderr = "deploy_stderr")
  
      def upload_sources(self):
-        # TODO: check if sources need to be uploaded and upload them
          sources = self.get("sources")
-        if sources:
-            self.info(" Uploading sources ")
+   
+        command = ""
  
-            # create dir for sources
-            self.node.mkdir(self.src_dir)
+        if sources:
+            self.info("Uploading sources ")
  
              sources = sources.split(' ')
  
-            http_sources = list()
+            # Separate sources that should be downloaded from 
+            # the web, from sources that should be uploaded from
+            # the local machine
+            command = []
              for source in list(sources):
                  if source.startswith("http") or source.startswith("https"):
-                    http_sources.append(source)
+                    # remove the http source from the sources list
                      sources.remove(source)
  
-            # Download http sources
-            if http_sources:
-                cmd = " wget -c --directory-prefix=${SOURCES} "
-                verif = ""
-
-                for source in http_sources:
-                    cmd += " %s " % (source)
-                    verif += " ls ${SOURCES}/%s ;" % os.path.basename(source)
-                
-                # Wget output goes to stderr :S
-                cmd += " 2> /dev/null ; "
-
-                # Add verification
-                cmd += " %s " % verif
-
-                # Upload the command to a file, and execute asynchronously
-                self.upload_and_run(cmd, 
-                        "http_sources.sh", "http_sources_pid", 
-                        "http_sources_out", "http_sources_err")
+                    command.append( " ( " 
+                            # Check if the source already exists
+                            " ls ${SRC}/%(basename)s "
+                            " || ( "
+                            # If source doesn't exist, download it and check
+                            # that it was downloaded ok
+                            "   wget -c --directory-prefix=${SRC} %(source)s && "
+                            "   ls ${SRC}/%(basename)s "
+                            " ) ) " % {
+                                "basename": os.path.basename(source),
+                                "source": source
+                                })
+
+            command = " && ".join(command)
+
+            # replace application specific paths in the command
+            command = self.replace_paths(command)
+       
              if sources:
-                self.node.upload(sources, self.src_dir)
+                sources = ' '.join(sources)
+                self.node.upload(sources, self.node.src_dir, overwrite = False)
+
+        return command
+
+    def upload_files(self):
+        """ Uploads the files listed in the 'files' attribute to the node share_dir """
+        files = self.get("files")
+        if files:
+            self.info("Uploading files %s " % files)
+            self.node.upload(files, self.node.share_dir, overwrite = False)
+
+    def upload_libraries(self):
+        """ Uploads the files listed in the 'libs' attribute to the node lib_dir """
+        libs = self.get("libs")
+        if libs:
+            self.info("Uploading libraries %s " % libs)
+            self.node.upload(libs, self.node.lib_dir, overwrite = False)
+
+    def upload_binaries(self):
+        """ Uploads the files listed in the 'bins' attribute to the node bin_dir """
+        bins = self.get("bins")
+        if bins:
+            self.info("Uploading binaries %s " % bins)
+            self.node.upload(bins, self.node.bin_dir, overwrite = False)
  
      def upload_code(self):
          code = self.get("code")
-        if code:
-            # create dir for sources
-            self.node.mkdir(self.src_dir)
  
-            self.info(" Uploading code ")
+        if code:
+            self.info("Uploading code")
  
-            dst = os.path.join(self.src_dir, "code")
-            self.node.upload(sources, dst, text = True)
+            dst = os.path.join(self.app_home, "code")
+            self.node.upload(code, dst, overwrite = False, text = True)
  
      def upload_stdin(self):
          stdin = self.get("stdin")
          if stdin:
              # create dir for sources
-            self.info(" Uploading stdin ")
-
+            self.info("Uploading stdin")
+            
              dst = os.path.join(self.app_home, "stdin")
-            self.node.upload(stdin, dst, text = True)
+            self.node.upload(stdin, dst, overwrite = False, text = True)
  
      def install_dependencies(self):
          depends = self.get("depends")
          if depends:
-            self.info(" Installing dependencies %s" % depends)
-            self.node.install_packages(depends, home = self.app_home)
+            self.info("Installing dependencies %s" % depends)
+            self.node.install_packages(depends, self.app_home, self.run_home)
  
      def build(self):
          build = self.get("build")
+
          if build:
-            self.info(" Building sources ")
+            self.info("Building sources ")
              
-            # create dir for build
-            self.node.mkdir(self.build_dir)
-
-            # Upload the command to a file, and execute asynchronously
-            self.upload_and_run(build, 
-                    "build.sh", "build_pid", 
-                    "build_out", "build_err")
- 
+            # replace application specific paths in the command
+            return self.replace_paths(build)
+
      def install(self):
          install = self.get("install")
+
          if install:
-            self.info(" Installing sources ")
+            self.info("Installing sources ")
  
-            # Upload the command to a file, and execute asynchronously
-            self.upload_and_run(install, 
-                    "install.sh", "install_pid", 
-                    "install_out", "install_err")
+            # replace application specific paths in the command
+            return self.replace_paths(install)
  
      def deploy(self):
          # Wait until node is associated and deployed
@@ -337,107 +470,141 @@ class LinuxApplication(ResourceManager):
                  self.discover()
                  self.provision()
              except:
-                self._state = ResourceState.FAILED
+                self.fail()
                  raise
  
              super(LinuxApplication, self).deploy()
  
      def start(self):
-        command = self.get('command')
-        env = self.get('env')
-        stdin = 'stdin' if self.get('stdin') else None
-        stdout = 'stdout' if self.get('stdout') else 'stdout'
-        stderr = 'stderr' if self.get('stderr') else 'stderr'
-        sudo = self.get('sudo') or False
-        x11 = self.get('forwardX11') or False
-        failed = False
+        command = self.get("command")
  
-        super(LinuxApplication, self).start()
+        self.info("Starting command '%s'" % command)
  
          if not command:
-            self.info("No command to start ")
+            # If no command was given (i.e. Application was used for dependency
+            # installation), then the application is directly marked as FINISHED
              self._state = ResourceState.FINISHED
-            return 
-    
-        self.info("Starting command '%s'" % command)
+        else:
  
-        if x11:
-            if env:
-                # Export environment
-                environ = ""
-                for var in env.split(" "):
-                    environ += ' %s ' % var
+            if self.in_foreground:
+                self._start_in_foreground()
+            else:
+                self._start_in_background()
  
-                command = "(" + environ + " ; " + command + ")"
-                command = self.replace_paths(command)
+            super(LinuxApplication, self).start()
  
-            # If the command requires X11 forwarding, we
-            # can't run it asynchronously
-            (out, err), proc = self.node.execute(command,
-                    sudo = sudo,
-                    stdin = stdin,
-                    forward_x11 = x11)
+    def _start_in_foreground(self):
+        """ Launches the command attached to the terminal, via node 'execute' """
+        command = self.get("command")
+        sudo = self.get("sudo") or False
+        x11 = self.get("forwardX11")
  
-            self._state = ResourceState.FINISHED
+        # For a command being executed in foreground, if there is stdin,
+        # it is expected to be text string not a file or pipe
+        stdin = self.get("stdin") or None
+
+        # Export environment
+        env = self.get("env")
+        environ = self.node.format_environment(env, inline = True)
+        command = environ + command
+        command = self.replace_paths(command)
+
+        # We save the reference to the process in self._proc
+        # to be able to kill the process from the stop method.
+        # We also set blocking = False, since we don't want the
+        # thread to block until the execution finishes.
+        (out, err), self._proc = self.node.execute(command,
+                sudo = sudo,
+                stdin = stdin,
+                forward_x11 = x11,
+                blocking = False)
+
+        # A non-zero exit code at this point means the command failed to start
+        msg = " Failed to start command '%s' " % self.get("command")
+        if self._proc.poll():
+            self.fail()
+            self.error(msg, out, err)
+            raise RuntimeError, msg
  
-            if proc.poll() and err:
-                failed = True
-        else:
-            # Command was  previously uploaded, now run the remote
-            # bash file asynchronously
-            cmd = "bash ./app.sh"
-            (out, err), proc = self.node.run(cmd, self.app_home, 
-                stdin = stdin, 
-                stdout = stdout,
-                stderr = stderr,
-                sudo = sudo)
-
-            if proc.poll() and err:
-                failed = True
+    def _start_in_background(self):
+        command = self.get("command")
+        env = self.get("env")
+        sudo = self.get("sudo") or False
+
+        stdout = "stdout"
+        stderr = "stderr"
+        stdin = os.path.join(self.app_home, "stdin") if self.get("stdin") \
+                else None
+
+        # Command will be run as a daemon in background and detached from any
+        # terminal.
+        # The command to run was previously uploaded to a bash script
+        # during deployment, now we launch the remote script using 'run'
+        # method from the node.
+        cmd = "bash %s" % os.path.join(self.app_home, "start.sh")
+        (out, err), proc = self.node.run(cmd, self.run_home, 
+            stdin = stdin, 
+            stdout = stdout,
+            stderr = stderr,
+            sudo = sudo)
+
+        # check if execution errors occurred
+        msg = " Failed to start command '%s' " % command
          
-            if not failed:
-                pid, ppid = self.node.wait_pid(home = self.app_home)
-                if pid: self._pid = int(pid)
-                if ppid: self._ppid = int(ppid)
-
-            if not self.pid or not self.ppid:
-                failed = True
- 
-            (out, chkerr), proc = self.node.check_output(self.app_home, 'stderr')
-
-            if failed or out or chkerr:
-                # check if execution errors occurred
+        if proc.poll():
+            self.fail()
+            self.error(msg, out, err)
+            raise RuntimeError, msg
+    
+        # Wait for pid file to be generated
+        pid, ppid = self.node.wait_pid(self.run_home)
+        if pid: self._pid = int(pid)
+        if ppid: self._ppid = int(ppid)
+
+        # If the process is not running, check for error information
+        # on the remote machine
+        if not self.pid or not self.ppid:
+            (out, err), proc = self.node.check_errors(self.run_home,
+                    stderr = stderr) 
+
+            # Out is what was written in the stderr file
+            if err:
+                self.fail()
                  msg = " Failed to start command '%s' " % command
-                out = out
-                if err:
-                    err = err
-                elif chkerr:
-                    err = chkerr
-
                  self.error(msg, out, err)
-
-                msg2 = " Setting state to Failed"
-                self.debug(msg2)
-                self._state = ResourceState.FAILED
-
                  raise RuntimeError, msg
-
+        
      def stop(self):
+        """ Stops application execution
+        """
          command = self.get('command') or ''
-        state = self.state
-        
-        if state == ResourceState.STARTED:
-            self.info("Stopping command '%s'" % command)
  
-            (out, err), proc = self.node.kill(self.pid, self.ppid)
+        if self.state == ResourceState.STARTED:
+            stopped = True
  
-            if out or err:
-                # check if execution errors occurred
-                msg = " Failed to STOP command '%s' " % self.get("command")
-                self.error(msg, out, err)
-                self._state = ResourceState.FAILED
-                stopped = False
+            self.info("Stopping command '%s'" % command)
+        
+            # If the command is running in foreground (it was launched using
+            # the node 'execute' method), then we use the handler to the Popen
+            # process to kill it. Else we send a kill signal using the pid and ppid
+            # retrieved after running the command with the node 'run' method
+
+            if self._proc:
+                self._proc.kill()
              else:
+                # Only try to kill the process if the pid and ppid
+                # were retrieved
+                if self.pid and self.ppid:
+                    (out, err), proc = self.node.kill(self.pid, self.ppid)
+
+                    if out or err:
+                        # check if execution errors occurred
+                        msg = " Failed to STOP command '%s' " % self.get("command")
+                        self.error(msg, out, err)
+                        self.fail()
+                        stopped = False
+
+            if stopped:
                  super(LinuxApplication, self).stop()
  
      def release(self):
@@ -448,72 +615,78 @@ class LinuxApplication(ResourceManager):
              self.node.execute(tear_down)
  
          self.stop()
+
          if self.state == ResourceState.STOPPED:
              super(LinuxApplication, self).release()
      
      @property
      def state(self):
+        """ Returns the state of the application
+        """
          if self._state == ResourceState.STARTED:
-            # To avoid overwhelming the remote hosts and the local processor
-            # with too many ssh queries, the state is only requested
-            # every 'state_check_delay' .
-            if strfdiff(strfnow(), self._last_state_check) > state_check_delay:
-                # check if execution errors occurred
-                (out, err), proc = self.node.check_output(self.app_home, 'stderr')
-
-                if out or err:
-                    if err.find("No such file or directory") >= 0 :
-                        # The resource is marked as started, but the
-                        # command was not yet executed
-                        return ResourceState.READY
-
+            if self.in_foreground:
+                # Check if the process we used to execute the command
+                # is still running ...
+                retcode = self._proc.poll()
+
+                # retcode == None -> running
+                # retcode != 0 -> error (a negative value means killed by a signal)
+                # retcode == 0 -> finished
+                if retcode:
+                    out = ""
                      msg = " Failed to execute command '%s'" % self.get("command")
+                    err = self._proc.stderr.read()
                      self.error(msg, out, err)
-                    self._state = ResourceState.FAILED
-
-                elif self.pid and self.ppid:
-                    status = self.node.status(self.pid, self.ppid)
-
-                    if status == sshfuncs.FINISHED:
-                        self._state = ResourceState.FINISHED
+                    self.fail()
+                elif retcode == 0:
+                    self._state = ResourceState.FINISHED
  
-
-                self._last_state_check = strfnow()
+            else:
+                # We need to query the status of the command we launched in 
+                # background. In order to avoid overwhelming the remote host and
+                # the local processor with too many ssh queries, the state is only
+                # requested every 'state_check_delay' seconds.
+                state_check_delay = 0.5
+                if tdiffsec(tnow(), self._last_state_check) > state_check_delay:
+                    # check if execution errors occurred
+                    (out, err), proc = self.node.check_errors(self.run_home)
+
+                    if err:
+                        msg = " Failed to execute command '%s'" % self.get("command")
+                        self.error(msg, out, err)
+                        self.fail()
+
+                    elif self.pid and self.ppid:
+                        # No execution errors occurred. Make sure the background
+                        # process with the recorded pid is still running.
+                        status = self.node.status(self.pid, self.ppid)
+
+                        if status == ProcStatus.FINISHED:
+                            self._state = ResourceState.FINISHED
+
+                    self._last_state_check = tnow()
  
          return self._state
  
-    def upload_and_run(self, cmd, fname, pidfile, outfile, errfile):
-        dst = os.path.join(self.app_home, fname)
-        cmd = self.replace_paths(cmd)
-        self.node.upload(cmd, dst, text = True)
-
-        cmd = "bash ./%s" % fname
-        (out, err), proc = self.node.run_and_wait(cmd, self.app_home,
-            pidfile = pidfile,
-            stdout = outfile, 
-            stderr = errfile, 
-            raise_on_error = True)
-
      def replace_paths(self, command):
          """
          Replace all special path tags with shell-escaped actual paths.
          """
-        def absolute_dir(d):
-            return d if d.startswith("/") else os.path.join("${HOME}", d)
-
          return ( command
-            .replace("${SOURCES}", absolute_dir(self.src_dir))
-            .replace("${BUILD}", absolute_dir(self.build_dir))
-            .replace("${APP_HOME}", absolute_dir(self.app_home))
-            .replace("${NODE_HOME}", absolute_dir(self.node.node_home))
-            .replace("${EXP_HOME}", absolute_dir(self.node.exp_home) )
+            .replace("${USR}", self.node.usr_dir)
+            .replace("${LIB}", self.node.lib_dir)
+            .replace("${BIN}", self.node.bin_dir)
+            .replace("${SRC}", self.node.src_dir)
+            .replace("${SHARE}", self.node.share_dir)
+            .replace("${EXP}", self.node.exp_dir)
+            .replace("${EXP_HOME}", self.node.exp_home)
+            .replace("${APP_HOME}", self.app_home)
+            .replace("${RUN_HOME}", self.run_home)
+            .replace("${NODE_HOME}", self.node.node_home)
+            .replace("${HOME}", self.node.home_dir)
              )
-        
+
      def valid_connection(self, guid):
          # TODO: Validate!
          return True
-        # XXX: What if it is connected to more than one node?
-        resources = self.find_resources(exact_tags = [tags.NODE])
-        self._node = resources[0] if len(resources) == 1 else None
-        return self._node