This wiki is obsolete; see the NorduGrid web pages for up-to-date information.

Data stage-in

From NorduGrid
Jump to navigationJump to search

We measure the time it takes to stage in 1, 10 and 30 files (300 MB each) from/to machine A to/from machine B. Stage-in is performed such that the downloader module of the A-REX service (machine A) fetches input data from the GridFTP server running on the submission machine B.

The timing of data staging includes only the time spent on actual data movement (factors such as queuing and various grid layers are excluded).


  • Stage-in job (stagein_job.xml)
<?xml version="1.0" encoding="UTF-8"?>
<!--
  Stage-in job description (JSDL with POSIX and ARC namespace declarations).

  The job named "stagein" runs ./stagein.py, with standard output written to
  out.txt and standard error written to err.txt. Its DataStaging entries list
  one input file fetched from a remote gsiftp:// URL, the stagein.py script
  itself, and the two output files.
-->
<JobDefinition
    xmlns="http://schemas.ggf.org/jsdl/2005/11/jsdl"
    xmlns:posix="http://schemas.ggf.org/jsdl/2005/11/jsdl-posix"
    xmlns:arc="http://www.nordugrid.org/ws/schemas/jsdl-arc">
  <JobDescription>
    <JobIdentification>
      <JobName>stagein</JobName>
    </JobIdentification>
    <Application>
      <posix:POSIXApplication>
        <posix:Executable>./stagein.py</posix:Executable>
        <posix:Output>out.txt</posix:Output>
        <posix:Error>err.txt</posix:Error>
      </posix:POSIXApplication>
    </Application>
    <!-- Input file: the remote transferGSI is staged in under the name transferGSI0. -->
    <DataStaging>
      <FileName>transferGSI0</FileName>
      <Source>
        <!-- Kept on a single line so no indentation whitespace ends up inside the URI value. -->
        <URI>gsiftp://pgs02.grid.upjs.sk:2811/unixacl/transferGSI</URI>
      </Source>
    </DataStaging>
    <!-- The script named by posix:Executable; its source is a relative path rather than a remote URL. -->
    <DataStaging>
      <FileName>stagein.py</FileName>
      <Source>
        <URI>stagein.py</URI>
      </Source>
    </DataStaging>
    <!-- NOTE(review): out.txt and err.txt are declared with neither Source nor Target;
         presumably this keeps them available for retrieval after the job finishes.
         Confirm against the ARC JSDL documentation. -->
    <DataStaging>
      <FileName>out.txt</FileName>
    </DataStaging>
    <DataStaging>
      <FileName>err.txt</FileName>
    </DataStaging>
  </JobDescription>
</JobDefinition>