Project

General

Profile

« Previous | Next » 

Revision 57413

Introduced a distcp workflow to synchronise data from the DM cluster to the IIS cluster.

View differences:

modules/dnet-openaireplus-workflows/trunk/src/main/resources/eu/dnetlib/test/profiles/openaireplus/workflows/hbase/distcp.xml
1
<RESOURCE_PROFILE xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
2
    <!-- Profile header: identity and classification of this workflow resource. -->
    <HEADER>
3
        <!-- The suffix after '_' is the Base64 encoding of "WorkflowDSResources/WorkflowDSResourceType",
             i.e. RESOURCE_KIND/RESOURCE_TYPE as declared below. -->
        <RESOURCE_IDENTIFIER value="37a026fd-8707-4390-9d8c-b1566d2a1e3f_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/>
4
        <RESOURCE_TYPE value="WorkflowDSResourceType"/>
5
        <RESOURCE_KIND value="WorkflowDSResources"/>
6
        <!-- Left empty in this profile. NOTE(review): presumably filled in at registration time; confirm. -->
        <RESOURCE_URI value=""/>
7
        <DATE_OF_CREATION value="2019-10-17T08:44:46+00:00"/>
8
    </HEADER>
9
    <BODY>
10
        <WORKFLOW_NAME>distcp</WORKFLOW_NAME>
11
        <WORKFLOW_TYPE>Export InfoSpace</WORKFLOW_TYPE>
12
        <WORKFLOW_PRIORITY>30</WORKFLOW_PRIORITY>
13
        <CONFIGURATION start="manual">
14

  
15
            <!-- Start node (isStart="true"): declares the parameter named 'sourcePath' and hands over to the
                 'distcp' node. NOTE(review): presumably SetEnvParameter stores parameterValue in the workflow
                 environment under parameterName; confirm against the node implementation. -->
            <NODE isStart="true" name="setSourcePath" type="SetEnvParameter">
16
                <DESCRIPTION>Set the source path on HDFS (DM)</DESCRIPTION>
17
                <PARAMETERS>
18
                    <PARAM managedBy="system" name="parameterName" required="true" type="string">sourcePath</PARAM>
19
                    <!-- User-managed value. NOTE(review): the default is a dated export path (2019.08.17),
                         so it presumably has to be updated before each run; confirm. -->
                    <PARAM managedBy="user" name="parameterValue" required="true" type="string">/tmp/db_openaireplus_services_beta.export.2019.08.17</PARAM>
20
                </PARAMETERS>
21
                <ARCS>
22
                    <ARC to="distcp"/>
23
                </ARCS>
24
            </NODE>
25
            <!-- Second start node (isStart="true"): declares the parameter named 'targetPath' and, like
                 'setSourcePath', has a single arc to the 'distcp' node. -->
            <NODE isStart="true" name="setTargetPath" type="SetEnvParameter">
26
                <DESCRIPTION>Set the target path on HDFS (IIS)</DESCRIPTION>
27
                <PARAMETERS>
28
                    <PARAM managedBy="system" name="parameterName" required="true" type="string">targetPath</PARAM>
29
                    <!-- User-managed value; the default target is /tmp. -->
                    <PARAM managedBy="user" name="parameterValue" required="true" type="string">/tmp</PARAM>
30
                </PARAMETERS>
31
                <ARCS>
32
                    <ARC to="distcp"/>
33
                </ARCS>
34
            </NODE>
35
            <!-- Join node (isJoin="true"): both start nodes ('setSourcePath' and 'setTargetPath') arc here.
                 It is of type SubmitHadoopJob and names 'distcpJob' as the job and 'IIS' as the cluster.
                 NOTE(review): presumably the engine waits for both incoming arcs before running; confirm. -->
            <NODE isJoin="true" name="distcp" type="SubmitHadoopJob">
36
                <DESCRIPTION>distcp</DESCRIPTION>
37
                <PARAMETERS>
38
                    <PARAM managedBy="system" name="hadoopJob" required="true" type="string">distcpJob</PARAM>
39
                    <PARAM managedBy="system" name="cluster" required="true" type="string">IIS</PARAM>
                    <!-- The names 'sourcePath' and 'targetPath' match the parameterName values declared by the
                         two start nodes. NOTE(review): presumably each entry maps a job parameter name (key)
                         to the workflow env attribute that supplies its value; confirm. -->
40
                    <PARAM managedBy="system" name="envParams" required="true" type="string">
41
                        {
42
                        'sourcePath' : 'sourcePath',
43
                        'targetPath' : 'targetPath'
44
                        }
45
                    </PARAM>
46
                    <!-- User-managed flag, false by default. NOTE(review): exact effect of simulation=true
                         is not visible here; confirm before relying on it. -->
                    <PARAM managedBy="user" name="simulation" required="true" type="boolean">false</PARAM>
47
                    <!-- NOTE(review): presumably a comma-separated list of Oozie action names whose report
                         is collected; only 'build-report' is listed. TODO confirm. -->
                    <PARAM managedBy="system" name="oozieReportActionsCsv" required="true" type="string">build-report</PARAM>
48
                </PARAMETERS>
49
                <ARCS>
50
                    <!-- No node named 'success' is declared in this CONFIGURATION; presumably a built-in
                         terminal target of the workflow engine. TODO confirm. -->
                    <ARC to="success"/>
51
                </ARCS>
52
            </NODE>
53

  
54
        </CONFIGURATION>
55
        <!-- Outcome of the most recent run recorded in this profile.
             NOTE(review): the execution id embeds 20190805 while LAST_EXECUTION_DATE is 2019-08-07, and both
             predate the header's DATE_OF_CREATION (2019-10-17). These values look copied from another
             profile; confirm whether they should be reset for a newly introduced workflow. -->
        <STATUS>
56
            <LAST_EXECUTION_ID>wf_20190805_085505_893</LAST_EXECUTION_ID>
57
            <LAST_EXECUTION_DATE>2019-08-07T05:19:02+00:00</LAST_EXECUTION_DATE>
58
            <LAST_EXECUTION_STATUS>SUCCESS</LAST_EXECUTION_STATUS>
59
            <!-- Empty element: no error recorded for the last execution. -->
            <LAST_EXECUTION_ERROR/>
60
        </STATUS>
61
    </BODY>
62
</RESOURCE_PROFILE>

Also available in: Unified diff