<!-- Project / General / Profile / 1 60995 alessia.ba -->
<RESOURCE_PROFILE>
    <!-- Workflow resource profile: identification metadata in HEADER,
         workflow definition and last-run status in BODY. -->
    <HEADER>
        <RESOURCE_IDENTIFIER value="7cf3cfed-fbfb-46ca-b4da-aa43beb58f18_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/>
        <RESOURCE_TYPE value="WorkflowDSResourceType"/>
        <RESOURCE_KIND value="WorkflowDSResources"/>
        <RESOURCE_URI value=""/>
        <DATE_OF_CREATION value="2021-04-22T09:03:40+00:00"/>
    </HEADER>
    <BODY>
        <WORKFLOW_NAME>Update ORCID (no DOI) actionset</WORKFLOW_NAME>
        <WORKFLOW_TYPE>Import Infospace</WORKFLOW_TYPE>
        <WORKFLOW_PRIORITY>30</WORKFLOW_PRIORITY>
        <!-- Node chain, as wired by the ARC elements below:
             setInputPath, prepareActionSets, extractOutputPath,
             orcidNoDoiUpdate, updateActionSets, then "success".
             NOTE(review): "success" is an ARC target with no NODE defined in this
             profile; presumably a terminal state provided by the workflow engine. -->
        <CONFIGURATION start="manual">
            <!-- Entry node (isStart="true"): stores the user-managed base path
                 under the parameter name "inputPath". -->
            <NODE isStart="true" name="setInputPath" type="SetEnvParameter">
                <DESCRIPTION>Set the base path containing the no_doi_dataset folder</DESCRIPTION>
                <PARAMETERS>
                    <PARAM managedBy="system" name="parameterName" required="true" type="string">inputPath</PARAM>
                    <PARAM managedBy="user" name="parameterValue" required="true" type="string">/data/orcid_activities_2020</PARAM>
                </PARAMETERS>
                <ARCS>
                    <ARC to="prepareActionSets"/>
                </ARCS>
            </NODE>
            <!-- The "sets" value is a single-quoted, JSON-like list with one entry
                 for the 'orcidworks-no-doi' set. Its text is kept exactly as authored,
                 including indentation, because the consumer's parsing is not visible here. -->
            <NODE name="prepareActionSets" type="PrepareActionSets">
                <DESCRIPTION>prepare action sets</DESCRIPTION>
                <PARAMETERS>
                    <PARAM managedBy="system" name="sets" required="true" type="string">
                        [
                        {
                        'set' : 'orcidworks-no-doi',
                        'jobProperty' : 'export_action_set_orcidworks_no_doi',
                        'enablingProperty' : 'active_orcidworks_no_doi',
                        'enabled' : 'true'
                        }
                        ]
                    </PARAM>
                </PARAMETERS>
                <ARCS>
                    <ARC to="extractOutputPath"/>
                </ARCS>
            </NODE>
            <!-- hdfsOutputPathParam is set to "outputPath", the same name that
                 orcidNoDoiUpdate references in its envParams. -->
            <NODE name="extractOutputPath" type="ExtractOutputPath">
                <DESCRIPTION>extract the hdfs output path generated in the previous node</DESCRIPTION>
                <PARAMETERS>
                    <PARAM managedBy="system" name="hdfsOutputPathParam" required="true" type="string">outputPath</PARAM>
                </PARAMETERS>
                <ARCS>
                    <ARC to="orcidNoDoiUpdate"/>
                </ARCS>
            </NODE>
            <!-- Submits the Oozie application named in "params" on cluster "IIS".
                 NOTE(review): envParams presumably maps job property names
                 ('workingPath', 'outputPath') to the env parameter names set by
                 earlier nodes ('inputPath', 'outputPath'); confirm against the
                 SubmitHadoopJob node implementation. -->
            <NODE name="orcidNoDoiUpdate" type="SubmitHadoopJob">
                <DESCRIPTION>prepare updates for the Orcid No Doi</DESCRIPTION>
                <PARAMETERS>
                    <PARAM managedBy="system" name="hadoopJob" required="true" type="string">executeOozieJob</PARAM>
                    <PARAM managedBy="system" name="cluster" required="true" type="string">IIS</PARAM>
                    <PARAM managedBy="system" name="envParams" required="true" type="string">
                        {
                        'workingPath' : 'inputPath',
                        'outputPath': 'outputPath'
                        }
                    </PARAM>
                    <PARAM managedBy="system" name="params" required="true" type="string">
                        {
                        'oozie.wf.application.path' : '/lib/dnet/STABLE_IDS/actionmanager/orcidnodoi_actionset/oozie_app',
                        'spark2GenNoDoiDatasetMaxExecutors' : '200',
                        'spark2GenNoDoiDatasetExecutorMemory' : '2G'
                        }
                    </PARAM>
                    <PARAM managedBy="system" name="oozieReportActionsCsv" required="true" type="string">build-report</PARAM>
                </PARAMETERS>
                <ARCS>
                    <ARC to="updateActionSets"/>
                </ARCS>
            </NODE>
            <!-- Last node of the chain; takes no parameters and hands over to "success". -->
            <NODE name="updateActionSets" type="UpdateActionSets">
                <DESCRIPTION>update action sets</DESCRIPTION>
                <PARAMETERS/>
                <ARCS>
                    <ARC to="success"/>
                </ARCS>
            </NODE>
        </CONFIGURATION>
        <!-- Outcome of the most recent run recorded in this profile;
             LAST_EXECUTION_ERROR is empty here. -->
        <STATUS>
            <LAST_EXECUTION_ID>wf_20210505_073553_347</LAST_EXECUTION_ID>
            <LAST_EXECUTION_DATE>2021-05-05T07:43:23+00:00</LAST_EXECUTION_DATE>
            <LAST_EXECUTION_STATUS>SUCCESS</LAST_EXECUTION_STATUS>
            <LAST_EXECUTION_ERROR/>
        </STATUS>
    </BODY>
</RESOURCE_PROFILE>