Project

General

Profile

1
<RESOURCE_PROFILE>
2
    <!-- Profile header: identifier, resource type, resource kind, URI and
         creation timestamp of this profile. RESOURCE_URI carries an empty
         value. The part of RESOURCE_IDENTIFIER after the underscore is the
         base64 encoding of "WorkflowDSResources/WorkflowDSResourceType",
         i.e. the RESOURCE_KIND and RESOURCE_TYPE values joined by a slash. -->
    <HEADER>
        <RESOURCE_IDENTIFIER value="e03f256e-1e4d-4b3d-9c07-91faf5d25208_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/>
        <RESOURCE_TYPE value="WorkflowDSResourceType"/>
        <RESOURCE_KIND value="WorkflowDSResources"/>
        <RESOURCE_URI value=""/>
        <DATE_OF_CREATION value="2021-05-07T13:09:35+00:00"/>
    </HEADER>
9
    <BODY>
10
        <!-- Workflow identity: display name, workflow type and numeric priority. -->
        <WORKFLOW_NAME>Import DOIboost</WORKFLOW_NAME>
        <WORKFLOW_TYPE>Import InfoSpace</WORKFLOW_TYPE>
        <WORKFLOW_PRIORITY>30</WORKFLOW_PRIORITY>
13
        <CONFIGURATION start="manual">
14
            <!-- Start node: sets the env parameter "inputPathMAG" (name is
                 system-managed) to the user-managed MAG input path, then
                 hands over to the "waitConfig" node. -->
            <NODE isStart="true" name="setInputPathMAG" type="SetEnvParameter">
                <DESCRIPTION>set the input path for MAG</DESCRIPTION>
                <PARAMETERS>
                    <PARAM managedBy="system" name="parameterName" required="true" type="string">inputPathMAG</PARAM>
                    <PARAM managedBy="user" name="parameterValue" required="true" type="string">/data/doiboost/input/mag</PARAM>
                </PARAMETERS>
                <ARCS>
                    <ARC to="waitConfig"/>
                </ARCS>
            </NODE>
24
            <!-- Start node: sets the env parameter "inputPathCrossref" (name
                 is system-managed) to the user-managed Crossref input path,
                 then hands over to the "waitConfig" node. -->
            <NODE isStart="true" name="setInputPathCrossref" type="SetEnvParameter">
                <DESCRIPTION>set the input path for Crossref</DESCRIPTION>
                <PARAMETERS>
                    <PARAM managedBy="system" name="parameterName" required="true" type="string">inputPathCrossref</PARAM>
                    <PARAM managedBy="user" name="parameterValue" required="true" type="string">/data/doiboost/input/crossref</PARAM>
                </PARAMETERS>
                <ARCS>
                    <ARC to="waitConfig"/>
                </ARCS>
            </NODE>
34
            <!-- Start node: sets the env parameter "inputPathUnpayWall" (name
                 is system-managed) to the user-managed UnpayWall input path,
                 then hands over to the "waitConfig" node. -->
            <NODE isStart="true" name="setInputPathUnpayWall" type="SetEnvParameter">
                <DESCRIPTION>set the input path for UnpayWall</DESCRIPTION>
                <PARAMETERS>
                    <PARAM managedBy="system" name="parameterName" required="true" type="string">inputPathUnpayWall</PARAM>
                    <PARAM managedBy="user" name="parameterValue" required="true" type="string">/data/doiboost/input/unpayWall</PARAM>
                </PARAMETERS>
                <ARCS>
                    <ARC to="waitConfig"/>
                </ARCS>
            </NODE>
44
            <!-- Start node: sets the env parameter "workingPathOrcid" (name is
                 system-managed) to the user-managed ORCID working path, then
                 hands over to the "waitConfig" node. -->
            <NODE isStart="true" name="setWorkingPathOrcid" type="SetEnvParameter">
                <DESCRIPTION>set the working path for ORCID</DESCRIPTION>
                <PARAMETERS>
                    <PARAM managedBy="system" name="parameterName" required="true" type="string">workingPathOrcid</PARAM>
                    <PARAM managedBy="user" name="parameterValue" required="true" type="string">/data/doiboost/input/orcid</PARAM>
                </PARAMETERS>
                <ARCS>
                    <ARC to="waitConfig"/>
                </ARCS>
            </NODE>
54
            <!-- Start node: sets the env parameter "hostedByMapPath" (name is
                 system-managed) to the user-managed location of the hostedBy
                 map file, then hands over to the "waitConfig" node. -->
            <NODE isStart="true" name="setHostedByMapPath" type="SetEnvParameter">
                <DESCRIPTION>set the hostedBy map path</DESCRIPTION>
                <PARAMETERS>
                    <PARAM managedBy="system" name="parameterName" required="true" type="string">hostedByMapPath</PARAM>
                    <PARAM managedBy="user" name="parameterValue" required="true" type="string">/data/doiboost/input/hostedBy/hbMap.gz</PARAM>
                </PARAMETERS>
                <ARCS>
                    <ARC to="waitConfig"/>
                </ARCS>
            </NODE>
64
            <!-- Start node: sets the env parameter "resumeFrom", i.e. the oozie
                 workflow name from which execution is resumed. The value is
                 user-managed, not required, restricted by validValues(...) to
                 the six listed step names, and currently ConvertCrossrefToOAF.
                 Hands over to the "waitConfig" node. -->
            <NODE isStart="true" name="setResumeFrom" type="SetEnvParameter">
                <DESCRIPTION>set the oozie workflow name from which the execution will be resumed</DESCRIPTION>
                <PARAMETERS>
                    <PARAM managedBy="system" name="parameterName" required="true" type="string">resumeFrom</PARAM>
                    <PARAM function="validValues(['ConvertCrossrefToOAF','PreprocessMag','PreprocessUW', 'ProcessORCID', 'CreateDOIBoost', 'GenerateActionSet'])" managedBy="user" name="parameterValue" required="false" type="string">ConvertCrossrefToOAF</PARAM>
                </PARAMETERS>
                <ARCS>
                    <ARC to="waitConfig"/>
                </ARCS>
            </NODE>
74
            <!-- Join node (isJoin="true"): the target of the arcs of all six
                 start nodes in this configuration. It takes no parameters and
                 continues to "prepareActionSets". -->
            <NODE isJoin="true" name="waitConfig">
                <DESCRIPTION>wait configurations</DESCRIPTION>
                <PARAMETERS/>
                <ARCS>
                    <ARC to="prepareActionSets"/>
                </ARCS>
            </NODE>
81
            <!-- Prepares the action sets. The "sets" parameter is a single-quoted,
                 JSON-like list holding one entry: set "doiboost", with job
                 property "export_action_set_doiboost", enabling property
                 "active_doiboost", and enabled set to 'true'.
                 Continues to "extractOutputPath". -->
            <NODE name="prepareActionSets" type="PrepareActionSets">
                <DESCRIPTION>prepare action sets</DESCRIPTION>
                <PARAMETERS>
                    <PARAM managedBy="system" name="sets" required="true" type="string">
                        [
                        {
                        'set' : 'doiboost',
                        'jobProperty' : 'export_action_set_doiboost',
                        'enablingProperty' : 'active_doiboost',
                        'enabled' : 'true'
                        }
                        ]
                    </PARAM>
                </PARAMETERS>
                <ARCS>
                    <ARC to="extractOutputPath"/>
                </ARCS>
            </NODE>
99
            <!-- Extracts the HDFS output path generated by the previous node.
                 "hdfsOutputPathParam" is set to "outputPath", the same name
                 that "updateDOIBoost" lists in its envParams.
                 Continues to "updateDOIBoost". -->
            <NODE name="extractOutputPath" type="ExtractOutputPath">
                <DESCRIPTION>extract the hdfs output path generated in the previous node</DESCRIPTION>
                <PARAMETERS>
                    <PARAM managedBy="system" name="hdfsOutputPathParam" required="true" type="string">outputPath</PARAM>
                </PARAMETERS>
                <ARCS>
                    <ARC to="updateDOIBoost"/>
                </ARCS>
            </NODE>
108
            <!-- Submits the Hadoop job "executeOozieJob" on cluster "IIS" to
                 prepare a new version of DOIBoost, then continues to
                 "updateActionSets". -->
            <NODE name="updateDOIBoost" type="SubmitHadoopJob">
                <DESCRIPTION>prepare a new version of DOIBoost</DESCRIPTION>
                <PARAMETERS>
                    <PARAM managedBy="system" name="hadoopJob" required="true" type="string">executeOozieJob</PARAM>
                    <PARAM managedBy="system" name="cluster" required="true" type="string">IIS</PARAM>
                    <!-- envParams: each key maps to an identically named value.
                         The names are the env parameters set by the six start
                         nodes plus "outputPath" from "extractOutputPath".
                         NOTE(review): presumably key = job property and
                         value = workflow env parameter; confirm with the
                         node implementation. -->
                    <PARAM managedBy="system" name="envParams" required="true" type="string">
                        {
                        'hostedByMapPath' : 'hostedByMapPath',
                        'inputPathMAG' : 'inputPathMAG',
                        'inputPathCrossref' : 'inputPathCrossref',
                        'inputPathUnpayWall' : 'inputPathUnpayWall',
                        'outputPath' : 'outputPath',
                        'workingPathOrcid':'workingPathOrcid',
                        'resumeFrom' : 'resumeFrom'
                        }
                    </PARAM>
                    <!-- params: fixed job settings, namely the oozie application
                         path, the working path and two Spark executor memory
                         sizes. -->
                    <PARAM managedBy="system" name="params" required="true" type="string">
                        {
                        'oozie.wf.application.path' : '/lib/dnet/PROD/doiboost/process/oozie_app',
                        'workingPath' : '/data/doiboost/process_p',
                        'sparkExecutorIntersectionMemory' : '9G',
                        'sparkExecutorMemory' : '6G'
                        }
                    </PARAM>
                    <PARAM managedBy="system" name="oozieReportActionsCsv" required="true" type="string">build-report</PARAM>
                </PARAMETERS>
                <ARCS>
                    <ARC to="updateActionSets"/>
                </ARCS>
            </NODE>
138
            <!-- Last node of the chain: updates the action sets. It takes no
                 parameters and its only arc points to "success", which is not
                 declared as a NODE in this configuration.
                 NOTE(review): presumably a built-in terminal state; confirm. -->
            <NODE name="updateActionSets" type="UpdateActionSets">
                <DESCRIPTION>update action sets</DESCRIPTION>
                <PARAMETERS/>
                <ARCS>
                    <ARC to="success"/>
                </ARCS>
            </NODE>
145
        </CONFIGURATION>
146
        <!-- Record of the last execution: its id, date, status and error.
             The recorded status is SUCCESS and the error element is empty. -->
        <STATUS>
            <LAST_EXECUTION_ID>wf_20210512_082537_192</LAST_EXECUTION_ID>
            <LAST_EXECUTION_DATE>2021-05-12T10:19:27+00:00</LAST_EXECUTION_DATE>
            <LAST_EXECUTION_STATUS>SUCCESS</LAST_EXECUTION_STATUS>
            <LAST_EXECUTION_ERROR/>
        </STATUS>
152
    </BODY>
153
</RESOURCE_PROFILE>
(3-3/7)