<!--
  SET_INFO: start node of this workflow (isStart="true"), type SetProviderInfo.
  Its three system-managed parameters are filled from the "dataprovider:id",
  "dataprovider:name" and "dataprovider:interface" workflow parameters.
  Single outgoing arc: obtainParams.
-->
<NODE name="SET_INFO" isStart="true" type="SetProviderInfo">
    <DESCRIPTION>Set information about current provider</DESCRIPTION>
    <PARAMETERS>
        <PARAM required="true" type="string" name="providerId" managedBy="system">$params.("dataprovider:id")$</PARAM>
        <PARAM required="true" type="string" name="providerName" managedBy="system">$params.("dataprovider:name")$</PARAM>
        <PARAM required="true" type="string" name="api" managedBy="system">$params.("dataprovider:interface")$</PARAM>
    </PARAMETERS>
    <ARCS>
        <ARC to="obtainParams" />
    </ARCS>
</NODE>
<!--
  obtainParams: node of type ObtainOpenaireDataSourceParams.
  Receives providerId from the "dataprovider:id" workflow parameter and then
  continues to PREPARE_ENV_TRANSFORMATION.
  NOTE(review): the DESCRIPTION below talks about fetching records from an
  MDStore, which does not obviously match the node type; confirm and reword
  if it was copied from another node.
-->
<NODE name="obtainParams" type="ObtainOpenaireDataSourceParams">
    <DESCRIPTION>Fetch records from MDStore</DESCRIPTION>
    <PARAMETERS>
        <PARAM required="true" type="string" name="providerId" managedBy="system">$params.("dataprovider:id")$</PARAM>
    </PARAMETERS>
    <ARCS>
        <ARC to="PREPARE_ENV_TRANSFORMATION"/>
    </ARCS>
</NODE>
<!--
  PREPARE_ENV_TRANSFORMATION: node of type PrepareEnvTransformHadoopJobNode.
  Parameters:
    ruleId        - user-managed, no default value; its "function" attribute
                    calls listProfiles on TransformationRuleDSResourceType.
    mdstoreInput  - system-managed, taken from the "harv_id" workflow parameter.
    mdstoreOutput - system-managed, taken from the "tran_id" workflow parameter.
  Single outgoing arc: TRANSFORM_HADOOP.
-->
<NODE name="PREPARE_ENV_TRANSFORMATION" type="PrepareEnvTransformHadoopJobNode">
    <DESCRIPTION>Retrieve all the parameters needed to run the transformation workflow</DESCRIPTION>
    <PARAMETERS>
        <PARAM category="TRANSFORMATION_RULE_ID"
               function="listProfiles('TransformationRuleDSResourceType', '//TITLE')"
               managedBy="user"
               name="ruleId"
               required="true"
               type="string"></PARAM>
        <PARAM required="true" type="string" name="mdstoreInput" managedBy="system" category="MDSTORE_ID">$params.("harv_id")$</PARAM>
        <PARAM required="true" type="string" name="mdstoreOutput" managedBy="system" category="MDSTORE_ID">$params.("tran_id")$</PARAM>
    </PARAMETERS>
    <ARCS>
        <ARC to="TRANSFORM_HADOOP"/>
    </ARCS>
</NODE>
<!--
  TRANSFORM_HADOOP: node of type SubmitDnetHadoopJobNode.
  Parameters:
    hadoopJob             - fixed to "executeOozieJob".
    cluster               - user-managed, defaults to "DHP".
    envParams             - JSON object; presumably maps job property names
                            (keys) to workflow env attribute names (values).
                            TODO confirm against the node implementation.
    params                - JSON object with static job parameters.
    oozieReportActionsCsv - fixed to "CommitVersion".
  Single outgoing arc: UPDATE_INFO.
  NOTE(review): "params" uses single-quoted keys and values while "envParams"
  uses standard double-quoted JSON. The text is kept exactly as it was; confirm
  that the consumer parses it leniently before normalising the quotes.
-->
<NODE name="TRANSFORM_HADOOP" type="SubmitDnetHadoopJobNode">
    <DESCRIPTION>Start the Hadoop Job</DESCRIPTION>
    <PARAMETERS>
        <PARAM managedBy="system" name="hadoopJob" required="true" type="string">executeOozieJob</PARAM>
        <PARAM managedBy="user" name="cluster" required="true" type="string">DHP</PARAM>
        <PARAM managedBy="system" name="envParams" required="true" type="string">
            {
                "mdStoreInputId":"mdstoreInput",
                "mdStoreOutputId":"mdstoreOutput",
                "transformationRuleId":"transformationRule",
                "dateOfTransformation":"timestamp",
                "workflowId":"workflowId",
                "oozie.wf.application.path":"oozieWfPath"
            }
        </PARAM>
        <PARAM managedBy="system" name="params" required="true" type="string">
            {
                'transformationPlugin':'XSLT_TRANSFORM'
            }
        </PARAM>
        <PARAM managedBy="system" name="oozieReportActionsCsv" required="true" type="string">CommitVersion</PARAM>
    </PARAMETERS>
    <ARCS>
        <ARC to="UPDATE_INFO"/>
    </ARCS>
</NODE>
<!--
  UPDATE_INFO: node of type MDStoreToApiExtraFieldHadoop.
  Parameters:
    mdId                - taken from the "tran_id" workflow parameter.
    datasourceId        - taken from "dataprovider:id".
    datasourceInterface - taken from "dataprovider:interface".
    extraFieldForTotal / extraFieldForDate / extraFieldForMdId - fixed names
                          last_aggregation_total, last_aggregation_date and
                          last_aggregation_mdId.
  Single outgoing arc: success.
-->
<NODE name="UPDATE_INFO" type="MDStoreToApiExtraFieldHadoop">
    <DESCRIPTION>Update datasource API extra fields</DESCRIPTION>
    <PARAMETERS>
        <PARAM required="true" type="string" name="mdId" managedBy="system">$params.("tran_id")$</PARAM>
        <PARAM required="true" type="string" name="datasourceId" managedBy="system">$params.("dataprovider:id")$</PARAM>
        <PARAM required="true" type="string" name="datasourceInterface" managedBy="system">$params.("dataprovider:interface")$</PARAM>
        <PARAM required="true" type="string" name="extraFieldForTotal" managedBy="system">last_aggregation_total</PARAM>
        <PARAM required="true" type="string" name="extraFieldForDate" managedBy="system">last_aggregation_date</PARAM>
        <PARAM required="true" type="string" name="extraFieldForMdId" managedBy="system">last_aggregation_mdId</PARAM>
    </PARAMETERS>
    <ARCS>
        <ARC to="success"/>
    </ARCS>
</NODE>