Revision 49303
Added by Claudio Atzori over 6 years ago
modules/dnet-openaireplus-workflows/branches/solr6/deploy.info | ||
---|---|---|
1 |
{"type_source": "SVN", "goal": "package -U source:jar", "url": "http://svn-public.driver.research-infrastructures.eu/driver/dnet45/modules/dnet-openaireplus-workflows/branches/solr6/", "deploy_repository": "dnet45-snapshots", "version": "4", "mail": "sandro.labruzzo@isti.cnr.it,michele.artini@isti.cnr.it, claudio.atzori@isti.cnr.it, alessia.bardi@isti.cnr.it", "deploy_repository_url": "http://maven.research-infrastructures.eu/nexus/content/repositories/dnet45-snapshots", "name": "dnet-openaireplus-workflows"} |
modules/dnet-openaireplus-workflows/branches/solr6/src/main/resources/eu/dnetlib/test/profiles/openaireplus/workflows/hbase/claims2hbase.xml | ||
---|---|---|
1 |
<RESOURCE_PROFILE> |
|
2 |
<HEADER> |
|
3 |
<RESOURCE_IDENTIFIER value="001ca627-1ae1-4053-9243-bca6ee149b22_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/> |
|
4 |
<RESOURCE_TYPE value="WorkflowDSResourceType"/> |
|
5 |
<RESOURCE_KIND value="WorkflowDSResources"/> |
|
6 |
<RESOURCE_URI value=""/> |
|
7 |
<DATE_OF_CREATION value="2017-06-24T18:13:51.0Z"/> |
|
8 |
</HEADER> |
|
9 |
<BODY> |
|
10 |
<WORKFLOW_NAME>Claim to HBase</WORKFLOW_NAME> |
|
11 |
<WORKFLOW_TYPE>Data Load</WORKFLOW_TYPE> |
|
12 |
<WORKFLOW_PRIORITY>30</WORKFLOW_PRIORITY> |
|
13 |
<CONFIGURATION start="manual"> |
|
14 |
<NODE name="applyClaimRels" type="ApplyClaimRels" isStart="true"> |
|
15 |
<DESCRIPTION>Apply Claim Rels</DESCRIPTION> |
|
16 |
<PARAMETERS> |
|
17 |
<PARAM managedBy="system" name="clusterName" required="true" type="string">DM</PARAM> |
|
18 |
<PARAM managedBy="user" name="tableName" required="true" type="string"></PARAM> |
|
19 |
<PARAM managedBy="user" name="sql" required="true" type="string">SELECT source_type, source_id, target_type, target_id, semantics FROM claim WHERE approved=TRUE AND source_type !='context'</PARAM> |
|
20 |
<PARAM managedBy="user" name="countQuery" required="true" type="string">SELECT count(*) FROM claim WHERE approved=TRUE AND source_type !='context'</PARAM> |
|
21 |
</PARAMETERS> |
|
22 |
<ARCS> |
|
23 |
<ARC to="applyClaimUpdates"/> |
|
24 |
</ARCS> |
|
25 |
</NODE> |
|
26 |
<NODE name="applyClaimUpdates" type="ApplyClaimUpdates"> |
|
27 |
<DESCRIPTION>Apply Claim Updates</DESCRIPTION> |
|
28 |
<PARAMETERS> |
|
29 |
<PARAM managedBy="system" name="clusterName" required="true" type="string">DM</PARAM> |
|
30 |
<PARAM managedBy="user" name="tableName" required="true" type="string"></PARAM> |
|
31 |
<PARAM managedBy="user" name="sql" required="true" type="string">SELECT source_type, source_id, target_type, target_id, semantics FROM claim WHERE approved=TRUE AND source_type ='context'</PARAM> |
|
32 |
<PARAM managedBy="user" name="countQuery" required="true" type="string">SELECT count(*) FROM claim WHERE approved=TRUE AND source_type ='context'</PARAM> |
|
33 |
</PARAMETERS> |
|
34 |
<ARCS> |
|
35 |
<ARC to="success"/> |
|
36 |
</ARCS> |
|
37 |
</NODE> |
|
38 |
</CONFIGURATION> |
|
39 |
<STATUS> |
|
40 |
</STATUS> |
|
41 |
</BODY> |
|
42 |
</RESOURCE_PROFILE> |
modules/dnet-openaireplus-workflows/branches/solr6/src/main/resources/eu/dnetlib/test/profiles/openaireplus/workflows/hbase/odf2hbase.xml | ||
---|---|---|
1 |
<?xml version="1.0" encoding="UTF-8"?> |
|
2 |
<RESOURCE_PROFILE> |
|
3 |
<HEADER> |
|
4 |
<RESOURCE_IDENTIFIER |
|
5 |
value="939f1075-70ed-4fbd-9055-ea16e5984531_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/> |
|
6 |
<RESOURCE_TYPE value="WorkflowDSResourceType"/> |
|
7 |
<RESOURCE_KIND value="WorkflowDSResources"/> |
|
8 |
<RESOURCE_URI value=""/> |
|
9 |
<DATE_OF_CREATION value="2006-05-04T18:13:51.0Z"/> |
|
10 |
</HEADER> |
|
11 |
<BODY> |
|
12 |
<WORKFLOW_NAME>ODF to HBase</WORKFLOW_NAME> |
|
13 |
<WORKFLOW_TYPE>Data Load</WORKFLOW_TYPE> |
|
14 |
<WORKFLOW_PRIORITY>30</WORKFLOW_PRIORITY> |
|
15 |
<CONFIGURATION start="manual"> |
|
16 |
<NODE name="setTable" type="SetHBaseTable" isStart="true"> |
|
17 |
<DESCRIPTION>set hbase table</DESCRIPTION> |
|
18 |
<PARAMETERS> |
|
19 |
<PARAM name="table" type="string" managedBy="user" required="true"></PARAM> |
|
20 |
</PARAMETERS> |
|
21 |
<ARCS> |
|
22 |
<ARC to="mapreduce"/> |
|
23 |
</ARCS> |
|
24 |
</NODE> |
|
25 |
|
|
26 |
<NODE name="prepareImport" type="PrepareMDStoreImport" isStart="true"> |
|
27 |
<DESCRIPTION>Configure export to HDFS</DESCRIPTION> |
|
28 |
<PARAMETERS> |
|
29 |
<PARAM required="true" type="string" name="hdfsPathParam" managedBy="system">hdfsPath</PARAM> |
|
30 |
<PARAM required="true" type="string" name="hdfsPath" managedBy="user">/tmp/mdstores_odf-store-cleaned.seq</PARAM> |
|
31 |
<PARAM required="true" type="string" name="mappingParam" managedBy="system">xslt</PARAM> |
|
32 |
<PARAM required="true" type="string" name="mapping" managedBy="user" function="obtainValues('odf2hbaseMappings', {})"></PARAM> |
|
33 |
</PARAMETERS> |
|
34 |
<ARCS> |
|
35 |
<ARC to="reuseHdfsRecords"/> |
|
36 |
</ARCS> |
|
37 |
</NODE> |
|
38 |
<NODE name="reuseHdfsRecords" type="ReuseHdfsRecords"> |
|
39 |
<DESCRIPTION>reuse mdstore records</DESCRIPTION> |
|
40 |
<PARAMETERS> |
|
41 |
<PARAM required="true" type="boolean" name="reuseMdRecords" managedBy="user">false</PARAM> |
|
42 |
</PARAMETERS> |
|
43 |
<ARCS> |
|
44 |
<ARC name="true" to="doneExport"/> |
|
45 |
<ARC name="false" to="exportRecords"/> |
|
46 |
</ARCS> |
|
47 |
</NODE> |
|
48 |
<NODE name="exportRecords" type="MDStoreBatchExporter"> |
|
49 |
<DESCRIPTION>Fetch mdstore records</DESCRIPTION> |
|
50 |
<PARAMETERS> |
|
51 |
<PARAM required="true" type="string" name="format" managedBy="system">ODF</PARAM> |
|
52 |
<PARAM required="true" type="string" name="layout" managedBy="system">store</PARAM> |
|
53 |
<PARAM required="true" type="string" name="interpretation" managedBy="system">cleaned</PARAM> |
|
54 |
<PARAM required="true" type="string" name="outputEprParam" managedBy="system">records_epr</PARAM> |
|
55 |
</PARAMETERS> |
|
56 |
<ARCS> |
|
57 |
<ARC to="storeHdfsRecords"/> |
|
58 |
</ARCS> |
|
59 |
</NODE> |
|
60 |
<NODE name="storeHdfsRecords" type="StoreHdfsRecords"> |
|
61 |
<DESCRIPTION>Store records to HDFS</DESCRIPTION> |
|
62 |
<PARAMETERS> |
|
63 |
<PARAM required="true" type="string" name="inputEprParam" managedBy="system">records_epr</PARAM> |
|
64 |
<PARAM required="true" type="string" name="hdfsPathParam" managedBy="system">hdfsPath</PARAM> |
|
65 |
<PARAM required="true" type="string" name="cluster" managedBy="system">DM</PARAM> |
|
66 |
</PARAMETERS> |
|
67 |
<ARCS> |
|
68 |
<ARC to="doneExport"/> |
|
69 |
</ARCS> |
|
70 |
</NODE> |
|
71 |
<NODE name="doneExport"> |
|
72 |
<DESCRIPTION></DESCRIPTION> |
|
73 |
<PARAMETERS/> |
|
74 |
<ARCS> |
|
75 |
<ARC to="mapreduce"/> |
|
76 |
</ARCS> |
|
77 |
</NODE> |
|
78 |
<NODE name="mapreduce" type="SubmitHadoopJob" isJoin="true"> |
|
79 |
<DESCRIPTION>Run M/R import Job</DESCRIPTION> |
|
80 |
<PARAMETERS> |
|
81 |
<PARAM required="true" type="string" name="cluster" managedBy="system">DM</PARAM> |
|
82 |
<PARAM required="true" type="string" name="hadoopJob" managedBy="system">mdStoreHdfsImportJob</PARAM> |
|
83 |
<PARAM required="true" type="boolean" name="simulation" managedBy="user">false</PARAM> |
|
84 |
<PARAM required="true" type="string" name="envParams" managedBy="system"> |
|
85 |
{ |
|
86 |
'mapred.input.dir' : 'hdfsPath', |
|
87 |
'hbase.import.xslt' : 'xslt', |
|
88 |
'hbase.mapred.outputtable' : 'hbaseTable' |
|
89 |
} |
|
90 |
</PARAM> |
|
91 |
</PARAMETERS> |
|
92 |
<ARCS> |
|
93 |
<ARC to="success"/> |
|
94 |
</ARCS> |
|
95 |
</NODE> |
|
96 |
</CONFIGURATION> |
|
97 |
<STATUS/> |
|
98 |
</BODY> |
|
99 |
</RESOURCE_PROFILE> |
|
100 |
|
|
101 |
|
modules/dnet-openaireplus-workflows/branches/solr6/src/main/resources/eu/dnetlib/test/profiles/openaireplus/workflows/hbase/importActionsFromHDFS.xml | ||
---|---|---|
1 |
<?xml version="1.0" encoding="UTF-8"?> |
|
2 |
<RESOURCE_PROFILE> |
|
3 |
<HEADER> |
|
4 |
<RESOURCE_IDENTIFIER |
|
5 |
value="cbfb388a-c184-4a88-be66-0f1d3bb61fe5_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/> |
|
6 |
<RESOURCE_TYPE value="WorkflowDSResourceType"/> |
|
7 |
<RESOURCE_KIND value="WorkflowDSResources"/> |
|
8 |
<RESOURCE_URI value=""/> |
|
9 |
<DATE_OF_CREATION value="2006-05-04T18:13:51.0Z"/> |
|
10 |
</HEADER> |
|
11 |
<BODY> |
|
12 |
<WORKFLOW_NAME>Actions from HDFS</WORKFLOW_NAME> |
|
13 |
<WORKFLOW_TYPE>Data Load</WORKFLOW_TYPE> |
|
14 |
<WORKFLOW_PRIORITY>30</WORKFLOW_PRIORITY> |
|
15 |
<CONFIGURATION start="manual"> |
|
16 |
<NODE name="hadoopConfig" type="SetClusterAndTable" isStart="true"> |
|
17 |
<DESCRIPTION>Set table name</DESCRIPTION> |
|
18 |
<PARAMETERS> |
|
19 |
<PARAM required="true" type="string" name="cluster" managedBy="system">DM</PARAM> |
|
20 |
<PARAM required="true" type="string" name="tableParam" managedBy="system">tableName</PARAM> |
|
21 |
<PARAM required="true" type="string" name="table" managedBy="user"></PARAM> |
|
22 |
</PARAMETERS> |
|
23 |
<ARCS> |
|
24 |
<ARC to="importMapreduce"/> |
|
25 |
</ARCS> |
|
26 |
</NODE> |
|
27 |
<NODE name="setActionsPath" type="SetEnvParameter" isStart="true"> |
|
28 |
<DESCRIPTION>Set the sequence file path on HDFS holding the exported Actions</DESCRIPTION> |
|
29 |
<PARAMETERS> |
|
30 |
<PARAM managedBy="system" name="parameterName" required="true" type="string">actionsPath</PARAM> |
|
31 |
<PARAM managedBy="user" name="parameterValue" required="true" type="string">/tmp/2016-03-25_iis_preprocessing/document_referencedDatasets/rawset_76cfeefd-1139-4a30-a394-f01bf67220bf_1458652954774</PARAM> |
|
32 |
</PARAMETERS> |
|
33 |
<ARCS> |
|
34 |
<ARC to="importMapreduce"/> |
|
35 |
</ARCS> |
|
36 |
</NODE> |
|
37 |
|
|
38 |
<NODE name="importMapreduce" type="SubmitHadoopJob" isJoin="true"> |
|
39 |
<DESCRIPTION>Run M/R import Job</DESCRIPTION> |
|
40 |
<PARAMETERS> |
|
41 |
<PARAM required="true" type="string" name="hadoopJob" managedBy="system">actionsImportJob</PARAM> |
|
42 |
<PARAM required="true" type="string" name="envParams" managedBy="system"> |
|
43 |
{ |
|
44 |
'cluster' : 'cluster', |
|
45 |
'mapred.input.dir' : 'actionsPath', |
|
46 |
'hbase.mapred.outputtable' : 'tableName' |
|
47 |
} |
|
48 |
</PARAM> |
|
49 |
<PARAM required="true" type="boolean" name="simulation" managedBy="user">false</PARAM> |
|
50 |
</PARAMETERS> |
|
51 |
<ARCS> |
|
52 |
<ARC to="success"/> |
|
53 |
</ARCS> |
|
54 |
</NODE> |
|
55 |
|
|
56 |
</CONFIGURATION> |
|
57 |
<STATUS/> |
|
58 |
</BODY> |
|
59 |
</RESOURCE_PROFILE> |
|
60 |
|
|
61 |
|
modules/dnet-openaireplus-workflows/branches/solr6/src/main/resources/eu/dnetlib/test/profiles/openaireplus/workflows/hbase/actions2hbase.xml | ||
---|---|---|
1 |
<?xml version="1.0" encoding="UTF-8"?> |
|
2 |
<RESOURCE_PROFILE> |
|
3 |
<HEADER> |
|
4 |
<RESOURCE_IDENTIFIER value="4b8dabb8-cef7-4910-a0ad-fd8e70d53b9e_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/> |
|
5 |
<RESOURCE_TYPE value="WorkflowDSResourceType"/> |
|
6 |
<RESOURCE_KIND value="WorkflowDSResources"/> |
|
7 |
<RESOURCE_URI value=""/> |
|
8 |
<DATE_OF_CREATION value="2006-05-04T18:13:51.0Z"/> |
|
9 |
</HEADER> |
|
10 |
<BODY> |
|
11 |
<WORKFLOW_NAME>Actions to HBase</WORKFLOW_NAME> |
|
12 |
<WORKFLOW_TYPE>Data Load</WORKFLOW_TYPE> |
|
13 |
<WORKFLOW_PRIORITY>30</WORKFLOW_PRIORITY> |
|
14 |
<CONFIGURATION start="auto"> |
|
15 |
<NODE name="promoteActions" type="PromoteActions" isStart="true"> |
|
16 |
<DESCRIPTION>Promote actions</DESCRIPTION> |
|
17 |
<PARAMETERS> |
|
18 |
<PARAM function="obtainValues('actionSets', {})" required="false" type="string" name="set" managedBy="user">ALL SETS</PARAM> |
|
19 |
</PARAMETERS> |
|
20 |
<ARCS> |
|
21 |
<ARC to="success"/> |
|
22 |
</ARCS> |
|
23 |
</NODE> |
|
24 |
</CONFIGURATION> |
|
25 |
<STATUS/> |
|
26 |
</BODY> |
|
27 |
</RESOURCE_PROFILE> |
modules/dnet-openaireplus-workflows/branches/solr6/src/main/resources/eu/dnetlib/test/profiles/openaireplus/workflows/hbase/resetHbase.xml | ||
---|---|---|
1 |
<?xml version="1.0" encoding="UTF-8"?> |
|
2 |
<RESOURCE_PROFILE> |
|
3 |
<HEADER> |
|
4 |
<RESOURCE_IDENTIFIER value="ce304c65-5836-4cf0-9a48-53472b9f6f35_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/> |
|
5 |
<RESOURCE_TYPE value="WorkflowDSResourceType"/> |
|
6 |
<RESOURCE_KIND value="WorkflowDSResources"/> |
|
7 |
<RESOURCE_URI value=""/> |
|
8 |
<DATE_OF_CREATION value="2006-05-04T18:13:51.0Z"/> |
|
9 |
</HEADER> |
|
10 |
<BODY> |
|
11 |
<WORKFLOW_NAME>Reset HBase</WORKFLOW_NAME> |
|
12 |
<WORKFLOW_TYPE>Data Load</WORKFLOW_TYPE> |
|
13 |
<WORKFLOW_PRIORITY>30</WORKFLOW_PRIORITY> |
|
14 |
<CONFIGURATION start="auto"> |
|
15 |
<NODE name="checkTable" type="CheckHBaseTable" isStart="true"> |
|
16 |
<DESCRIPTION>check hbase table</DESCRIPTION> |
|
17 |
<PARAMETERS> |
|
18 |
<PARAM name="hbaseTableProperty" type="string" managedBy="system" required="true">hbase.mapred.datatable</PARAM> |
|
19 |
<PARAM name="cluster" type="string" managedBy="system" required="true">DM</PARAM> |
|
20 |
<PARAM name="tableColumnsParamName" type="string" managedBy="system" required="true">hTableColumns</PARAM> |
|
21 |
<PARAM name="existOutNode" type="string" managedBy="system" required="true">drop</PARAM> |
|
22 |
<PARAM name="dontExistOutNode" type="string" required="true" managedBy="system">define</PARAM> |
|
23 |
</PARAMETERS> |
|
24 |
<ARCS> |
|
25 |
<ARC to="drop" name="drop"/> |
|
26 |
<ARC to="define" name="define"/> |
|
27 |
</ARCS> |
|
28 |
</NODE> |
|
29 |
<NODE name="drop" type="DropHBaseTable"> |
|
30 |
<DESCRIPTION>drop hbase table</DESCRIPTION> |
|
31 |
<PARAMETERS> |
|
32 |
<PARAM name="hbaseTableProperty" type="string" managedBy="system" required="true">hbase.mapred.datatable</PARAM> |
|
33 |
<PARAM name="cluster" type="string" managedBy="system" required="true">DM</PARAM> |
|
34 |
</PARAMETERS> |
|
35 |
<ARCS> |
|
36 |
<ARC to="define"/> |
|
37 |
</ARCS> |
|
38 |
</NODE> |
|
39 |
<NODE name="define" type="DefineHBaseOpenaireSchema"> |
|
40 |
<DESCRIPTION>define OpenAIRE hbase table</DESCRIPTION> |
|
41 |
<PARAMETERS> |
|
42 |
<PARAM name="tableColumnsParamName" type="string" managedBy="system" required="true">hTableColumns</PARAM> |
|
43 |
<PARAM name="hbaseTableProperty" type="string" managedBy="system" required="true">hbase.mapred.datatable</PARAM> |
|
44 |
<PARAM name="cluster" type="string" managedBy="system" required="true">DM</PARAM> |
|
45 |
</PARAMETERS> |
|
46 |
<ARCS> |
|
47 |
<ARC to="create"/> |
|
48 |
</ARCS> |
|
49 |
</NODE> |
|
50 |
<NODE name="create" type="CreateHBaseTable"> |
|
51 |
<DESCRIPTION>create hbase table</DESCRIPTION> |
|
52 |
<PARAMETERS> |
|
53 |
<PARAM name="hbaseTableProperty" type="string" managedBy="system" required="true">hbase.mapred.datatable</PARAM> |
|
54 |
<PARAM name="cluster" type="string" managedBy="system" required="true">DM</PARAM> |
|
55 |
<PARAM name="tableColumnsParamName" type="string" managedBy="system" required="true">hTableColumns</PARAM> |
|
56 |
</PARAMETERS> |
|
57 |
<ARCS> |
|
58 |
<ARC to="success"/> |
|
59 |
</ARCS> |
|
60 |
</NODE> |
|
61 |
</CONFIGURATION> |
|
62 |
<STATUS/> |
|
63 |
</BODY> |
|
64 |
</RESOURCE_PROFILE> |
modules/dnet-openaireplus-workflows/branches/solr6/src/main/resources/eu/dnetlib/test/profiles/openaireplus/workflows/hbase/db2hbase.xml | ||
---|---|---|
1 |
<RESOURCE_PROFILE> |
|
2 |
<HEADER> |
|
3 |
<RESOURCE_IDENTIFIER value="e92d2f81-ea98-4732-a306-07da87f35033_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/> |
|
4 |
<RESOURCE_TYPE value="WorkflowDSResourceType"/> |
|
5 |
<RESOURCE_KIND value="WorkflowDSResources"/> |
|
6 |
<RESOURCE_URI value=""/> |
|
7 |
<DATE_OF_CREATION value="2006-05-04T18:13:51.0Z"/> |
|
8 |
</HEADER> |
|
9 |
<BODY> |
|
10 |
<WORKFLOW_NAME>DB to HBase</WORKFLOW_NAME> |
|
11 |
<WORKFLOW_TYPE>Data Load</WORKFLOW_TYPE> |
|
12 |
<WORKFLOW_PRIORITY>30</WORKFLOW_PRIORITY> |
|
13 |
<CONFIGURATION start="manual"> |
|
14 |
<NODE isStart="true" name="start"> |
|
15 |
<DESCRIPTION>start</DESCRIPTION> |
|
16 |
<PARAMETERS/> |
|
17 |
<ARCS> |
|
18 |
<ARC to="prepareQueryDatasources"/> |
|
19 |
</ARCS> |
|
20 |
</NODE> |
|
21 |
<NODE name="prepareQueryDatasources" type="ExecuteSql"> |
|
22 |
<DESCRIPTION>prepare query Datasources</DESCRIPTION> |
|
23 |
<PARAMETERS> |
|
24 |
<PARAM managedBy="system" name="dbProperty" required="true" type="string">dnet.openaire.db.name</PARAM> |
|
25 |
<PARAM managedBy="system" name="sql" required="true" type="string"> |
|
26 |
/eu/dnetlib/msro/openaireplus/workflows/hbase/prepareQueryDatasources.sql |
|
27 |
</PARAM> |
|
28 |
</PARAMETERS> |
|
29 |
<ARCS> |
|
30 |
<ARC to="queryDatasources"/> |
|
31 |
</ARCS> |
|
32 |
</NODE> |
|
33 |
<NODE name="queryDatasources" type="QueryDb"> |
|
34 |
<DESCRIPTION>query Datasources</DESCRIPTION> |
|
35 |
<PARAMETERS> |
|
36 |
<PARAM managedBy="system" name="dbProperty" required="true" type="string">dnet.openaire.db.name</PARAM> |
|
37 |
<PARAM managedBy="system" name="sql" required="true" type="string">/eu/dnetlib/msro/openaireplus/workflows/hbase/queryDatasources.sql |
|
38 |
</PARAM> |
|
39 |
<PARAM managedBy="system" name="sqlForSize" required="true" type="string"> |
|
40 |
/eu/dnetlib/msro/openaireplus/workflows/hbase/queryDatasourcesForSize.sql |
|
41 |
</PARAM> |
|
42 |
<PARAM managedBy="system" name="outputEprParam" required="true" type="string">dsEpr</PARAM> |
|
43 |
</PARAMETERS> |
|
44 |
<ARCS> |
|
45 |
<ARC to="storeDatasources"/> |
|
46 |
</ARCS> |
|
47 |
</NODE> |
|
48 |
<NODE name="storeDatasources" type="StoreHBase"> |
|
49 |
<DESCRIPTION>Store Datasources to HBase</DESCRIPTION> |
|
50 |
<PARAMETERS> |
|
51 |
<PARAM managedBy="system" name="inputEprParam" required="true" type="string">dsEpr</PARAM> |
|
52 |
<PARAM managedBy="system" name="hbaseTableProperty" required="true" type="string">hbase.mapred.datatable</PARAM> |
|
53 |
<PARAM managedBy="system" name="cluster" required="true" type="string">DM</PARAM> |
|
54 |
<PARAM managedBy="user" name="mapping" required="true" type="string" function="obtainValues('dbmf2hbaseMappings', {})"></PARAM> |
|
55 |
</PARAMETERS> |
|
56 |
<ARCS> |
|
57 |
<ARC to="queryDatasourceOrganization"/> |
|
58 |
</ARCS> |
|
59 |
</NODE> |
|
60 |
<NODE name="queryDatasourceOrganization" type="QueryDb"> |
|
61 |
<DESCRIPTION>query relation Datasource_Organization</DESCRIPTION> |
|
62 |
<PARAMETERS> |
|
63 |
<PARAM managedBy="system" name="dbProperty" required="true" type="string">dnet.openaire.db.name</PARAM> |
|
64 |
<PARAM managedBy="system" name="sql" required="true" type="string"> |
|
65 |
/eu/dnetlib/msro/openaireplus/workflows/hbase/queryDatasourceOrganization.sql |
|
66 |
</PARAM> |
|
67 |
<PARAM managedBy="system" name="outputEprParam" required="true" type="string">dsOrgEpr</PARAM> |
|
68 |
</PARAMETERS> |
|
69 |
<ARCS> |
|
70 |
<ARC to="storeDatasourceOrganization"/> |
|
71 |
</ARCS> |
|
72 |
</NODE> |
|
73 |
<NODE name="storeDatasourceOrganization" type="StoreHBase"> |
|
74 |
<DESCRIPTION>Store relation Datasource_Organization</DESCRIPTION> |
|
75 |
<PARAMETERS> |
|
76 |
<PARAM managedBy="system" name="inputEprParam" required="true" type="string">dsOrgEpr</PARAM> |
|
77 |
<PARAM managedBy="system" name="hbaseTableProperty" required="true" type="string">hbase.mapred.datatable</PARAM> |
|
78 |
<PARAM managedBy="system" name="cluster" required="true" type="string">DM</PARAM> |
|
79 |
<PARAM managedBy="user" name="mapping" required="true" type="string" function="obtainValues('dbmf2hbaseMappings', {})"></PARAM> |
|
80 |
</PARAMETERS> |
|
81 |
<ARCS> |
|
82 |
<ARC to="queryOrganizations"/> |
|
83 |
</ARCS> |
|
84 |
</NODE> |
|
85 |
<NODE name="queryOrganizations" type="QueryDb"> |
|
86 |
<DESCRIPTION>query Organizations</DESCRIPTION> |
|
87 |
<PARAMETERS> |
|
88 |
<PARAM managedBy="system" name="dbProperty" required="true" type="string">dnet.openaire.db.name</PARAM> |
|
89 |
<PARAM managedBy="system" name="sql" required="true" type="string">/eu/dnetlib/msro/openaireplus/workflows/hbase/queryOrganizations.sql |
|
90 |
</PARAM> |
|
91 |
<PARAM managedBy="system" name="outputEprParam" required="true" type="string">orgEpr</PARAM> |
|
92 |
</PARAMETERS> |
|
93 |
<ARCS> |
|
94 |
<ARC to="storeOrganizations"/> |
|
95 |
</ARCS> |
|
96 |
</NODE> |
|
97 |
<NODE name="storeOrganizations" type="StoreHBase"> |
|
98 |
<DESCRIPTION>Store Organizations to HBase</DESCRIPTION> |
|
99 |
<PARAMETERS> |
|
100 |
<PARAM managedBy="system" name="inputEprParam" required="true" type="string">orgEpr</PARAM> |
|
101 |
<PARAM managedBy="system" name="hbaseTableProperty" required="true" type="string">hbase.mapred.datatable</PARAM> |
|
102 |
<PARAM managedBy="system" name="cluster" required="true" type="string">DM</PARAM> |
|
103 |
<PARAM managedBy="user" name="mapping" required="true" type="string" function="obtainValues('dbmf2hbaseMappings', {})"></PARAM> |
|
104 |
</PARAMETERS> |
|
105 |
<ARCS> |
|
106 |
<ARC to="queryProjects"/> |
|
107 |
</ARCS> |
|
108 |
</NODE> |
|
109 |
<NODE name="queryProjects" type="QueryDb"> |
|
110 |
<DESCRIPTION>query Projects</DESCRIPTION> |
|
111 |
<PARAMETERS> |
|
112 |
<PARAM managedBy="system" name="dbProperty" required="true" type="string">dnet.openaire.db.name</PARAM> |
|
113 |
<PARAM managedBy="system" name="sql" required="true" type="string">/eu/dnetlib/msro/openaireplus/workflows/hbase/queryProjects.sql</PARAM> |
|
114 |
<PARAM managedBy="system" name="outputEprParam" required="true" type="string">projEpr</PARAM> |
|
115 |
</PARAMETERS> |
|
116 |
<ARCS> |
|
117 |
<ARC to="storeProjects"/> |
|
118 |
</ARCS> |
|
119 |
</NODE> |
|
120 |
<NODE name="storeProjects" type="StoreHBase"> |
|
121 |
<DESCRIPTION>Store Projects to HBase</DESCRIPTION> |
|
122 |
<PARAMETERS> |
|
123 |
<PARAM managedBy="system" name="inputEprParam" required="true" type="string">projEpr</PARAM> |
|
124 |
<PARAM managedBy="system" name="hbaseTableProperty" required="true" type="string">hbase.mapred.datatable</PARAM> |
|
125 |
<PARAM managedBy="system" name="cluster" required="true" type="string">DM</PARAM> |
|
126 |
<PARAM managedBy="user" name="mapping" required="true" type="string" function="obtainValues('dbmf2hbaseMappings', {})"></PARAM> |
|
127 |
</PARAMETERS> |
|
128 |
<ARCS> |
|
129 |
<ARC to="queryProjectOrganization"/> |
|
130 |
</ARCS> |
|
131 |
</NODE> |
|
132 |
<NODE name="queryProjectOrganization" type="QueryDb"> |
|
133 |
<DESCRIPTION>query relation Project_Organization</DESCRIPTION> |
|
134 |
<PARAMETERS> |
|
135 |
<PARAM managedBy="system" name="dbProperty" required="true" type="string">dnet.openaire.db.name</PARAM> |
|
136 |
<PARAM managedBy="system" name="sql" required="true" type="string"> |
|
137 |
/eu/dnetlib/msro/openaireplus/workflows/hbase/queryProjectOrganization.sql |
|
138 |
</PARAM> |
|
139 |
<PARAM managedBy="system" name="outputEprParam" required="true" type="string">projOrgEpr</PARAM> |
|
140 |
</PARAMETERS> |
|
141 |
<ARCS> |
|
142 |
<ARC to="storeProjectOrganization"/> |
|
143 |
</ARCS> |
|
144 |
</NODE> |
|
145 |
<NODE name="storeProjectOrganization" type="StoreHBase"> |
|
146 |
<DESCRIPTION>Store relation Project_Organization</DESCRIPTION> |
|
147 |
<PARAMETERS> |
|
148 |
<PARAM managedBy="system" name="inputEprParam" required="true" type="string">projOrgEpr</PARAM> |
|
149 |
<PARAM managedBy="system" name="hbaseTableProperty" required="true" type="string">hbase.mapred.datatable</PARAM> |
|
150 |
<PARAM managedBy="system" name="cluster" required="true" type="string">DM</PARAM> |
|
151 |
<PARAM managedBy="user" name="mapping" required="true" type="string" function="obtainValues('dbmf2hbaseMappings', {})"></PARAM> |
|
152 |
</PARAMETERS> |
|
153 |
<ARCS> |
|
154 |
<ARC to="success"/> |
|
155 |
</ARCS> |
|
156 |
</NODE> |
|
157 |
</CONFIGURATION> |
|
158 |
<STATUS> |
|
159 |
<LAST_EXECUTION_ID>wf_20140509_125739_830</LAST_EXECUTION_ID> |
|
160 |
<LAST_EXECUTION_DATE>2014-05-09T13:03:16+02:00</LAST_EXECUTION_DATE> |
|
161 |
<LAST_EXECUTION_STATUS>SUCCESS</LAST_EXECUTION_STATUS> |
|
162 |
<LAST_EXECUTION_ERROR/> |
|
163 |
<LAST_EXECUTION_OUTPUT name=""></LAST_EXECUTION_OUTPUT> |
|
164 |
</STATUS> |
|
165 |
</BODY> |
|
166 |
</RESOURCE_PROFILE> |
modules/dnet-openaireplus-workflows/branches/solr6/src/main/resources/eu/dnetlib/test/profiles/openaireplus/workflows/hbase/oaf2hbase.xml | ||
---|---|---|
1 |
<?xml version="1.0" encoding="UTF-8"?> |
|
2 |
<RESOURCE_PROFILE> |
|
3 |
<HEADER> |
|
4 |
<RESOURCE_IDENTIFIER |
|
5 |
value="c7d7d775-2db3-474d-85ab-5173a582d515_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/> |
|
6 |
<RESOURCE_TYPE value="WorkflowDSResourceType"/> |
|
7 |
<RESOURCE_KIND value="WorkflowDSResources"/> |
|
8 |
<RESOURCE_URI value=""/> |
|
9 |
<DATE_OF_CREATION value="2006-05-04T18:13:51.0Z"/> |
|
10 |
</HEADER> |
|
11 |
<BODY> |
|
12 |
<WORKFLOW_NAME>OAF to HBase</WORKFLOW_NAME> |
|
13 |
<WORKFLOW_TYPE>Data Load</WORKFLOW_TYPE> |
|
14 |
<WORKFLOW_PRIORITY>30</WORKFLOW_PRIORITY> |
|
15 |
<CONFIGURATION start="manual"> |
|
16 |
<NODE name="prepareImport" type="PrepareMDStoreImport" isStart="true"> |
|
17 |
<DESCRIPTION>Configure export to HDFS</DESCRIPTION> |
|
18 |
<PARAMETERS> |
|
19 |
<PARAM required="true" type="string" name="hdfsPathParam" managedBy="system">hdfsPath</PARAM> |
|
20 |
<PARAM required="true" type="string" name="hdfsPath" managedBy="system">/tmp/mdstores_oaf-store-cleaned.seq</PARAM> |
|
21 |
<PARAM required="true" type="string" name="xsltParam" managedBy="system">xslt</PARAM> |
|
22 |
<PARAM required="true" type="string" name="xslt" managedBy="system">/eu/dnetlib/data/transform/dmf_2_hbase.xsl</PARAM> |
|
23 |
</PARAMETERS> |
|
24 |
<ARCS> |
|
25 |
<ARC to="reuseHdfsRecords"/> |
|
26 |
</ARCS> |
|
27 |
</NODE> |
|
28 |
<NODE name="reuseHdfsRecords" type="ReuseHdfsRecords"> |
|
29 |
<DESCRIPTION>reuse mdstore records</DESCRIPTION> |
|
30 |
<PARAMETERS> |
|
31 |
<PARAM required="true" type="boolean" name="reuseMdRecords" managedBy="user">false</PARAM> |
|
32 |
</PARAMETERS> |
|
33 |
<ARCS> |
|
34 |
<ARC name="true" to="mapreduce"/> |
|
35 |
<ARC name="false" to="exportRecords"/> |
|
36 |
</ARCS> |
|
37 |
</NODE> |
|
38 |
<NODE name="exportRecords" type="MDStoreBatchExporter"> |
|
39 |
<DESCRIPTION>Fetch mdstore records</DESCRIPTION> |
|
40 |
<PARAMETERS> |
|
41 |
<PARAM required="true" type="string" name="format" managedBy="system">OAF</PARAM> |
|
42 |
<PARAM required="true" type="string" name="layout" managedBy="system">store</PARAM> |
|
43 |
<PARAM required="true" type="string" name="interpretation" managedBy="system">cleaned</PARAM> |
|
44 |
<PARAM required="true" type="string" name="outputEprParam" managedBy="system">records_epr</PARAM> |
|
45 |
</PARAMETERS> |
|
46 |
<ARCS> |
|
47 |
<ARC to="storeHdfsRecords"/> |
|
48 |
</ARCS> |
|
49 |
</NODE> |
|
50 |
<NODE name="storeHdfsRecords" type="StoreHdfsRecords"> |
|
51 |
<DESCRIPTION>Store records to HDFS</DESCRIPTION> |
|
52 |
<PARAMETERS> |
|
53 |
<PARAM required="true" type="string" name="inputEprParam" managedBy="system">records_epr</PARAM> |
|
54 |
<PARAM required="true" type="string" name="hdfsPathParam" managedBy="system">hdfsPath</PARAM> |
|
55 |
<PARAM required="true" type="string" name="cluster" managedBy="system">DM</PARAM> |
|
56 |
</PARAMETERS> |
|
57 |
<ARCS> |
|
58 |
<ARC to="mapreduce"/> |
|
59 |
</ARCS> |
|
60 |
</NODE> |
|
61 |
<NODE name="mapreduce" type="SubmitHadoopJob"> |
|
62 |
<DESCRIPTION>Run M/R import Job</DESCRIPTION> |
|
63 |
<PARAMETERS> |
|
64 |
<PARAM required="true" type="string" name="cluster" managedBy="system">DM</PARAM> |
|
65 |
<PARAM required="true" type="string" name="hadoopJob" managedBy="system">mdStoreHdfsImportJob</PARAM> |
|
66 |
<PARAM required="true" type="string" name="envParams" managedBy="system"> |
|
67 |
{ |
|
68 |
'mapred.input.dir' : 'hdfsPath', |
|
69 |
'hbase.import.xslt' : 'xslt' |
|
70 |
} |
|
71 |
</PARAM> |
|
72 |
<PARAM required="true" type="string" name="sysParams" managedBy="system"> |
|
73 |
{ |
|
74 |
'hbase.mapred.outputtable' : 'hbase.mapred.datatable' |
|
75 |
} |
|
76 |
</PARAM> |
|
77 |
<PARAM required="true" type="boolean" name="simulation" managedBy="user">false</PARAM> |
|
78 |
</PARAMETERS> |
|
79 |
<ARCS> |
|
80 |
<ARC to="success"/> |
|
81 |
</ARCS> |
|
82 |
</NODE> |
|
83 |
</CONFIGURATION> |
|
84 |
<STATUS/> |
|
85 |
</BODY> |
|
86 |
</RESOURCE_PROFILE> |
|
87 |
|
|
88 |
|
modules/dnet-openaireplus-workflows/branches/solr6/src/main/resources/eu/dnetlib/test/profiles/openaireplus/workflows/repo-hi/Aggregate_Metadata_from_AggregatorPubsRepository_Support.xml | ||
---|---|---|
1 |
<?xml version="1.0" encoding="UTF-8"?> |
|
2 |
<RESOURCE_PROFILE> |
|
3 |
<HEADER> |
|
4 |
<RESOURCE_IDENTIFIER |
|
5 |
value="1d5cb1ba-ec09-445c-9f9e-1db35b14700f_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/> |
|
6 |
<RESOURCE_TYPE value="WorkflowDSResourceType"/> |
|
7 |
<RESOURCE_KIND value="WorkflowDSResources"/> |
|
8 |
<RESOURCE_URI value=""/> |
|
9 |
<DATE_OF_CREATION value="2015-12-11T15:43:51.0Z"/> |
|
10 |
</HEADER> |
|
11 |
<BODY> |
|
12 |
<WORKFLOW_NAME>Aggregate Metadata (publications) from Aggregator::PubsRepository [Support]</WORKFLOW_NAME> |
|
13 |
<WORKFLOW_INFO> |
|
14 |
<FIELD name="Action">Aggregate Metadata</FIELD> |
|
15 |
<FIELD name="Consequence IS">Support</FIELD> |
|
16 |
<FIELD name="Datasource class">Aggregator::PubsRepository</FIELD> |
|
17 |
<FIELD name="Content">publications</FIELD> |
|
18 |
</WORKFLOW_INFO> |
|
19 |
<WORKFLOW_TYPE>REPO_HI</WORKFLOW_TYPE> |
|
20 |
<WORKFLOW_PRIORITY>20</WORKFLOW_PRIORITY> |
|
21 |
<CONFIGURATION start="manual"> |
|
22 |
<NODE name="VerifyDatasource" type="VerifyDatasource" isStart="true"> |
|
23 |
<DESCRIPTION>Verify if DS is pending</DESCRIPTION> |
|
24 |
<PARAMETERS> |
|
25 |
<PARAM name="expectedInterfaceTypologyPrefixes" managedBy="system" required="false" type="string">aggregator::pubsrepository,pubscatalogue |
|
26 |
</PARAM> |
|
27 |
<PARAM name="expectedCompliancePrefixes" managedBy="system" required="false" type="string"></PARAM> |
|
28 |
</PARAMETERS> |
|
29 |
<ARCS> |
|
30 |
<ARC to="createMetaWf"/> |
|
31 |
<ARC to="validateDs" name="validateDs"/> |
|
32 |
</ARCS> |
|
33 |
</NODE> |
|
34 |
|
|
35 |
<NODE name="validateDs" type="ValidateDatasource"> |
|
36 |
<DESCRIPTION>Validate DS</DESCRIPTION> |
|
37 |
<PARAMETERS/> |
|
38 |
<ARCS> |
|
39 |
<ARC to="createMetaWf"/> |
|
40 |
</ARCS> |
|
41 |
</NODE> |
|
42 |
|
|
43 |
<NODE name="createMetaWf" type="RegisterMetaWf"> |
|
44 |
<DESCRIPTION>Create MetaWorkflow</DESCRIPTION> |
|
45 |
<PARAMETERS> |
|
46 |
<PARAM name="wfName" managedBy="system" required="true" |
|
47 |
type="string">Aggregate Metadata (publications) from Aggregator::PubsRepository [Support] |
|
48 |
</PARAM> |
|
49 |
</PARAMETERS> |
|
50 |
<ARCS> |
|
51 |
<ARC to="createDc"/> |
|
52 |
<ARC to="createOaf"/> |
|
53 |
</ARCS> |
|
54 |
</NODE> |
|
55 |
|
|
56 |
<NODE name="createDc" type="CreateMDStore"> |
|
57 |
<DESCRIPTION>Create oai_dc store</DESCRIPTION> |
|
58 |
<PARAMETERS> |
|
59 |
<PARAM name="format" managedBy="system" required="true" type="string">oai_dc</PARAM> |
|
60 |
<PARAM name="interpretation" managedBy="system" required="true" type="string">nativesupport</PARAM> |
|
61 |
<PARAM name="layout" managedBy="system" required="true" type="string">store</PARAM> |
|
62 |
<PARAM name="outputPrefix" managedBy="system" required="true" type="string">harv_</PARAM> |
|
63 |
</PARAMETERS> |
|
64 |
<ARCS> |
|
65 |
<ARC to="updateMetaWf"/> |
|
66 |
</ARCS> |
|
67 |
</NODE> |
|
68 |
<NODE name="createOaf" type="CreateMDStore"> |
|
69 |
<DESCRIPTION>Create OAF store</DESCRIPTION> |
|
70 |
<PARAMETERS> |
|
71 |
<PARAM name="format" managedBy="system" required="true" type="string">OAF</PARAM> |
|
72 |
<PARAM name="interpretation" managedBy="system" required="true" type="string">cleanedsupport</PARAM> |
|
73 |
<PARAM name="layout" managedBy="system" required="true" type="string">store</PARAM> |
|
74 |
<PARAM name="outputPrefix" managedBy="system" required="true" type="string">tran_</PARAM> |
|
75 |
</PARAMETERS> |
|
76 |
<ARCS> |
|
77 |
<ARC to="updateMetaWf"/> |
|
78 |
</ARCS> |
|
79 |
</NODE> |
|
80 |
|
|
81 |
<NODE name="updateMetaWf" type="UpdateMetaWf" isJoin="true"> |
|
82 |
<DESCRIPTION>Update MetaWorkflow</DESCRIPTION> |
|
83 |
<PARAMETERS> |
|
84 |
<PARAM name="beanName" managedBy="system" required="true" type="string">metaWfAggregatorPubsRepositoryIngestion</PARAM> |
|
85 |
</PARAMETERS> |
|
86 |
<ARCS> |
|
87 |
<ARC to="updateMetaWfStatus"/> |
|
88 |
</ARCS> |
|
89 |
</NODE> |
|
90 |
|
|
91 |
<NODE name="updateMetaWfStatus" type="UpdateOpenaireMetaWfStatus"> |
|
92 |
<DESCRIPTION>Update MetaWorkflow Status</DESCRIPTION> |
|
93 |
<PARAMETERS/> |
|
94 |
<ARCS> |
|
95 |
<ARC to="success"/> |
|
96 |
</ARCS> |
|
97 |
</NODE> |
|
98 |
</CONFIGURATION> |
|
99 |
|
|
100 |
<STATUS/> |
|
101 |
</BODY> |
|
102 |
</RESOURCE_PROFILE> |
modules/dnet-openaireplus-workflows/branches/solr6/src/main/resources/eu/dnetlib/test/profiles/openaireplus/workflows/repo-hi/Aggregate_Metadata_from_EntityRegistry_Native.xml | ||
---|---|---|
1 |
<?xml version="1.0" encoding="UTF-8"?> |
|
2 |
<RESOURCE_PROFILE> |
|
3 |
<HEADER> |
|
4 |
<RESOURCE_IDENTIFIER |
|
5 |
value="e477ca5a-1c2b-419e-93f2-c843aa533581_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/> |
|
6 |
<RESOURCE_TYPE value="WorkflowDSResourceType"/> |
|
7 |
<RESOURCE_KIND value="WorkflowDSResources"/> |
|
8 |
<RESOURCE_URI value="value3"/> |
|
9 |
<DATE_OF_CREATION value="2006-05-04T18:13:51.0Z"/> |
|
10 |
</HEADER> |
|
11 |
<BODY> |
|
12 |
<WORKFLOW_NAME>Aggregate Metadata (datasource, organization and person entities) [Ingestion]</WORKFLOW_NAME> |
|
13 |
<WORKFLOW_INFO> |
|
14 |
<FIELD name="Action">Aggregate Metadata</FIELD> |
|
15 |
<FIELD name="Consequence IS">Ingestion</FIELD> |
|
16 |
<FIELD name="Datasource class">EntityRegistry, Aggregator</FIELD> |
|
17 |
<FIELD name="Content">datasource, organization and person entities</FIELD> |
|
18 |
</WORKFLOW_INFO> |
|
19 |
<WORKFLOW_TYPE>REPO_HI</WORKFLOW_TYPE> |
|
20 |
<WORKFLOW_PRIORITY>20</WORKFLOW_PRIORITY> |
|
21 |
<CONFIGURATION start="manual"> |
|
22 |
<NODE name="VerifyDatasource" type="VerifyDatasource" isStart="true"> |
|
23 |
<DESCRIPTION>Verify if DS is pending</DESCRIPTION> |
|
24 |
<PARAMETERS> |
|
25 |
<PARAM name="expectedInterfaceTypologyPrefixes" managedBy="system" required="false" type="string">entityregistry::repositories,aggregator::pubsrepository</PARAM> |
|
26 |
<PARAM name="expectedCompliancePrefixes" managedBy="system" required="false" type="string">native</PARAM> |
|
27 |
</PARAMETERS> |
|
28 |
<ARCS> |
|
29 |
<ARC to="createMetaWf"/> |
|
30 |
<ARC to="validateDs" name="validateDs"/> |
|
31 |
</ARCS> |
|
32 |
</NODE> |
|
33 |
|
|
34 |
<NODE name="validateDs" type="ValidateDatasource"> |
|
35 |
<DESCRIPTION>Validate DS</DESCRIPTION> |
|
36 |
<PARAMETERS/> |
|
37 |
<ARCS> |
|
38 |
<ARC to="createMetaWf"/> |
|
39 |
</ARCS> |
|
40 |
</NODE> |
|
41 |
|
|
42 |
<NODE name="createMetaWf" type="RegisterMetaWf"> |
|
43 |
<DESCRIPTION>Create MetaWorkflow</DESCRIPTION> |
|
44 |
<PARAMETERS> |
|
45 |
<PARAM name="wfName" managedBy="system" required="true" type="string">Aggregate Metadata (datasource, organization and person entities) [Ingestion]</PARAM> |
|
46 |
</PARAMETERS> |
|
47 |
<ARCS> |
|
48 |
<ARC to="createGMF"/> |
|
49 |
<ARC to="createDBMF"/> |
|
50 |
</ARCS> |
|
51 |
</NODE> |
|
52 |
|
|
53 |
<NODE name="createGMF" type="CreateMDStore"> |
|
54 |
<DESCRIPTION>Create store for native records</DESCRIPTION> |
|
55 |
<PARAMETERS> |
|
56 |
<PARAM name="format" managedBy="system" required="true" type="string">GMF</PARAM> |
|
57 |
<PARAM name="interpretation" managedBy="system" required="true" type="string">native</PARAM> |
|
58 |
<PARAM name="layout" managedBy="system" required="true" type="string">store</PARAM> |
|
59 |
<PARAM name="outputPrefix" managedBy="system" required="true" type="string">orig_</PARAM> |
|
60 |
</PARAMETERS> |
|
61 |
<ARCS> |
|
62 |
<ARC to="updateMetaWf"/> |
|
63 |
</ARCS> |
|
64 |
</NODE> |
|
65 |
<NODE name="createDBMF" type="CreateMDStore"> |
|
66 |
<DESCRIPTION>Create store for DB rows</DESCRIPTION> |
|
67 |
<PARAMETERS> |
|
68 |
<PARAM name="format" managedBy="system" required="true" type="string">DBMF</PARAM> |
|
69 |
<PARAM name="interpretation" managedBy="system" required="true" type="string">cleaned</PARAM> |
|
70 |
<PARAM name="layout" managedBy="system" required="true" type="string">store</PARAM> |
|
71 |
<PARAM name="outputPrefix" managedBy="system" required="true" type="string">row_</PARAM> |
|
72 |
</PARAMETERS> |
|
73 |
<ARCS> |
|
74 |
<ARC to="updateMetaWf"/> |
|
75 |
</ARCS> |
|
76 |
</NODE> |
|
77 |
|
|
78 |
<NODE name="updateMetaWf" type="UpdateMetaWf" isJoin="true"> |
|
79 |
<DESCRIPTION>Update MetaWorkflow</DESCRIPTION> |
|
80 |
<PARAMETERS> |
|
81 |
<PARAM name="beanName" managedBy="system" required="true" type="string">metaWfEntityRegDatasource</PARAM> |
|
82 |
</PARAMETERS> |
|
83 |
<ARCS> |
|
84 |
<ARC to="updateMetaWfStatus"/> |
|
85 |
</ARCS> |
|
86 |
</NODE> |
|
87 |
|
|
88 |
<NODE name="updateMetaWfStatus" type="UpdateOpenaireMetaWfStatus"> |
|
89 |
<DESCRIPTION>Update MetaWorkflow Status</DESCRIPTION> |
|
90 |
<PARAMETERS/> |
|
91 |
<ARCS> |
|
92 |
<ARC to="success"/> |
|
93 |
</ARCS> |
|
94 |
</NODE> |
|
95 |
</CONFIGURATION> |
|
96 |
|
|
97 |
<STATUS/> |
|
98 |
</BODY> |
|
99 |
</RESOURCE_PROFILE> |
modules/dnet-openaireplus-workflows/branches/solr6/src/main/resources/eu/dnetlib/test/profiles/openaireplus/workflows/repo-hi/Download_files_from_PubsRepository.xml | ||
---|---|---|
1 |
<?xml version="1.0" encoding="UTF-8"?> |
|
2 |
<RESOURCE_PROFILE> |
|
3 |
<HEADER> |
|
4 |
<RESOURCE_IDENTIFIER |
|
5 |
value="e08d993f-6349-4ca8-b7b6-e76914101712_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/> |
|
6 |
<RESOURCE_TYPE value="WorkflowDSResourceType"/> |
|
7 |
<RESOURCE_KIND value="WorkflowDSResources"/> |
|
8 |
<RESOURCE_URI value="value3"/> |
|
9 |
<DATE_OF_CREATION value="2006-05-04T18:13:51.0Z"/> |
|
10 |
</HEADER> |
|
11 |
<BODY> |
|
12 |
<WORKFLOW_NAME>Download Files (files) from PubsRepository [Inference]</WORKFLOW_NAME> |
|
13 |
<WORKFLOW_INFO> |
|
14 |
<FIELD name="Action">Download Files</FIELD> |
|
15 |
<FIELD name="Consequence IS">Inference</FIELD> |
|
16 |
<FIELD name="Datasource class">PubsRepository</FIELD> |
|
17 |
<FIELD name="Content">files</FIELD> |
|
18 |
</WORKFLOW_INFO> |
|
19 |
<WORKFLOW_TYPE>REPO_HI</WORKFLOW_TYPE> |
|
20 |
<WORKFLOW_PRIORITY>20</WORKFLOW_PRIORITY> |
|
21 |
<CONFIGURATION start="manual"> |
|
22 |
<NODE name="VerifyDatasource" type="VerifyDatasource" isStart="true"> |
|
23 |
<DESCRIPTION>Verify if DS is pending</DESCRIPTION> |
|
24 |
<PARAMETERS> |
|
25 |
<PARAM name="expectedInterfaceTypologyPrefixes" managedBy="system" |
|
26 |
required="false" type="string">pubsrepository, aggregator::pubsrepository |
|
27 |
</PARAM> |
|
28 |
<PARAM name="expectedCompliancePrefixes" managedBy="system" |
|
29 |
required="false" type="string">files |
|
30 |
</PARAM> |
|
31 |
</PARAMETERS> |
|
32 |
<ARCS> |
|
33 |
<ARC to="RetreiveInterfaceInfo"/> |
|
34 |
<ARC to="validateDs" name="validateDs"/> |
|
35 |
</ARCS> |
|
36 |
</NODE> |
|
37 |
|
|
38 |
<NODE name="validateDs" type="ValidateDatasource"> |
|
39 |
<DESCRIPTION>Validate DS</DESCRIPTION> |
|
40 |
<PARAMETERS/> |
|
41 |
<ARCS> |
|
42 |
<ARC to="RetreiveInterfaceInfo"/> |
|
43 |
</ARCS> |
|
44 |
</NODE> |
|
45 |
<NODE name="RetreiveInterfaceInfo" type="RetreiveInterfaceInfo"> |
|
46 |
<DESCRIPTION>Retrieve Interface Info</DESCRIPTION> |
|
47 |
<PARAMETERS/> |
|
48 |
<ARCS> |
|
49 |
<ARC to="createMetaWf"/> |
|
50 |
</ARCS> |
|
51 |
</NODE> |
|
52 |
|
|
53 |
<NODE name="createMetaWf" type="RegisterMetaWf"> |
|
54 |
<DESCRIPTION>Create MetaWorkflow</DESCRIPTION> |
|
55 |
<PARAMETERS> |
|
56 |
<PARAM name="wfName" managedBy="system" required="true" type="string">Download Files (files) from PubsRepository [Inference]</PARAM> |
|
57 |
<PARAM name="adminEmail" managedBy="system" required="false" type="string">openaire-fulltexts@openaire.eu</PARAM> |
|
58 |
</PARAMETERS> |
|
59 |
<ARCS> |
|
60 |
<ARC to="createObjectStore"/> |
|
61 |
</ARCS> |
|
62 |
</NODE> |
|
63 |
<NODE name="createObjectStore" type="CreateObjectStore"> |
|
64 |
<DESCRIPTION>Create Object store</DESCRIPTION> |
|
65 |
<PARAMETERS> |
|
66 |
<PARAM name="interpretation" managedBy="system" required="true" |
|
67 |
type="string">pubrepository record |
|
68 |
</PARAM> |
|
69 |
<PARAM name="outputPrefix" managedBy="system" required="true" |
|
70 |
type="string">objs_ |
|
71 |
</PARAM> |
|
72 |
</PARAMETERS> |
|
73 |
<ARCS> |
|
74 |
<ARC to="updateMetaWf"/> |
|
75 |
</ARCS> |
|
76 |
</NODE> |
|
77 |
|
|
78 |
<NODE name="updateMetaWf" type="UpdateMetaWf" isJoin="true"> |
|
79 |
<DESCRIPTION>Update MetaWorkflow</DESCRIPTION> |
|
80 |
<PARAMETERS> |
|
81 |
<PARAM name="beanName" managedBy="system" required="true" |
|
82 |
type="string">metaWfPubRepositoryFiles |
|
83 |
</PARAM> |
|
84 |
</PARAMETERS> |
|
85 |
<ARCS> |
|
86 |
<ARC to="updateMetaWfStatus"/> |
|
87 |
</ARCS> |
|
88 |
</NODE> |
|
89 |
|
|
90 |
<NODE name="updateMetaWfStatus" type="UpdateOpenaireMetaWfStatus"> |
|
91 |
<DESCRIPTION>Update MetaWorkflow Status</DESCRIPTION> |
|
92 |
<PARAMETERS/> |
|
93 |
<ARCS> |
|
94 |
<ARC to="success"/> |
|
95 |
</ARCS> |
|
96 |
</NODE> |
|
97 |
</CONFIGURATION> |
|
98 |
|
|
99 |
<STATUS/> |
|
100 |
</BODY> |
|
101 |
</RESOURCE_PROFILE> |
modules/dnet-openaireplus-workflows/branches/solr6/src/main/resources/eu/dnetlib/test/profiles/openaireplus/workflows/repo-hi/Fill_HostedbyMap_journal_intersection.xml | ||
---|---|---|
1 |
<?xml version="1.0" encoding="UTF-8"?> |
|
2 |
<RESOURCE_PROFILE> |
|
3 |
<HEADER> |
|
4 |
<RESOURCE_IDENTIFIER |
|
5 |
value="2ffee4a5-2f5a-40b3-9e49-e4caab7784f4_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/> |
|
6 |
<RESOURCE_TYPE value="WorkflowDSResourceType"/> |
|
7 |
<RESOURCE_KIND value="WorkflowDSResources"/> |
|
8 |
<RESOURCE_URI value="value3"/> |
|
9 |
<DATE_OF_CREATION value="2006-05-04T18:13:51.0Z"/> |
|
10 |
</HEADER> |
|
11 |
<BODY> |
|
12 |
<WORKFLOW_NAME>Fill hostedBy-Map (ISSNs in DOAJ) from PANGAEA [Context]</WORKFLOW_NAME> |
|
13 |
<WORKFLOW_INFO> |
|
14 |
<FIELD name="Action">Fill hostedBy-Map</FIELD> |
|
15 |
<FIELD name="Consequence IS">Context</FIELD> |
|
16 |
<FIELD name="Datasource class">PANGAEA</FIELD> |
|
17 |
<FIELD name="Content">ISSNs</FIELD> |
|
18 |
</WORKFLOW_INFO> |
|
19 |
<WORKFLOW_TYPE>REPO_HI</WORKFLOW_TYPE> |
|
20 |
<WORKFLOW_PRIORITY>20</WORKFLOW_PRIORITY> |
|
21 |
<CONFIGURATION start="manual"> |
|
22 |
<NODE name="VerifyDatasource" type="VerifyDatasource" isStart="true"> |
|
23 |
<DESCRIPTION>Verify if DS is pending</DESCRIPTION> |
|
24 |
<PARAMETERS> |
|
25 |
<PARAM name="expectedInterfaceTypologyPrefixes" managedBy="system" required="false" type="string">datarepository::unknown</PARAM> |
|
26 |
<PARAM name="expectedCompliancePrefixes" managedBy="system" required="false" type="string">native</PARAM> |
|
27 |
</PARAMETERS> |
|
28 |
<ARCS> |
|
29 |
<ARC to="createMetaWf"/> |
|
30 |
<ARC to="validateDs" name="validateDs"/> |
|
31 |
</ARCS> |
|
32 |
</NODE> |
|
33 |
|
|
34 |
<NODE name="validateDs" type="ValidateDatasource"> |
|
35 |
<DESCRIPTION>Validate DS</DESCRIPTION> |
|
36 |
<PARAMETERS/> |
|
37 |
<ARCS> |
|
38 |
<ARC to="createMetaWf"/> |
|
39 |
</ARCS> |
|
40 |
</NODE> |
|
41 |
|
|
42 |
<NODE name="createMetaWf" type="RegisterMetaWf"> |
|
43 |
<DESCRIPTION>Create MetaWorkflow</DESCRIPTION> |
|
44 |
<PARAMETERS> |
|
45 |
<PARAM name="wfName" managedBy="system" required="true" type="string">Fill hostedBy-Map (ISSNs in DOAJ) from PANGAEA [Context]</PARAM> |
|
46 |
</PARAMETERS> |
|
47 |
<ARCS> |
|
48 |
<ARC to="updateMetaWf"/> |
|
49 |
</ARCS> |
|
50 |
</NODE> |
|
51 |
|
|
52 |
<NODE name="updateMetaWf" type="UpdateMetaWf"> |
|
53 |
<DESCRIPTION>Update MetaWorkflow</DESCRIPTION> |
|
54 |
<PARAMETERS> |
|
55 |
<PARAM name="beanName" managedBy="system" required="true" type="string">metaWfHostedByMapJournalIntersection</PARAM> |
|
56 |
</PARAMETERS> |
|
57 |
<ARCS> |
|
58 |
<ARC to="updateMetaWfStatus"/> |
|
59 |
</ARCS> |
|
60 |
</NODE> |
|
61 |
|
|
62 |
<NODE name="updateMetaWfStatus" type="UpdateOpenaireMetaWfStatus"> |
|
63 |
<DESCRIPTION>Update MetaWorkflow Status</DESCRIPTION> |
|
64 |
<PARAMETERS/> |
|
65 |
<ARCS> |
|
66 |
<ARC to="success"/> |
|
67 |
</ARCS> |
|
68 |
</NODE> |
|
69 |
</CONFIGURATION> |
|
70 |
<STATUS/> |
|
71 |
</BODY> |
|
72 |
</RESOURCE_PROFILE> |
modules/dnet-openaireplus-workflows/branches/solr6/src/main/resources/eu/dnetlib/test/profiles/openaireplus/workflows/repo-hi/Fill_HostedbyMap_oaisets.xml | ||
---|---|---|
1 |
<?xml version="1.0" encoding="UTF-8"?> |
|
2 |
<RESOURCE_PROFILE> |
|
3 |
<HEADER> |
|
4 |
<RESOURCE_IDENTIFIER |
|
5 |
value="24e64dae-9990-45a3-a209-61bccfb3ef1e_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/> |
|
6 |
<RESOURCE_TYPE value="WorkflowDSResourceType"/> |
|
7 |
<RESOURCE_KIND value="WorkflowDSResources"/> |
|
8 |
<RESOURCE_URI value="value3"/> |
|
9 |
<DATE_OF_CREATION value="2006-05-04T18:13:51.0Z"/> |
|
10 |
</HEADER> |
|
11 |
<BODY> |
|
12 |
<WORKFLOW_NAME>Fill hostedBy-Map (OAI-PMH sets in DataRepositories) from DataCite [Context]</WORKFLOW_NAME> |
|
13 |
<WORKFLOW_INFO> |
|
14 |
<FIELD name="Action">Fill hostedBy-Map</FIELD> |
|
15 |
<FIELD name="Consequence IS">Context</FIELD> |
|
16 |
<FIELD name="Datasource class">DataCite</FIELD> |
|
17 |
<FIELD name="Content">OAI-PMH sets in DataRepositories</FIELD> |
|
18 |
</WORKFLOW_INFO> |
|
19 |
<WORKFLOW_TYPE>REPO_HI</WORKFLOW_TYPE> |
|
20 |
<WORKFLOW_PRIORITY>20</WORKFLOW_PRIORITY> |
|
21 |
<CONFIGURATION start="manual"> |
|
22 |
<NODE name="VerifyDatasource" type="VerifyDatasource" isStart="true"> |
|
23 |
<DESCRIPTION>Verify if DS is pending</DESCRIPTION> |
|
24 |
<PARAMETERS> |
|
25 |
<PARAM name="expectedInterfaceTypologyPrefixes" managedBy="system" required="false" type="string">aggregator::datarepository</PARAM> |
|
26 |
<PARAM name="expectedCompliancePrefixes" managedBy="system" required="false" type="string">native</PARAM> |
|
27 |
</PARAMETERS> |
|
28 |
<ARCS> |
|
29 |
<ARC to="createMetaWf"/> |
|
30 |
<ARC to="validateDs" name="validateDs"/> |
|
31 |
</ARCS> |
|
32 |
</NODE> |
|
33 |
|
|
34 |
<NODE name="validateDs" type="ValidateDatasource"> |
|
35 |
<DESCRIPTION>Validate DS</DESCRIPTION> |
|
36 |
<PARAMETERS/> |
|
37 |
<ARCS> |
|
38 |
<ARC to="createMetaWf"/> |
|
39 |
</ARCS> |
|
40 |
</NODE> |
|
41 |
|
|
42 |
<NODE name="createMetaWf" type="RegisterMetaWf"> |
|
43 |
<DESCRIPTION>Create MetaWorkflow</DESCRIPTION> |
|
44 |
<PARAMETERS> |
|
45 |
<PARAM name="wfName" managedBy="system" required="true" type="string">Fill hostedBy-Map (OAI-PMH sets in DataRepositories) from DataCite [Context]</PARAM> |
|
46 |
</PARAMETERS> |
|
47 |
<ARCS> |
|
48 |
<ARC to="createGMF"/> |
|
49 |
<ARC to="createDBMF"/> |
|
50 |
</ARCS> |
|
51 |
</NODE> |
|
52 |
|
|
53 |
<NODE name="createGMF" type="CreateMDStore"> |
|
54 |
<DESCRIPTION>Create store for native records</DESCRIPTION> |
|
55 |
<PARAMETERS> |
|
56 |
<PARAM name="format" managedBy="system" required="true" type="string">GMF</PARAM> |
|
57 |
<PARAM name="interpretation" managedBy="system" required="true" type="string">native</PARAM> |
|
58 |
<PARAM name="layout" managedBy="system" required="true" type="string">store</PARAM> |
|
59 |
<PARAM name="outputPrefix" managedBy="system" required="true" type="string">orig_</PARAM> |
|
60 |
</PARAMETERS> |
|
61 |
<ARCS> |
|
62 |
<ARC to="updateMetaWf"/> |
|
63 |
</ARCS> |
|
64 |
</NODE> |
|
65 |
<NODE name="createDBMF" type="CreateMDStore"> |
|
66 |
<DESCRIPTION>Create store for DB rows</DESCRIPTION> |
|
67 |
<PARAMETERS> |
|
68 |
<PARAM name="format" managedBy="system" required="true" type="string">DBMF</PARAM> |
|
69 |
<PARAM name="interpretation" managedBy="system" required="true" type="string">cleaned</PARAM> |
|
70 |
<PARAM name="layout" managedBy="system" required="true" type="string">store</PARAM> |
|
71 |
<PARAM name="outputPrefix" managedBy="system" required="true" type="string">row_</PARAM> |
|
72 |
</PARAMETERS> |
|
73 |
<ARCS> |
|
74 |
<ARC to="updateMetaWf"/> |
|
75 |
</ARCS> |
|
76 |
</NODE> |
|
77 |
|
|
78 |
<NODE name="updateMetaWf" type="UpdateMetaWf" isJoin="true"> |
|
79 |
<DESCRIPTION>Update MetaWorkflow</DESCRIPTION> |
|
80 |
<PARAMETERS> |
|
81 |
<PARAM name="beanName" managedBy="system" required="true" type="string">metaWfAggrDatarepoOaiSets</PARAM> |
|
82 |
</PARAMETERS> |
|
83 |
<ARCS> |
|
84 |
<ARC to="updateMetaWfStatus"/> |
|
85 |
</ARCS> |
|
86 |
</NODE> |
|
87 |
|
|
88 |
<NODE name="updateMetaWfStatus" type="UpdateOpenaireMetaWfStatus"> |
|
89 |
<DESCRIPTION>Update MetaWorkflow Status</DESCRIPTION> |
|
90 |
<PARAMETERS/> |
|
91 |
<ARCS> |
|
92 |
<ARC to="success"/> |
|
93 |
</ARCS> |
|
94 |
</NODE> |
|
95 |
</CONFIGURATION> |
|
96 |
|
|
97 |
<STATUS/> |
|
98 |
</BODY> |
|
99 |
</RESOURCE_PROFILE> |
modules/dnet-openaireplus-workflows/branches/solr6/src/main/resources/eu/dnetlib/test/profiles/openaireplus/workflows/repo-hi/Aggregate_Metadata_from_CordaH2020Projects_Native.xml | ||
---|---|---|
1 |
<?xml version="1.0" encoding="UTF-8"?> |
|
2 |
<RESOURCE_PROFILE> |
|
3 |
<HEADER> |
|
4 |
<RESOURCE_IDENTIFIER |
|
5 |
value="5c2abfcc-4f0c-4229-aa42-75ac8bac3b68_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/> |
|
6 |
<RESOURCE_TYPE value="WorkflowDSResourceType"/> |
|
7 |
<RESOURCE_KIND value="WorkflowDSResources"/> |
|
8 |
<RESOURCE_URI value="value3"/> |
|
9 |
<DATE_OF_CREATION value="2017-02-28T18:13:51.0Z"/> |
|
10 |
</HEADER> |
|
11 |
<BODY> |
|
12 |
<WORKFLOW_NAME>EC H2020 Aggregate Projects, Fundings and Contexts [Ingestion]</WORKFLOW_NAME> |
|
13 |
<WORKFLOW_INFO> |
|
14 |
<FIELD name="Action">Aggregate Metadata</FIELD> |
|
15 |
<FIELD name="Consequence IS">Ingestion</FIELD> |
|
16 |
<FIELD name="Datasource class">EntityRegistry</FIELD> |
|
17 |
<FIELD name="Content">project, organization, person, funding, context</FIELD> |
|
18 |
</WORKFLOW_INFO> |
|
19 |
<WORKFLOW_TYPE>REPO_HI</WORKFLOW_TYPE> |
|
20 |
<WORKFLOW_PRIORITY>20</WORKFLOW_PRIORITY> |
|
21 |
<CONFIGURATION start="manual"> |
|
22 |
<NODE name="VerifyDatasource" type="VerifyDatasource" isStart="true"> |
|
23 |
<DESCRIPTION>Verify if DS is pending</DESCRIPTION> |
|
24 |
<PARAMETERS> |
|
25 |
<PARAM name="expectedInterfaceTypologyPrefixes" managedBy="system" required="false" type="string">entityregistry::projects</PARAM> |
|
26 |
<PARAM name="expectedCompliancePrefixes" managedBy="system" required="false" type="string">native</PARAM> |
|
27 |
</PARAMETERS> |
|
28 |
<ARCS> |
|
29 |
<ARC to="createMetaWf"/> |
|
30 |
<ARC to="validateDs" name="validateDs"/> |
|
31 |
</ARCS> |
|
32 |
</NODE> |
|
33 |
|
|
34 |
<NODE name="validateDs" type="ValidateDatasource"> |
|
35 |
<DESCRIPTION>Validate DS</DESCRIPTION> |
|
36 |
<PARAMETERS/> |
|
37 |
<ARCS> |
|
38 |
<ARC to="createMetaWf"/> |
|
39 |
</ARCS> |
|
40 |
</NODE> |
|
41 |
|
|
42 |
<NODE name="createMetaWf" type="RegisterMetaWf"> |
|
43 |
<DESCRIPTION>Create MetaWorkflow</DESCRIPTION> |
|
44 |
<PARAMETERS> |
|
45 |
<PARAM name="wfName" managedBy="system" required="true" type="string">EC H2020 Aggregate Projects, Fundings and Contexts [Ingestion]</PARAM> |
|
46 |
</PARAMETERS> |
|
47 |
<ARCS> |
|
48 |
<ARC to="createGMF"/> |
|
49 |
<ARC to="createDBMF"/> |
|
50 |
</ARCS> |
|
51 |
</NODE> |
|
52 |
|
|
53 |
<NODE name="createGMF" type="CreateMDStore"> |
|
54 |
<DESCRIPTION>Create store for native records</DESCRIPTION> |
|
55 |
<PARAMETERS> |
|
56 |
<PARAM name="format" managedBy="system" required="true" type="string">GMF</PARAM> |
|
57 |
<PARAM name="interpretation" managedBy="system" required="true" type="string">native</PARAM> |
|
58 |
<PARAM name="layout" managedBy="system" required="true" type="string">store</PARAM> |
|
59 |
<PARAM name="outputPrefix" managedBy="system" required="true" type="string">orig_</PARAM> |
|
60 |
</PARAMETERS> |
|
61 |
<ARCS> |
|
62 |
<ARC to="updateMetaWf"/> |
|
63 |
</ARCS> |
|
64 |
</NODE> |
|
65 |
<NODE name="createDBMF" type="CreateMDStore"> |
|
66 |
<DESCRIPTION>Create store for DB rows</DESCRIPTION> |
|
67 |
<PARAMETERS> |
|
68 |
<PARAM name="format" managedBy="system" required="true" type="string">DBMF</PARAM> |
|
69 |
<PARAM name="interpretation" managedBy="system" required="true" type="string">cleaned</PARAM> |
|
70 |
<PARAM name="layout" managedBy="system" required="true" type="string">store</PARAM> |
|
71 |
<PARAM name="outputPrefix" managedBy="system" required="true" type="string">row_</PARAM> |
|
72 |
</PARAMETERS> |
|
73 |
<ARCS> |
|
74 |
<ARC to="updateMetaWf"/> |
|
75 |
</ARCS> |
|
76 |
</NODE> |
|
77 |
|
|
78 |
<NODE name="updateMetaWf" type="UpdateMetaWf" isJoin="true"> |
|
79 |
<DESCRIPTION>Update MetaWorkflow</DESCRIPTION> |
|
80 |
<PARAMETERS> |
|
81 |
<PARAM name="beanName" managedBy="system" required="true" type="string">metaWfH2020Projects</PARAM> |
|
82 |
</PARAMETERS> |
|
83 |
<ARCS> |
|
84 |
<ARC to="updateMetaWfStatus"/> |
|
85 |
</ARCS> |
|
86 |
</NODE> |
|
87 |
|
|
88 |
<NODE name="updateMetaWfStatus" type="UpdateOpenaireMetaWfStatus"> |
|
89 |
<DESCRIPTION>Update MetaWorkflow Status</DESCRIPTION> |
|
90 |
<PARAMETERS/> |
|
91 |
<ARCS> |
|
92 |
<ARC to="success"/> |
|
93 |
</ARCS> |
|
94 |
</NODE> |
|
95 |
</CONFIGURATION> |
|
96 |
|
|
97 |
<STATUS/> |
|
98 |
</BODY> |
|
99 |
</RESOURCE_PROFILE> |
modules/dnet-openaireplus-workflows/branches/solr6/src/main/resources/eu/dnetlib/test/profiles/openaireplus/workflows/repo-hi/Aggregate_Metadata_from_EntityRegistryProjects_Native.xml | ||
---|---|---|
1 |
<?xml version="1.0" encoding="UTF-8"?> |
|
2 |
<RESOURCE_PROFILE> |
|
3 |
<HEADER> |
|
4 |
<RESOURCE_IDENTIFIER |
|
5 |
value="a720c644-0c03-4c5d-b94d-503ea9f42b1b_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/> |
|
6 |
<RESOURCE_TYPE value="WorkflowDSResourceType"/> |
|
7 |
<RESOURCE_KIND value="WorkflowDSResources"/> |
|
8 |
<RESOURCE_URI value="value3"/> |
|
9 |
<DATE_OF_CREATION value="2006-05-04T18:13:51.0Z"/> |
|
10 |
</HEADER> |
|
11 |
<BODY> |
|
12 |
<WORKFLOW_NAME>Aggregate Projects, Fundings and Contextes [Ingestion]</WORKFLOW_NAME> |
|
13 |
<WORKFLOW_INFO> |
|
14 |
<FIELD name="Action">Aggregate Metadata</FIELD> |
|
15 |
<FIELD name="Consequence IS">Ingestion</FIELD> |
|
16 |
<FIELD name="Datasource class">EntityRegistry, Aggregator</FIELD> |
|
17 |
<FIELD name="Content">project, organization, person, funding, context</FIELD> |
|
18 |
</WORKFLOW_INFO> |
|
19 |
<WORKFLOW_TYPE>REPO_HI</WORKFLOW_TYPE> |
|
20 |
<WORKFLOW_PRIORITY>20</WORKFLOW_PRIORITY> |
|
21 |
<CONFIGURATION start="manual"> |
|
22 |
<NODE name="VerifyDatasource" type="VerifyDatasource" isStart="true"> |
|
23 |
<DESCRIPTION>Verify if DS is pending</DESCRIPTION> |
|
24 |
<PARAMETERS> |
|
25 |
<PARAM name="expectedInterfaceTypologyPrefixes" managedBy="system" required="false" type="string">entityregistry::projects</PARAM> |
|
26 |
<PARAM name="expectedCompliancePrefixes" managedBy="system" required="false" type="string">native</PARAM> |
|
27 |
</PARAMETERS> |
|
28 |
<ARCS> |
|
29 |
<ARC to="createMetaWf"/> |
|
30 |
<ARC to="validateDs" name="validateDs"/> |
|
31 |
</ARCS> |
|
32 |
</NODE> |
|
33 |
|
|
34 |
<NODE name="validateDs" type="ValidateDatasource"> |
|
35 |
<DESCRIPTION>Validate DS</DESCRIPTION> |
|
36 |
<PARAMETERS/> |
|
37 |
<ARCS> |
|
38 |
<ARC to="createMetaWf"/> |
|
39 |
</ARCS> |
|
40 |
</NODE> |
|
41 |
|
|
42 |
<NODE name="createMetaWf" type="RegisterMetaWf"> |
|
43 |
<DESCRIPTION>Create MetaWorkflow</DESCRIPTION> |
|
44 |
<PARAMETERS> |
|
45 |
<PARAM name="wfName" managedBy="system" required="true" type="string">Aggregate Projects, Fundings and Contextes [Ingestion]</PARAM> |
|
46 |
</PARAMETERS> |
|
47 |
<ARCS> |
|
48 |
<ARC to="createGMF"/> |
|
49 |
<ARC to="createDBMF"/> |
|
50 |
</ARCS> |
|
51 |
</NODE> |
|
52 |
|
|
53 |
<NODE name="createGMF" type="CreateMDStore"> |
|
54 |
<DESCRIPTION>Create store for native records</DESCRIPTION> |
|
55 |
<PARAMETERS> |
|
56 |
<PARAM name="format" managedBy="system" required="true" type="string">GMF</PARAM> |
|
57 |
<PARAM name="interpretation" managedBy="system" required="true" type="string">native</PARAM> |
|
58 |
<PARAM name="layout" managedBy="system" required="true" type="string">store</PARAM> |
|
59 |
<PARAM name="outputPrefix" managedBy="system" required="true" type="string">orig_</PARAM> |
|
60 |
</PARAMETERS> |
|
61 |
<ARCS> |
|
62 |
<ARC to="updateMetaWf"/> |
|
63 |
</ARCS> |
|
64 |
</NODE> |
|
65 |
<NODE name="createDBMF" type="CreateMDStore"> |
|
66 |
<DESCRIPTION>Create store for DB rows</DESCRIPTION> |
|
67 |
<PARAMETERS> |
|
68 |
<PARAM name="format" managedBy="system" required="true" type="string">DBMF</PARAM> |
|
69 |
<PARAM name="interpretation" managedBy="system" required="true" type="string">cleaned</PARAM> |
|
70 |
<PARAM name="layout" managedBy="system" required="true" type="string">store</PARAM> |
|
71 |
<PARAM name="outputPrefix" managedBy="system" required="true" type="string">row_</PARAM> |
|
72 |
</PARAMETERS> |
|
73 |
<ARCS> |
|
74 |
<ARC to="updateMetaWf"/> |
|
75 |
</ARCS> |
|
76 |
</NODE> |
|
77 |
|
|
78 |
<NODE name="updateMetaWf" type="UpdateMetaWf" isJoin="true"> |
|
79 |
<DESCRIPTION>Update MetaWorkflow</DESCRIPTION> |
|
80 |
<PARAMETERS> |
|
81 |
<PARAM name="beanName" managedBy="system" required="true" type="string">metaWfEntityRegProjects</PARAM> |
|
82 |
</PARAMETERS> |
|
83 |
<ARCS> |
|
84 |
<ARC to="updateMetaWfStatus"/> |
|
85 |
</ARCS> |
|
86 |
</NODE> |
|
87 |
|
|
88 |
<NODE name="updateMetaWfStatus" type="UpdateOpenaireMetaWfStatus"> |
|
89 |
<DESCRIPTION>Update MetaWorkflow Status</DESCRIPTION> |
|
90 |
<PARAMETERS/> |
|
91 |
<ARCS> |
|
92 |
<ARC to="success"/> |
|
93 |
</ARCS> |
|
94 |
</NODE> |
|
95 |
</CONFIGURATION> |
|
96 |
|
|
97 |
<STATUS/> |
|
98 |
</BODY> |
|
99 |
</RESOURCE_PROFILE> |
modules/dnet-openaireplus-workflows/branches/solr6/src/main/resources/eu/dnetlib/test/profiles/openaireplus/workflows/repo-hi/Extract_Contexts_from_EntityRegistry_Native.xml | ||
---|---|---|
1 |
<?xml version="1.0" encoding="UTF-8"?> |
|
2 |
<RESOURCE_PROFILE> |
|
3 |
<HEADER> |
|
4 |
<RESOURCE_IDENTIFIER |
|
5 |
value="fa0b0a7b-383d-40d5-a3ef-5605b3e62f26_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/> |
|
6 |
<RESOURCE_TYPE value="WorkflowDSResourceType"/> |
|
7 |
<RESOURCE_KIND value="WorkflowDSResources"/> |
|
8 |
<RESOURCE_URI value="value3"/> |
|
9 |
<DATE_OF_CREATION value="2013-03-03T11:13:51.0Z"/> |
|
10 |
</HEADER> |
|
11 |
<BODY> |
|
12 |
<WORKFLOW_NAME>[DEPRECATED] Aggregate project contexts from EntityRegistry [Ingestion]</WORKFLOW_NAME> |
|
13 |
<WORKFLOW_INFO> |
|
14 |
<FIELD name="Action">Aggregate contexts</FIELD> |
|
15 |
<FIELD name="Consequence IS">Ingestion</FIELD> |
|
16 |
<FIELD name="Datasource class">EntityRegistry</FIELD> |
|
17 |
<FIELD name="Content">project contexts</FIELD> |
|
18 |
</WORKFLOW_INFO> |
|
19 |
<WORKFLOW_TYPE>REPO_HI</WORKFLOW_TYPE> |
|
20 |
<WORKFLOW_PRIORITY>20</WORKFLOW_PRIORITY> |
|
21 |
<CONFIGURATION start="manual"> |
|
22 |
<NODE name="VerifyDatasource" type="VerifyDatasource" isStart="true"> |
|
23 |
<DESCRIPTION>Verify if DS is pending</DESCRIPTION> |
|
24 |
<PARAMETERS> |
|
25 |
<PARAM name="expectedInterfaceTypologyPrefixes" managedBy="system" required="false" type="string">entityregistry::projects</PARAM> |
|
26 |
<PARAM name="expectedCompliancePrefixes" managedBy="system" required="false" type="string">native</PARAM> |
|
27 |
</PARAMETERS> |
|
28 |
<ARCS> |
|
29 |
<ARC to="createMetaWf"/> |
|
30 |
<ARC to="validateDs" name="validateDs"/> |
|
31 |
</ARCS> |
|
32 |
</NODE> |
|
33 |
|
|
34 |
<NODE name="validateDs" type="ValidateDatasource"> |
|
35 |
<DESCRIPTION>Validate DS</DESCRIPTION> |
|
36 |
<PARAMETERS/> |
|
37 |
<ARCS> |
|
38 |
<ARC to="createMetaWf"/> |
|
39 |
</ARCS> |
|
40 |
</NODE> |
|
41 |
|
|
42 |
<NODE name="createMetaWf" type="RegisterMetaWf"> |
|
43 |
<DESCRIPTION>Create MetaWorkflow</DESCRIPTION> |
|
44 |
<PARAMETERS> |
|
45 |
<PARAM name="wfName" managedBy="system" required="true" type="string">Aggregate project contexts from EntityRegistry [Ingestion]</PARAM> |
|
46 |
</PARAMETERS> |
|
47 |
<ARCS> |
|
48 |
<ARC to="updateMetaWf"/> |
|
49 |
</ARCS> |
|
50 |
</NODE> |
|
51 |
|
|
52 |
<NODE name="updateMetaWf" type="UpdateMetaWf" isJoin="true"> |
|
53 |
<DESCRIPTION>Update MetaWorkflow</DESCRIPTION> |
|
54 |
<PARAMETERS> |
|
55 |
<PARAM name="beanName" managedBy="system" required="true" type="string">metaWfContextsEntityReg</PARAM> |
|
56 |
</PARAMETERS> |
|
57 |
<ARCS> |
|
58 |
<ARC to="updateMetaWfStatus"/> |
|
59 |
</ARCS> |
|
60 |
</NODE> |
|
61 |
|
|
62 |
<NODE name="updateMetaWfStatus" type="UpdateOpenaireMetaWfStatus"> |
|
63 |
<DESCRIPTION>Update MetaWorkflow Status</DESCRIPTION> |
|
64 |
<PARAMETERS/> |
|
65 |
<ARCS> |
|
66 |
<ARC to="success"/> |
|
67 |
</ARCS> |
|
68 |
</NODE> |
|
69 |
</CONFIGURATION> |
|
70 |
|
|
71 |
<STATUS/> |
|
72 |
</BODY> |
|
73 |
</RESOURCE_PROFILE> |
modules/dnet-openaireplus-workflows/branches/solr6/src/main/resources/eu/dnetlib/test/profiles/openaireplus/workflows/repo-hi/Fill_HostedbyMap_journal.xml | ||
---|---|---|
1 |
<?xml version="1.0" encoding="UTF-8"?> |
|
2 |
<RESOURCE_PROFILE> |
|
3 |
<HEADER> |
|
4 |
<RESOURCE_IDENTIFIER |
|
5 |
value="3671f84d-177b-4732-b795-8d8ed8603964_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/> |
|
6 |
<RESOURCE_TYPE value="WorkflowDSResourceType"/> |
|
7 |
<RESOURCE_KIND value="WorkflowDSResources"/> |
|
8 |
<RESOURCE_URI value="value3"/> |
|
9 |
<DATE_OF_CREATION value="2006-05-04T18:13:51.0Z"/> |
|
10 |
</HEADER> |
|
11 |
<BODY> |
|
12 |
<WORKFLOW_NAME>Fill hostedBy-Map (ISSNs) [Context]</WORKFLOW_NAME> |
|
13 |
<WORKFLOW_INFO> |
|
14 |
<FIELD name="Action">Fill hostedBy-Map</FIELD> |
|
15 |
<FIELD name="Consequence IS">Context</FIELD> |
|
16 |
<FIELD name="Datasource class">EntityRegistry, Aggregator</FIELD> |
|
17 |
<FIELD name="Content">ISSNs</FIELD> |
|
18 |
</WORKFLOW_INFO> |
|
19 |
<WORKFLOW_TYPE>REPO_HI</WORKFLOW_TYPE> |
|
20 |
<WORKFLOW_PRIORITY>20</WORKFLOW_PRIORITY> |
|
21 |
<CONFIGURATION start="manual"> |
|
22 |
<NODE name="VerifyDatasource" type="VerifyDatasource" isStart="true"> |
|
23 |
<DESCRIPTION>Verify if DS is pending</DESCRIPTION> |
|
24 |
<PARAMETERS> |
|
25 |
<PARAM name="expectedInterfaceTypologyPrefixes" managedBy="system" required="false" type="string">entityregistry,aggregator::pubsrepository</PARAM> |
|
26 |
<PARAM name="expectedCompliancePrefixes" managedBy="system" required="false" type="string">native</PARAM> |
|
27 |
</PARAMETERS> |
|
28 |
<ARCS> |
|
29 |
<ARC to="createMetaWf"/> |
|
30 |
<ARC to="validateDs" name="validateDs"/> |
|
31 |
</ARCS> |
|
32 |
</NODE> |
|
33 |
|
|
34 |
<NODE name="validateDs" type="ValidateDatasource"> |
|
35 |
<DESCRIPTION>Validate DS</DESCRIPTION> |
|
36 |
<PARAMETERS/> |
|
37 |
<ARCS> |
|
38 |
<ARC to="createMetaWf"/> |
|
39 |
</ARCS> |
|
40 |
</NODE> |
|
41 |
|
|
42 |
<NODE name="createMetaWf" type="RegisterMetaWf"> |
|
43 |
<DESCRIPTION>Create MetaWorkflow</DESCRIPTION> |
|
44 |
<PARAMETERS> |
|
45 |
<PARAM name="wfName" managedBy="system" required="true" type="string">Fill hostedBy-Map (ISSNs) [Context]</PARAM> |
|
46 |
</PARAMETERS> |
|
47 |
<ARCS> |
|
48 |
<ARC to="updateMetaWf"/> |
|
49 |
</ARCS> |
|
50 |
</NODE> |
|
51 |
|
|
52 |
|
|
53 |
<NODE name="updateMetaWf" type="UpdateMetaWf" isJoin="true"> |
|
54 |
<DESCRIPTION>Update MetaWorkflow</DESCRIPTION> |
|
55 |
<PARAMETERS> |
|
56 |
<PARAM name="beanName" managedBy="system" required="true" type="string">metaWfHostedByMapJournal</PARAM> |
|
57 |
</PARAMETERS> |
|
58 |
<ARCS> |
|
59 |
<ARC to="updateMetaWfStatus"/> |
|
60 |
</ARCS> |
|
61 |
</NODE> |
|
62 |
|
|
63 |
<NODE name="updateMetaWfStatus" type="UpdateOpenaireMetaWfStatus"> |
|
64 |
<DESCRIPTION>Update MetaWorkflow Status</DESCRIPTION> |
|
65 |
<PARAMETERS/> |
|
66 |
<ARCS> |
|
67 |
<ARC to="success"/> |
|
68 |
</ARCS> |
|
69 |
</NODE> |
|
70 |
</CONFIGURATION> |
|
71 |
|
|
72 |
<STATUS/> |
|
73 |
</BODY> |
|
74 |
</RESOURCE_PROFILE> |
modules/dnet-openaireplus-workflows/branches/solr6/src/main/resources/eu/dnetlib/test/profiles/openaireplus/workflows/repo-hi/Aggregate_Metadata_from_DataRepository_Inference.xml | ||
---|---|---|
1 |
<?xml version="1.0" encoding="UTF-8"?> |
|
2 |
<RESOURCE_PROFILE> |
|
3 |
<HEADER> |
|
4 |
<RESOURCE_IDENTIFIER value="0cfc367d-dd4e-4c8f-bc95-c37499638985_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/> |
|
5 |
<RESOURCE_TYPE value="WorkflowDSResourceType"/> |
|
6 |
<RESOURCE_KIND value="WorkflowDSResources"/> |
|
7 |
<RESOURCE_URI value="value3"/> |
|
8 |
<DATE_OF_CREATION value="2006-05-04T18:13:51.0Z"/> |
|
9 |
</HEADER> |
|
10 |
<BODY> |
|
11 |
<WORKFLOW_NAME>Aggregate Metadata (datasets) from DataRepository [Inference]</WORKFLOW_NAME> |
|
12 |
<WORKFLOW_INFO> |
|
13 |
<FIELD name="Action">Aggregate Metadata</FIELD> |
|
14 |
<FIELD name="Consequence IS">Inference</FIELD> |
|
15 |
<FIELD name="Datasource class">DataRepository</FIELD> |
|
16 |
<FIELD name="Content">datasets</FIELD> |
|
17 |
</WORKFLOW_INFO> |
|
18 |
<WORKFLOW_TYPE>REPO_HI</WORKFLOW_TYPE> |
|
19 |
<WORKFLOW_PRIORITY>20</WORKFLOW_PRIORITY> |
|
20 |
<CONFIGURATION start="manual"> |
|
21 |
<NODE name="VerifyDatasource" type="VerifyDatasource" isStart="true"> |
|
22 |
<DESCRIPTION>Verify if DS is pending</DESCRIPTION> |
|
23 |
<PARAMETERS> |
|
24 |
<PARAM name="expectedInterfaceTypologyPrefixes" managedBy="system" required="false" type="string">datarepository</PARAM> |
|
25 |
<PARAM name="expectedCompliancePrefixes" managedBy="system" required="false" type="string"></PARAM> |
|
26 |
</PARAMETERS> |
|
27 |
<ARCS> |
|
28 |
<ARC to="createMetaWf"/> |
|
29 |
<ARC to="validateDs" name="validateDs"/> |
|
30 |
</ARCS> |
|
31 |
</NODE> |
|
32 |
|
|
33 |
<NODE name="validateDs" type="ValidateDatasource"> |
|
34 |
<DESCRIPTION>Validate DS</DESCRIPTION> |
|
35 |
<PARAMETERS/> |
|
36 |
<ARCS> |
Also available in: Unified diff
hopefully we won't need to branch this one as well