Project

General

Profile

1
<?xml version="1.0" encoding="UTF-8"?>
2
<RESOURCE_PROFILE xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
3
	<!--
		Profile header: identity and classification of this resource.
		The part of RESOURCE_IDENTIFIER after the underscore is the Base64 form of
		"WorkflowDSResources/WorkflowDSResourceType", i.e. RESOURCE_KIND "/" RESOURCE_TYPE,
		so the three values must be kept in agreement when any of them is edited.
		RESOURCE_URI is intentionally left as an empty string in this profile.
	-->
	<HEADER>
		<RESOURCE_IDENTIFIER
			value="c7d7d775-2db3-474d-85ab-5173a582d515_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl" />
		<RESOURCE_TYPE value="WorkflowDSResourceType" />
		<RESOURCE_KIND value="WorkflowDSResources" />
		<RESOURCE_URI value="" />
		<DATE_OF_CREATION value="2006-05-04T18:13:51.0Z" />
	</HEADER>
11
	<BODY>
12
		<!-- Descriptive metadata of the workflow: display name, category and numeric priority. -->
		<WORKFLOW_NAME>MDStores to HBase</WORKFLOW_NAME>
		<WORKFLOW_TYPE>Data Load</WORKFLOW_TYPE>
		<WORKFLOW_PRIORITY>30</WORKFLOW_PRIORITY>
15
		<CONFIGURATION start="auto">
16
			<!--
				Start node (isStart="true") of type PrepareMDStoreImport.
				Declares the HDFS sequence-file path and the XSLT resource path used by this workflow.
				NOTE(review): "hdfsPathParam" and "xsltParam" appear to hold the names of the keys
				("hdfsPath", "xslt") under which those two values are published for later nodes;
				confirm against the PrepareMDStoreImport implementation.
				Its only outgoing arc leads to "storeHdfsRecords".
			-->
			<NODE name="prepareImport" type="PrepareMDStoreImport" isStart="true">
				<DESCRIPTION>Configure export to HDFS</DESCRIPTION>
				<PARAMETERS>
					<PARAM required="true" type="string" name="hdfsPathParam" managedBy="system">hdfsPath</PARAM>
					<PARAM required="true" type="string" name="hdfsPath" managedBy="system">/tmp/mdstores_oaf-store-cleaned.seq</PARAM>
					<PARAM required="true" type="string" name="xsltParam" managedBy="system">xslt</PARAM>
					<PARAM required="true" type="string" name="xslt" managedBy="system">/eu/dnetlib/data/transform/dmf_2_hbase.xsl</PARAM>
				</PARAMETERS>
				<ARCS>
					<ARC to="storeHdfsRecords" />
				</ARCS>
			</NODE>
28
			<!--
				Second start node (isStart="true") of type MDStoreBatchExporter.
				Selects metadata stores by format / layout / interpretation = OAF / store / cleaned.
				"outputEprParam" is set to "records_epr", the same value that "storeHdfsRecords"
				declares as its "inputEprParam", so the two nodes are linked through that name.
				Its only outgoing arc leads to "storeHdfsRecords".
			-->
			<NODE name="exportRecords" type="MDStoreBatchExporter" isStart="true">
				<DESCRIPTION>Fetch mdstore records</DESCRIPTION>
				<PARAMETERS>
					<PARAM required="true" type="string" name="format" managedBy="system">OAF</PARAM>
					<PARAM required="true" type="string" name="layout" managedBy="system">store</PARAM>
					<PARAM required="true" type="string" name="interpretation" managedBy="system">cleaned</PARAM>
					<PARAM required="true" type="string" name="outputEprParam" managedBy="system">records_epr</PARAM>
				</PARAMETERS>
				<ARCS>
					<ARC to="storeHdfsRecords" />
				</ARCS>
			</NODE>
40
			<!--
				Join node (isJoin="true") of type StoreHdfsRecords.
				It is the target of the arcs from both start nodes, "prepareImport" and "exportRecords".
				"inputEprParam" (records_epr) matches the "outputEprParam" of "exportRecords";
				"hdfsPathParam" (hdfsPath) matches the value declared by "prepareImport".
				"cluster" is set to DM, the same value used by the "mapreduce" node.
				Its only outgoing arc leads to "mapreduce".
			-->
			<NODE name="storeHdfsRecords" type="StoreHdfsRecords" isJoin="true">
				<DESCRIPTION>Store records to HDFS</DESCRIPTION>
				<PARAMETERS>
					<PARAM required="true" type="string" name="inputEprParam" managedBy="system">records_epr</PARAM>
					<PARAM required="true" type="string" name="hdfsPathParam" managedBy="system">hdfsPath</PARAM>
					<PARAM required="true" type="string" name="cluster" managedBy="system">DM</PARAM>
				</PARAMETERS>
				<ARCS>
					<ARC to="mapreduce" />
				</ARCS>
			</NODE>
51
			<!--
				Node of type SubmitHadoopJob that submits the job "mdStoreHdfsImportJob" on cluster DM.
				NOTE(review): the node is flagged isJoin="true" although only one inbound arc
				(from "storeHdfsRecords") is visible in this profile; confirm the flag is intended.
				NOTE(review): the outgoing arc targets "success", for which no NODE is declared in
				this profile; presumably a terminal node provided by the workflow engine.
			-->
			<NODE name="mapreduce" type="SubmitHadoopJob" isJoin="true">
				<DESCRIPTION>Run M/R import Job</DESCRIPTION>
				<PARAMETERS>
					<PARAM required="true" type="string" name="cluster" managedBy="system">DM</PARAM>
					<PARAM required="true" type="string" name="hadoopJob" managedBy="system">mdStoreHdfsImportJob</PARAM>
					<!--
						The text of the next two PARAMs is a map literal read as a whole, so nothing
						but the map itself may appear between the tags.
						envParams: job property on the left, on the right the names "hdfsPath" and "xslt",
						which are the names declared by "prepareImport" (presumably resolved from the
						workflow environment at run time; confirm against SubmitHadoopJob).
					-->
					<PARAM required="true" type="string" name="envParams" managedBy="system">
						{ 
							'mapred.input.dir' : 'hdfsPath', 
							'hbase.import.xslt' : 'xslt'
						}
					</PARAM>
					<!-- sysParams: presumably maps a job property to the name of a system property; confirm. -->
					<PARAM required="true" type="string" name="sysParams" managedBy="system">
						{ 
							'hbase.mapred.outputtable' : 'hbase.mapred.datatable'
						}
					</PARAM>
				</PARAMETERS>
				<ARCS>
					<ARC to="success" />
				</ARCS>
			</NODE>
72
		</CONFIGURATION>
73
		<!-- Empty element: this profile carries no status information. -->
		<STATUS />
74
	</BODY>
75
</RESOURCE_PROFILE>
76

    
77

    
(3-3/5)