Project

General

Profile

1
<?xml version="1.0" encoding="UTF-8"?>
2
<RESOURCE_PROFILE>
3
	<!-- Profile header: identifier, type, kind, URI and creation date of this resource.
	The part of the identifier after "_" is the base64 encoding of
	"WorkflowDSResources/WorkflowDSResourceType", i.e. RESOURCE_KIND/RESOURCE_TYPE below. -->
	<HEADER>
		<RESOURCE_IDENTIFIER
				value="e03f256e-1e4d-4b3d-9c07-91faf5d25210_V29ya2Zsb3dEU1Jlc291cmNlcy9Xb3JrZmxvd0RTUmVzb3VyY2VUeXBl"/>
		<RESOURCE_TYPE value="WorkflowDSResourceType"/>
		<RESOURCE_KIND value="WorkflowDSResources"/>
		<RESOURCE_URI value=""/>
		<DATE_OF_CREATION value="2006-05-04T18:13:51.0Z"/>
	</HEADER>
11
	<BODY>
12
		<!-- Workflow metadata: name, type and priority of this workflow. -->
		<WORKFLOW_NAME>Import ScholExplorer Links and entities</WORKFLOW_NAME>
		<WORKFLOW_TYPE>Import InfoSpace</WORKFLOW_TYPE>
		<WORKFLOW_PRIORITY>30</WORKFLOW_PRIORITY>
15
		<CONFIGURATION start="manual">
16
            <!-- Start node of the workflow (isStart="true").
                 hdfsPath is the user-managed HDFS location; hdfsPathParam is "inputPath",
                 the same name the importActionSet node binds to mapred.input.dir.
                 NOTE(review): presumably SetHdfsFile publishes hdfsPath under that
                 parameter name for later nodes; confirm against the node implementation. -->
            <NODE name="setInputPath" isStart="true" type="SetHdfsFile">
                <DESCRIPTION>set the hdfs input path</DESCRIPTION>
                <PARAMETERS>
                    <PARAM managedBy="user" name="hdfsPath" required="true" type="string">/usr/dnet/dli/export/scolixDumpExport</PARAM>
                    <PARAM managedBy="system" name="hdfsPathParam" required="true" type="string">inputPath</PARAM>
                </PARAMETERS>
                <ARCS>
                    <ARC to="prepareActionSets"/>
                </ARCS>
            </NODE>
26
			<!-- Declares the action sets handled by this workflow through the "sets" parameter.
			The PARAM text is a JSON-like list (single-quoted keys and values) and is data:
			nothing but the list itself may appear between the PARAM tags. -->
			<NODE name="prepareActionSets" type="PrepareActionSets">
				<DESCRIPTION>prepare action sets</DESCRIPTION>
				<PARAMETERS>
					<PARAM required="true" type="string" name="sets" managedBy="system">
						[
						{
						'set' : 'scholexplorer-dump',
						'jobProperty' : 'export_action_set_scholexplorer_dump',
						'enablingProperty' : 'active_scholexplorer_dump',
						'enabled' : 'true'
						}
						]
					</PARAM>
				</PARAMETERS>
				<ARCS>
					<ARC to="extractOutputPath"/>
				</ARCS>
			</NODE>
44

    
45
            <!-- Names the parameter ("outputPath") that receives the HDFS output path;
                 importActionSet binds the same name to mapred.output.dir.
                 NOTE(review): the description says the path is generated by the previous
                 node (prepareActionSets); confirm how ExtractOutputPath derives it. -->
            <NODE name="extractOutputPath" type="ExtractOutputPath">
                <DESCRIPTION>extract the hdfs output path generated in the previous node</DESCRIPTION>
                <PARAMETERS>
                    <PARAM managedBy="system" name="hdfsOutputPathParam" required="true" type="string">outputPath</PARAM>
                </PARAMETERS>
                <ARCS>
                    <ARC to="importActionSet"/>
                </ARCS>
            </NODE>
55

    
56
			<!-- Submits the Hadoop job "importScholexplorerJob" on cluster "DM".
			envParams is a JSON-like map from job property to workflow parameter name:
			mapred.input.dir takes "inputPath" (named by setInputPath) and
			mapred.output.dir takes "outputPath" (named by extractOutputPath).
			The PARAM text is data: nothing but the map itself may appear between the tags.
			NOTE(review): the description "IIS main" looks copied from another workflow,
			and isJoin="true" is set although only one arc in this profile targets this
			node; both are left unchanged here, confirm whether they are intended. -->
			<NODE name="importActionSet" type="SubmitHadoopJob" isJoin="true">
				<DESCRIPTION>IIS main</DESCRIPTION>
				<PARAMETERS>
					<PARAM required="true" type="string" name="hadoopJob" managedBy="system">importScholexplorerJob</PARAM>
					<PARAM required="true" type="string" name="cluster" managedBy="system">DM</PARAM>
					<PARAM required="true" type="string" name="envParams" managedBy="system">
						{
						'cluster' : 'cluster',
						'mapred.input.dir':'inputPath',
						'mapred.output.dir':'outputPath'
						}
					</PARAM>
					<PARAM required="true" type="boolean" name="simulation" managedBy="user">false</PARAM>
				</PARAMETERS>
				<ARCS>
					<ARC to="updateActionSets"/>
				</ARCS>
			</NODE>
74
			<!-- Last node of the chain: takes no parameters and its only arc goes to "success". -->
			<NODE name="updateActionSets" type="UpdateActionSets">
				<DESCRIPTION>update action sets</DESCRIPTION>
				<PARAMETERS/>
				<ARCS>
					<ARC to="success"/>
				</ARCS>
			</NODE>
81
		</CONFIGURATION>
82
		<STATUS/>
83
	</BODY>
84
</RESOURCE_PROFILE>
(8-8/12)