Project

General

Profile

1
<RESOURCE_PROFILE>
	<!--
		Workflow template profile (RESOURCE_TYPE WorkflowTemplateDSResourceType).
		It declares six input parameters and a linear chain of workflow nodes that
		starts at setDedupConfigs and ends with an arc to "success", with a single
		branch at findIndex (found / notFound).
	-->
	<HEADER>
		<!-- NOTE(review): the part after the underscore appears to be the Base64 form of
		     "WorkflowTemplateDSResources/WorkflowTemplateDSResourceType" (kind/type); confirm
		     before editing the identifier by hand. -->
		<RESOURCE_IDENTIFIER value="a1b0b30c-7e19-46e2-888c-67c0b880b346_V29ya2Zsb3dUZW1wbGF0ZURTUmVzb3VyY2VzL1dvcmtmbG93VGVtcGxhdGVEU1Jlc291cmNlVHlwZQ=="/>
		<RESOURCE_TYPE value="WorkflowTemplateDSResourceType"/>
		<RESOURCE_KIND value="WorkflowTemplateDSResources"/>
		<RESOURCE_URI value=""/>
		<DATE_OF_CREATION value="2016-06-25T10:24:32+00:00"/>
	</HEADER>
	<BODY>
		<CONFIGURATION>

			<!-- Template inputs. Nodes below pick them up through ref="name" attributes.
			     All six are required; the last three carry defaults. -->
			<PARAMETERS>
				<PARAM name="hbaseTable" description="HBase table name" required="true" type="string"/>
				<PARAM name="cluster" description="Hadoop cluster name" required="true" type="string"/>

				<PARAM name="dedupConfigSequence" description="dedup configuration orchestration name" required="true" type="string"/>

				<!-- Coordinates of the dedup index: mdFormat / layout / interpretation. -->
				<PARAM name="mdFormat" description="dedup index mdFormat" required="true" type="string" default="OPENAIRE"/>
				<PARAM name="layout" description="dedup index layout" required="true" type="string" default="index"/>
				<PARAM name="interpretation" description="dedup index interpretation" required="true" type="string" default="dedup"/>
			</PARAMETERS>

			<!--
				Node chain:
				setDedupConfigs, findIndex, (createIndex when notFound), prepareIndex,
				cleanupRotten, updateIndex, finalize, updateDs, success.
				Attribute usage seen in this file: ref= names a template parameter declared
				above, value= is a literal, env= names a workflow environment entry
				(presumably populated by an earlier node; verify against the node types).
			-->
			<WORKFLOW>

				<!-- Start node (isStart="true"). The three *Param values are literal names;
				     entityType and entityTypeId are read back via env= in updateIndex. -->
				<NODE isStart="true" name="setDedupConfigs" type="SetDedupConfiguration">
					<DESCRIPTION>Set Dedup conf</DESCRIPTION>
					<PARAMETERS>
						<PARAM name="dedupConfigSequence" ref="dedupConfigSequence"/>
						<PARAM name="dedupConfigSequenceParam" value="dedup.conf.queue"/>
						<PARAM name="entityTypeNameParam" value="entityType"/>
						<PARAM name="entityTypeIdParam" value="entityTypeId"/>
					</PARAMETERS>
					<ARCS>
						<ARC to="findIndex"/>
					</ARCS>
				</NODE>

				<!-- Branching node: arc "found" skips index creation, arc "notFound" goes
				     through createIndex first. Both paths end up in prepareIndex. -->
				<NODE name="findIndex" type="FindIndex">
					<DESCRIPTION/>
					<PARAMETERS>
						<PARAM name="mdFormat" ref="mdFormat"/>
						<PARAM name="layout" ref="layout"/>
						<PARAM name="interpretation" ref="interpretation"/>
					</PARAMETERS>
					<ARCS>
						<ARC name="found" to="prepareIndex"/>
						<ARC name="notFound" to="createIndex"/>
					</ARCS>
				</NODE>

				<!-- Reached only through findIndex/notFound.
				     NOTE(review): the first parameter is named "format" here while findIndex and
				     prepareIndex call it "mdFormat"; left untouched because the name expected by
				     the CreateIndex node type is not visible in this file. Confirm it is intended. -->
				<NODE name="createIndex" type="CreateIndex">
					<DESCRIPTION/>
					<PARAMETERS>
						<PARAM name="format" ref="mdFormat"/>
						<PARAM name="layout" ref="layout"/>
						<PARAM name="interpretation" ref="interpretation"/>
					</PARAMETERS>
					<ARCS>
						<ARC to="prepareIndex"/>
					</ARCS>
				</NODE>

				<!-- rottenRecordsPathParam carries the literal name "rottenRecordsPath"; the two
				     following nodes read an env entry with exactly that name. -->
				<NODE name="prepareIndex" type="PrepareDedupIndexJob">
					<DESCRIPTION>Prepare indexing</DESCRIPTION>
					<PARAMETERS>
						<PARAM name="mdFormat" ref="mdFormat"/>
						<PARAM name="layout" ref="layout"/>
						<PARAM name="interpretation" ref="interpretation"/>
						<PARAM name="rottenRecordsPathParam" value="rottenRecordsPath"/>
						<PARAM name="hbaseTable" ref="hbaseTable"/>
					</PARAMETERS>
					<ARCS>
						<ARC to="cleanupRotten"/>
					</ARCS>
				</NODE>

				<!-- Runs before updateIndex, which uses the same env path as mapred.output.dir. -->
				<NODE name="cleanupRotten" type="DeleteHdfsPathJob">
					<DESCRIPTION>hdfs cleanup (rotten)</DESCRIPTION>
					<PARAMETERS>
						<PARAM name="cluster" ref="cluster"/>
						<PARAM name="path" env="rottenRecordsPath"/>
					</PARAMETERS>
					<ARCS>
						<ARC to="updateIndex"/>
					</ARCS>
				</NODE>

				<!-- Submits the Hadoop job "dedupIndexFeedJob" on the configured cluster.
				     jobParams is a key/value MAP: the HBase input table is supplied under two keys
				     (hbase.mapred.inputtable and hbase.mapreduce.inputtable), the index.* settings
				     and entity type come from env entries, and "actionset" is bound to the
				     dedupConfigSequence parameter. -->
				<NODE name="updateIndex" type="SubmitHadoopJob">
					<DESCRIPTION>M/O index records</DESCRIPTION>
					<PARAMETERS>
						<PARAM name="hadoopJob" value="dedupIndexFeedJob"/>
						<PARAM name="cluster" ref="cluster"/>
						<PARAM name="jobParams">
							<MAP>
								<ENTRY key="hbase.mapred.inputtable" ref="hbaseTable"/>
								<ENTRY key="hbase.mapreduce.inputtable" ref="hbaseTable"/>
								<ENTRY key="mapred.output.dir" env="rottenRecordsPath"/>
								<ENTRY key="index.fields" env="index.fields"/>
								<ENTRY key="index.solr.url" env="index.solr.url"/>
								<ENTRY key="index.solr.collection" env="index.solr.collection"/>
								<ENTRY key="index.buffer.flush.threshold" env="index.buffer.flush.threshold"/>
								<ENTRY key="index.shutdown.wait.time" env="index.shutdown.wait.time"/>
								<ENTRY key="index.solr.sim.mode" env="index.solr.sim.mode"/>
								<ENTRY key="index.feed.timestamp" env="index.feed.timestamp"/>
								<ENTRY key="entityTypeId" env="entityTypeId"/>
								<ENTRY key="entityType" env="entityType"/>
								<ENTRY key="actionset" ref="dedupConfigSequence"/>
							</MAP>
						</PARAM>
					</PARAMETERS>
					<ARCS>
						<ARC to="finalize"/>
					</ARCS>
				</NODE>

				<!-- Receives the same "actionset" binding that updateIndex passes to the job. -->
				<NODE name="finalize" type="FinalizeDedupIndexFeeding">
					<DESCRIPTION>commit changes</DESCRIPTION>
					<PARAMETERS>
						<PARAM name="actionset" ref="dedupConfigSequence"/>
					</PARAMETERS>
					<ARCS>
						<ARC to="updateDs"/>
					</ARCS>
				</NODE>

				<!-- Last node of the chain: takes no parameters and arcs to "success", which is
				     not declared as a NODE in this file (presumably a built-in terminal state). -->
				<NODE name="updateDs" type="IndexDsUpdateJob">
					<DESCRIPTION>update DS</DESCRIPTION>
					<PARAMETERS/>
					<ARCS>
						<ARC to="success"/>
					</ARCS>
				</NODE>

			</WORKFLOW>

		</CONFIGURATION>

	</BODY>
</RESOURCE_PROFILE>
(5-5/23)