<?xml version="1.0" encoding="UTF-8"?>
<workflow-app xmlns="uri:oozie:workflow:0.4" name="mainworkflows_primary_main">
2
	
3
	<parameters>
		<!--
			Formal parameters of this workflow. A property declared with a <value> uses that
			value as its default. The properties declared without a <value>
			(import_hbase_input_table, export_action_hbase_table_name,
			export_action_hbase_table_initialize and export_action_set_id_entity_dataset)
			have no default here and must be supplied when the job is submitted.
		-->
		<!-- processing modes -->
		<property>
			<name>active_metadataextraction_export</name>
			<value>false</value>
			<description>flag indicating metadata extraction export should be enabled</description>
		</property>
		<property>
			<name>active_referenceextraction_project</name>
			<value>false</value>
			<description>flag indicating project reference extraction should be enabled</description>
		</property>
		<property>
			<name>active_referenceextraction_dataset</name>
			<value>false</value>
			<description>flag indicating dataset reference extraction should be enabled</description>
		</property>
		<property>
			<!-- currently disabled by default -->
			<name>active_referenceextraction_researchinitiative</name>
			<value>false</value>
			<description>flag indicating researchinitiative reference extraction should be enabled</description>
		</property>
		<property>
			<name>active_documentsclassification</name>
			<value>false</value>
			<description>flag indicating documents classification should be enabled</description>
		</property>
		<property>
			<name>active_documentssimilarity</name>
			<value>false</value>
			<description>flag indicating documents similarity should be enabled</description>
		</property>
		<property>
			<name>active_citationmatching</name>
			<value>false</value>
			<description>flag indicating citation matching should be enabled</description>
		</property>
		<property>
			<name>active_statistics</name>
			<value>false</value>
			<description>flag indicating statistics generation should be enabled</description>
		</property>
		<!-- import metadata related -->
		<property>
			<name>import_hbase_input_table</name>
			<description>HBase input table holding InformationSpace, available on local cluster</description>
		</property>
		<property>
			<name>import_hbase_approved_datasources_csv</name>
			<value>$UNDEFINED$</value>
			<description>CSV list of datasource ids to be approved during import. Applied on result and person entities.</description>
		</property>
		<!-- import datacite related -->
		<property>
			<name>import_mdstore_service_location</name>
			<value>$UNDEFINED$</value>
			<description>MDStore service (not WSDL) location URL</description>
		</property>
		<property>
			<name>import_dataset_mdstore_ids_csv</name>
			<value>$UNDEFINED$</value>
			<description>MDStore identifier</description>
		</property>
		<!-- import content related -->
		<property>
			<name>import_content_object_store_location</name>
			<value>$UNDEFINED$</value>
			<description>object store service location required for content retrieval</description>
		</property>
		<property>
			<name>import_content_objectstores_csv</name>
			<value>$UNDEFINED$</value>
			<description>CSV list of object stores identifiers to be processed</description>
		</property>
		<property>
			<name>import_content_mimetypes_pdf</name>
			<value>pdf,application/pdf</value>
			<description>pdf mime types</description>
		</property>
		<property>
			<name>import_content_mimetypes_text</name>
			<value>text,text/plain</value>
			<description>text mime types</description>
		</property>
		<property>
			<name>import_content_mimetypes_xml_pmc</name>
			<value>xml</value>
			<description>xml pmc types</description>
		</property>
		<property>
			<name>import_content_mimetypes_wos</name>
			<value>file::WoS</value>
			<description>WoS types</description>
		</property>
		<!-- import timeouts related -->
		<property>
			<name>import_resultset_client_read_timeout</name>
			<value>60000</value>
			<description>resultset client read timeout</description>
		</property>
		<property>
			<name>import_content_connection_timeout</name>
			<value>60000</value>
			<description>import content connection timeout</description>
		</property>
		<property>
			<name>import_content_read_timeout</name>
			<value>60000</value>
			<description>import content read timeout</description>
		</property>
		<!-- metadata extraction related -->
		<property>
			<name>metadataextraction_excluded_ids</name>
			<value>$UNDEFINED$</value>
			<description>list of content identifiers excluded from metadataextraction processing</description>
		</property>
		<property>
			<name>metadataextraction_default_cache_location</name>
			<value>/cache/metadataextraction</value>
			<description>metadata extraction HDFS cache location</description>
		</property>
		<property>
			<name>metadataextraction_processing_mode</name>
			<value>StreamingMetadataExtractorMapper</value>
			<description>metadata extraction processing mode</description>
		</property>
		<property>
			<name>metadataextraction_input_classname</name>
			<value>eu.dnetlib.iis.importer.auxiliary.schemas.DocumentContentUrl</value>
			<description>metadata extraction input classname</description>
		</property>
		<!-- export related -->
		<property>
			<name>export_action_hbase_table_name</name>
			<description>action manager hbase table name</description>
		</property>
		<property>
			<name>export_action_hbase_table_initialize</name>
			<description>flag indicating input table should be initialized</description>
		</property>
		<!-- action set id properties -->
		<property>
			<name>export_action_set_id</name>
			<value>$UNDEFINED$</value>
			<description>action-set identifier of exported data</description>
		</property>
		<property>
			<name>export_action_set_id_dataset_similarities_websiteusage</name>
			<value>$UNDEFINED$</value>
			<description>dataset_similarities_websiteusage action-set identifier of exported data</description>
		</property>
		<property>
			<name>export_action_set_id_person_similarities_websiteusage</name>
			<value>$UNDEFINED$</value>
			<description>person_similarities_websiteusage action-set identifier of exported data</description>
		</property>
		<property>
			<name>export_action_set_id_person_statistics</name>
			<value>$UNDEFINED$</value>
			<description>person_statistics action-set identifier of exported data</description>
		</property>
		<property>
			<name>export_action_set_id_project_statistics</name>
			<value>$UNDEFINED$</value>
			<description>project_statistics action-set identifier of exported data</description>
		</property>
		<property>
			<name>export_action_set_id_document_similarities_standard</name>
			<value>$UNDEFINED$</value>
			<description>document_similarities_standard action-set identifier of exported data</description>
		</property>
		<property>
			<name>export_action_set_id_document_similarities_websiteusage</name>
			<value>$UNDEFINED$</value>
			<description>document_similarities_websiteusage action-set identifier of exported data</description>
		</property>
		<property>
			<name>export_action_set_id_document_extractedMetadata</name>
			<value>$UNDEFINED$</value>
			<description>document_extractedMetadata action-set identifier of exported data</description>
		</property>
		<property>
			<name>export_action_set_id_document_statistics</name>
			<value>$UNDEFINED$</value>
			<description>document_statistics action-set identifier of exported data</description>
		</property>
		<property>
			<name>export_action_set_id_document_classes</name>
			<value>$UNDEFINED$</value>
			<description>document_classes action-set identifier of exported data</description>
		</property>
		<property>
			<name>export_action_set_id_document_referencedProjects</name>
			<value>$UNDEFINED$</value>
			<description>document_referencedProjects action-set identifier of exported data</description>
		</property>
		<property>
			<name>export_action_set_id_document_referencedDatasets</name>
			<value>$UNDEFINED$</value>
			<description>document_referencedDatasets action-set identifier of exported data</description>
		</property>
		<property>
			<name>export_action_set_id_document_referencedDocuments</name>
			<value>$UNDEFINED$</value>
			<description>document_referencedDocuments action-set identifier of exported data</description>
		</property>
		<property>
			<name>export_action_set_id_document_research_initiative</name>
			<value>$UNDEFINED$</value>
			<description>document research initiative action-set identifier of exported data</description>
		</property>
		<!-- dataset entity action set, remote HBase target and similarity threshold -->
		<property>
			<name>export_action_set_id_entity_dataset</name>
			<description>action-set identifier of exported data containing dataset entities</description>
		</property>
		<property>
			<name>export_action_hbase_remote_zookeeper_quorum</name>
			<value>$UNDEFINED$</value>
			<description>external hbase zookeeper quorum, set to empty value by default which means data will be exported to local hbase instance</description>
		</property>
		<property>
			<name>export_action_hbase_remote_zookeeper_clientport</name>
			<value>$UNDEFINED$</value>
			<description>external hbase zookeeper client port, required only when zookeeper quorum property is set</description>
		</property>
		<property>
			<name>export_documentssimilarity_threshold</name>
			<value>$UNDEFINED$</value>
			<description>documents similarity threshold value below which similarity export is omitted</description>
		</property>
	</parameters>
236
	
237
	<global>
		<!-- settings shared by the actions of this workflow: cluster endpoints and the job queue -->
		<job-tracker>${jobTracker}</job-tracker>
		<name-node>${nameNode}</name-node>
		<configuration>
			<property>
				<name>mapred.job.queue.name</name>
				<value>${queueName}</value>
			</property>
		</configuration>
	</global>
247
	
248
	<!-- entry point: execution begins with the "import" action -->
	<start to="import" />
249

    
250
	<!--
		Runs the common_import sub-workflow. The output locations and subdirectory names
		configured here are referenced again by later actions of this workflow through
		matching ${workingDir}/common_import/... paths, so both sides have to stay in sync.
	-->
	<action name="import">
		<sub-workflow>
			<app-path>${wf:appPath()}/common_import</app-path>
			<propagate-configuration/>
			<configuration>
				<property>
					<name>workingDir</name>
					<value>${workingDir}/common_import/working_dir</value>
				</property>
				<!-- importing modes -->
				<property>
					<name>active_import_metadata</name>
					<value>true</value>
				</property>
				<property>
					<name>active_import_dataset</name>
					<value>${active_referenceextraction_dataset}</value>
				</property>
				<property>
					<name>active_ingest_pmc_citations</name>
					<value>${active_citationmatching}</value>
				</property>
				<!-- import metadata related -->
				<property>
					<name>hbase_input_table</name>
					<value>${import_hbase_input_table}</value>
				</property>
				<property>
					<name>hbase_approved_datasources_csv</name>
					<value>${import_hbase_approved_datasources_csv}</value>
				</property>
				<!-- import datacite related -->
				<property>
					<name>mdstore_service_location</name>
					<value>${import_mdstore_service_location}</value>
				</property>
				<property>
					<name>dataset_mdstore_ids_csv</name>
					<value>${import_dataset_mdstore_ids_csv}</value>
				</property>
				<!-- import content related -->
				<property>
					<name>objectstore_service_location</name>
					<value>${import_content_object_store_location}</value>
				</property>
				<property>
					<name>approved_objectstores_csv</name>
					<value>${import_content_objectstores_csv}</value>
				</property>
				<property>
					<name>mimetypes_pdf</name>
					<value>${import_content_mimetypes_pdf}</value>
				</property>
				<property>
					<name>mimetypes_text</name>
					<value>${import_content_mimetypes_text}</value>
				</property>
				<property>
					<name>mimetypes_xml_pmc</name>
					<value>${import_content_mimetypes_xml_pmc}</value>
				</property>
				<property>
					<name>mimetypes_wos</name>
					<value>${import_content_mimetypes_wos}</value>
				</property>
				<!-- import timeouts related -->
				<property>
					<name>resultset_client_read_timeout</name>
					<value>${import_resultset_client_read_timeout}</value>
				</property>
				<property>
					<name>content_connection_timeout</name>
					<value>${import_content_connection_timeout}</value>
				</property>
				<property>
					<name>content_read_timeout</name>
					<value>${import_content_read_timeout}</value>
				</property>
				<!-- metadata extraction related -->
				<property>
					<name>metadataextraction_excluded_ids</name>
					<value>${metadataextraction_excluded_ids}</value>
				</property>
				<property>
					<name>metadataextraction_default_cache_location</name>
					<value>${metadataextraction_default_cache_location}</value>
				</property>
				<!-- metadataimport and metadataextraction output subdirectory names -->
				<property>
					<name>metadataextraction_output_name_meta</name>
					<value>meta</value>
				</property>
				<property>
					<name>metadataimport_output_name_document_meta</name>
					<value>docmeta</value>
				</property>
				<property>
					<name>metadataimport_output_name_document_project</name>
					<value>docproject</value>
				</property>
				<property>
					<name>metadataimport_output_name_document_relation</name>
					<value>docrelation</value>
				</property>
				<property>
					<name>metadataimport_output_name_project</name>
					<value>project</value>
				</property>
				<property>
					<name>metadataimport_output_name_person</name>
					<value>person</value>
				</property>
				<property>
					<name>metadataimport_output_name_dataset_id</name>
					<value>datasetid</value>
				</property>
				<property>
					<name>metadataimport_output_name_dedup_mapping</name>
					<value>dedupmapping</value>
				</property>
				<!-- output parameters -->
				<property>
					<name>output_metadataextraction_root</name>
					<value>${workingDir}/common_import/metadataextraction</value>
				</property>
				<property>
					<name>output_metadataimport_root</name>
					<value>${workingDir}/common_import/metadataimport</value>
				</property>
				<!-- output_citation_pmc is declared once; a second identical declaration was removed -->
				<property>
					<name>output_citation_pmc</name>
					<value>${workingDir}/common_import/citation_pmc</value>
				</property>
				<property>
					<name>output_dataset</name>
					<value>${workingDir}/common_import/dataset</value>
				</property>
				<property>
					<name>output_document_text</name>
					<value>${workingDir}/common_import/document-text</value>
				</property>
				<property>
					<name>output_wos</name>
					<value>${workingDir}/common_import/wos</value>
				</property>
			</configuration>
		</sub-workflow>
		<ok to="mainworkflows_primary_processing"/>
		<error to="fail" />
	</action>
404

    
405
	<!--
		Runs the primary_processing sub-workflow on the data written by the "import" action.
		The input_* paths point at locations under ${workingDir}/common_import. Results are
		written under ${workingDir}/exported, except document_to_project and
		document_to_dataset, which go to ${workingDir}/exported_to_be_cleaned and are
		post-processed by the transformer_export_documentto* actions.
	-->
	<action name="mainworkflows_primary_processing">
		<sub-workflow>
			<app-path>${wf:appPath()}/primary_processing</app-path>
			<propagate-configuration/>
			<configuration>
				<!-- inputs produced by the import action -->
				<property>
					<name>input_document_metadata</name>
					<value>${workingDir}/common_import/metadataimport/docmeta</value>
				</property>
				<property>
					<name>input_document_to_project</name>
					<value>${workingDir}/common_import/metadataimport/docproject</value>
				</property>
				<property>
					<name>input_document_text</name>
					<value>${workingDir}/common_import/document-text</value>
				</property>
				<property>
					<name>input_document_text_wos</name>
					<value>${workingDir}/common_import/wos</value>
				</property>
				<property>
					<name>input_project</name>
					<value>${workingDir}/common_import/metadataimport/project</value>
				</property>
				<property>
					<name>input_person</name>
					<value>${workingDir}/common_import/metadataimport/person</value>
				</property>
				<property>
					<name>input_dataset</name>
					<value>${workingDir}/common_import/dataset</value>
				</property>
				<property>
					<name>input_extracted_document_metadata</name>
					<value>${workingDir}/common_import/metadataextraction/meta</value>
				</property>
				<property>
					<name>input_citation_pmc</name>
					<value>${workingDir}/common_import/citation_pmc</value>
				</property>
				<!-- outputs that are filtered by a transformer before export -->
				<property>
					<name>output_document_to_project</name>
					<value>${workingDir}/exported_to_be_cleaned/document_to_project</value>
				</property>
				<property>
					<name>output_document_to_dataset</name>
					<value>${workingDir}/exported_to_be_cleaned/document_to_dataset</value>
				</property>
				<!-- outputs written under ${workingDir}/exported -->
				<property>
					<name>output_document_to_research_initiatives</name>
					<value>${workingDir}/exported/document_to_research_initiatives</value>
				</property>
				<property>
					<name>output_document_to_document_classes</name>
					<value>${workingDir}/exported/document_to_document_classes</value>
				</property>
				<property>
					<name>output_citation</name>
					<value>${workingDir}/exported/citation</value>
				</property>
				<property>
					<name>output_document_similarity</name>
					<value>${workingDir}/exported/document_similarity</value>
				</property>
				<property>
					<name>output_document_statistics</name>
					<value>${workingDir}/exported/document_statistics</value>
				</property>
				<property>
					<name>output_author_statistics</name>
					<value>${workingDir}/exported/author_statistics</value>
				</property>
				<property>
					<name>output_project_statistics</name>
					<value>${workingDir}/exported/project_statistics</value>
				</property>
			</configuration>
		</sub-workflow>
		<!-- 
		<ok to="transformers_export_document_skip_imported_data"/>
		 -->
		<ok to="decision-transform-metadataextraction-for-export"/>
		<error to="fail" />
	</action>
490
    
491
    <!--
        Chooses how the document metadata export input is prepared: the real transformer
        runs only when active_metadataextraction_export equals "true"; in every other case
        the skip action is taken instead.
    -->
    <decision name="decision-transform-metadataextraction-for-export">
        <switch>
            <case to="transformer_export_documentmetadata">${active_metadataextraction_export eq "true"}</case>
            <default to="skip-transformer_export_documentmetadata"/>
        </switch>
    </decision>
497
    
498
    <!--
        Runs the transformer_export_documentmetadata sub-workflow on the extracted metadata
        produced by the import action. This sub-workflow does not use propagate-configuration,
        so jobTracker, nameNode and queueName are handed over explicitly.
    -->
    <action name="transformer_export_documentmetadata">
        <sub-workflow>
            <app-path>${wf:appPath()}/transformer_export_documentmetadata</app-path>
            <configuration>
                <!-- cluster settings passed explicitly -->
                <property>
                    <name>jobTracker</name>
                    <value>${jobTracker}</value>
                </property>
                <property>
                    <name>nameNode</name>
                    <value>${nameNode}</value>
                </property>
                <property>
                    <name>queueName</name>
                    <value>${queueName}</value>
                </property>
                <!-- Working directory of the subworkflow -->
                <property>
                    <name>workingDir</name>
                    <value>${workingDir}/transformer_export_documentmetadata/working_dir</value>
                </property>
                <property>
                    <name>input_extracted_metadata</name>
                    <value>${workingDir}/common_import/metadataextraction/meta</value>
                </property>
                <property>
                    <name>output_metadata</name>
                    <value>${workingDir}/transformer_export_documentmetadata/output_metadata</value>
                </property>
            </configuration>
        </sub-workflow>
        <ok to="forking_skip_imported_data"/>
        <error to="fail"/>
    </action>
532
    
533
    <!--
        Taken instead of transformer_export_documentmetadata when metadata extraction export
        is not active. Runs the Producer node with the empty.json resource and writes to the
        same output_metadata location the transformer would have used, so the export action
        finds its input_document_metadata directory either way.
    -->
    <action name="skip-transformer_export_documentmetadata">
        <java>
            <prepare>
                <!-- notice: the directory has to be aligned with the skipped action's output -->
                <delete path="${nameNode}${workingDir}/transformer_export_documentmetadata" />
                <mkdir path="${nameNode}${workingDir}/transformer_export_documentmetadata/working_dir" />
            </prepare>
            <main-class>eu.dnetlib.iis.core.java.ProcessWrapper</main-class>
            <arg>eu.dnetlib.iis.core.java.jsonworkflownodes.Producer</arg>
            <!-- the text of the next argument, including its line breaks, is passed as written -->
            <arg>-C{document_metadata,
				eu.dnetlib.iis.export.schemas.DocumentMetadata,
				eu/dnetlib/iis/mainworkflows/data/empty.json}</arg>
            <arg>-SworkingDir=${workingDir}/transformer_export_documentmetadata/working_dir</arg>
            <!-- notice: the directory has to be aligned with the skipped action's output -->
            <arg>-Odocument_metadata=${workingDir}/transformer_export_documentmetadata/output_metadata</arg>
        </java>
        <ok to="forking_skip_imported_data"/>
        <error to="fail"/>
    </action>
552
    
553
    <!-- starts both transformer actions in parallel; they meet again at joining_skip_imported_data -->
    <fork name="forking_skip_imported_data">
        <path start="transformer_export_documenttodataset"/>
        <path start="transformer_export_documenttoproject"/>
    </fork>
557
    
558
    <!--
        Runs the transformer_export_documenttodataset_without_imported_data sub-workflow.
        Inputs are the document_to_dataset output of primary processing and the imported
        document relations; the result is what the export action reads as
        input_document_to_dataset.
    -->
    <action name="transformer_export_documenttodataset">
        <sub-workflow>
            <app-path>${wf:appPath()}/transformer_export_documenttodataset_without_imported_data</app-path>
            <propagate-configuration/>
            <configuration>
                <property>
                    <name>workingDir</name>
                    <value>${workingDir}/transformer_export_documenttodataset_without_imported_data/working_dir</value>
                </property>
                <property>
                    <name>input_document_to_dataset</name>
                    <value>${workingDir}/exported_to_be_cleaned/document_to_dataset</value>
                </property>
                <property>
                    <name>input_document_relation</name>
                    <value>${workingDir}/common_import/metadataimport/docrelation</value>
                </property>
                <property>
                    <name>output_document_to_dataset</name>
                    <value>${workingDir}/transformer_export_documenttodataset_without_imported_data/output</value>
                </property>
            </configuration>
        </sub-workflow>
        <ok to="joining_skip_imported_data"/>
        <error to="fail" />
    </action>
584
    
585
    <!--
        Runs the transformer_export_documenttoproject_without_imported_data sub-workflow.
        Inputs are the document_to_project output of primary processing and the imported
        document-to-project relations; the result is what the export action reads as
        input_document_to_project.
    -->
    <action name="transformer_export_documenttoproject">
        <sub-workflow>
            <app-path>${wf:appPath()}/transformer_export_documenttoproject_without_imported_data</app-path>
            <propagate-configuration/>
            <configuration>
                <property>
                    <name>workingDir</name>
                    <value>${workingDir}/transformer_export_documenttoproject_without_imported_data/working_dir</value>
                </property>
                <property>
                    <name>input_document_to_project</name>
                    <value>${workingDir}/exported_to_be_cleaned/document_to_project</value>
                </property>
                <property>
                    <name>input_imported_document_to_project</name>
                    <value>${workingDir}/common_import/metadataimport/docproject</value>
                </property>
                <property>
                    <name>output_document_to_project</name>
                    <value>${workingDir}/transformer_export_documenttoproject_without_imported_data/output</value>
                </property>
            </configuration>
        </sub-workflow>
        <ok to="joining_skip_imported_data"/>
        <error to="fail" />
    </action>
611
    
612
    <!-- join point of the two transformer actions; continues with the "export" action -->
    <join name="joining_skip_imported_data" to="export"/>
613
    
614
    <!--
        Runs the common_export sub-workflow. Input ports point at the outputs of the
        preceding actions of this workflow; the remaining properties map the export_*
        workflow parameters onto the names used in this configuration.
    -->
    <action name="export">
        <sub-workflow>
            <app-path>${wf:appPath()}/common_export</app-path>
            <propagate-configuration/>
            <configuration>
                <property>
                    <name>workingDir</name>
                    <value>${workingDir}/common_export/working_dir</value>
                </property>
                <!-- input ports -->
                <property>
                    <name>input_document_metadata</name>
                    <value>${workingDir}/transformer_export_documentmetadata/output_metadata</value>
                </property>
                <property>
                    <name>input_document_to_project</name>
                    <value>${workingDir}/transformer_export_documenttoproject_without_imported_data/output</value>
                </property>
                <property>
                    <name>input_document_to_dataset</name>
                    <value>${workingDir}/transformer_export_documenttodataset_without_imported_data/output</value>
                </property>
                <property>
                    <name>input_document_to_research_initiatives</name>
                    <value>${workingDir}/exported/document_to_research_initiatives</value>
                </property>
                <property>
                    <name>input_document_to_document_classes</name>
                    <value>${workingDir}/exported/document_to_document_classes</value>
                </property>
                <!-- FIXME provide input_citations port
                    currently citation outcome is not exported 
                    make sure skipping citationmatching is properly handled
                    -->
                <!-- 
                <property>
                    <name>input_citation</name>
                    <value>${workingDir}/exported/citation</value>
                </property>
                 -->
                <property>
                    <name>input_document_similarity</name>
                    <value>${workingDir}/exported/document_similarity</value>
                </property>
                <property>
                    <name>input_document_statistics</name>
                    <value>${workingDir}/exported/document_statistics</value>
                </property>
                <property>
                    <name>input_author_statistics</name>
                    <value>${workingDir}/exported/author_statistics</value>
                </property>
                <property>
                    <name>input_project_statistics</name>
                    <value>${workingDir}/exported/project_statistics</value>
                </property>
                <property>
                    <name>input_aux_dataset_existing_id</name>
                    <value>${workingDir}/common_import/metadataimport/datasetid</value>
                </property>
                <!-- entities exporting modes -->
                <property>
                    <name>active_export_referenceddataset_datasets</name>
                    <value>${active_referenceextraction_dataset}</value>
                </property>
                <property>
                    <name>active_export_referencedproject_entities</name>
                    <value>false</value>
                </property>
                <property>
                    <name>mdstore_service_location</name>
                    <value>${import_mdstore_service_location}</value>
                </property>
                <property>
                    <name>dataset_mdstore_ids_csv</name>
                    <value>${import_dataset_mdstore_ids_csv}</value>
                </property>
                <!-- export related -->
                <property>
                    <name>action_hbase_table_name</name>
                    <value>${export_action_hbase_table_name}</value>
                </property>
                <property>
                    <name>action_hbase_table_initialize</name>
                    <value>${export_action_hbase_table_initialize}</value>
                </property>
                <!-- action set id properties -->
                <property>
                    <name>action_set_id</name>
                    <value>${export_action_set_id}</value>
                </property>
                <property>
                    <name>action_set_id_dataset_similarities_websiteusage</name>
                    <value>${export_action_set_id_dataset_similarities_websiteusage}</value>
                </property>
                <property>
                    <name>action_set_id_person_similarities_websiteusage</name>
                    <value>${export_action_set_id_person_similarities_websiteusage}</value>
                </property>
                <property>
                    <name>action_set_id_person_statistics</name>
                    <value>${export_action_set_id_person_statistics}</value>
                </property>
                <property>
                    <name>action_set_id_project_statistics</name>
                    <value>${export_action_set_id_project_statistics}</value>
                </property>
                <property>
                    <name>action_set_id_document_similarities_standard</name>
                    <value>${export_action_set_id_document_similarities_standard}</value>
                </property>
                <property>
                    <name>action_set_id_document_similarities_websiteusage</name>
                    <value>${export_action_set_id_document_similarities_websiteusage}</value>
                </property>
                <property>
                    <name>action_set_id_document_extractedMetadata</name>
                    <value>${export_action_set_id_document_extractedMetadata}</value>
                </property>
                <property>
                    <name>action_set_id_document_statistics</name>
                    <value>${export_action_set_id_document_statistics}</value>
                </property>
                <property>
                    <name>action_set_id_document_classes</name>
                    <value>${export_action_set_id_document_classes}</value>
                </property>
                <property>
                    <name>action_set_id_document_referencedProjects</name>
                    <value>${export_action_set_id_document_referencedProjects}</value>
                </property>
                <property>
                    <name>action_set_id_document_referencedDatasets</name>
                    <value>${export_action_set_id_document_referencedDatasets}</value>
                </property>
                <property>
                    <name>action_set_id_document_referencedDocuments</name>
                    <value>${export_action_set_id_document_referencedDocuments}</value>
                </property>
                <property>
                    <name>action_set_id_document_research_initiative</name>
                    <value>${export_action_set_id_document_research_initiative}</value>
                </property>
                <property>
                    <name>action_set_id_entity_dataset</name>
                    <value>${export_action_set_id_entity_dataset}</value>
                </property>
                <!-- remote HBase target and similarity threshold -->
                <property>
                    <name>action_hbase_remote_zookeeper_quorum</name>
                    <value>${export_action_hbase_remote_zookeeper_quorum}</value>
                </property>
                <property>
                    <name>action_hbase_remote_zookeeper_clientport</name>
                    <value>${export_action_hbase_remote_zookeeper_clientport}</value>
                </property>
                <property>
                    <name>documentssimilarity_threshold</name>
                    <value>${export_documentssimilarity_threshold}</value>
                </property>
            </configuration>
        </sub-workflow>
        <ok to="end"/>
        <error to="fail" />
    </action>
778
    
779
	<!-- error target of every action: ends the workflow and reports the message of the last failed node -->
	<kill name="fail">
		<message>Unfortunately, the process failed -- error message:
			[${wf:errorMessage(wf:lastErrorNode())}]</message>
	</kill>
783
	<!-- successful completion, reached from the "export" action -->
	<end name="end" />
784
</workflow-app>