1 |
26600
|
sandro.lab
|
<RESOURCE_PROFILE>
|
2 |
39556
|
claudio.at
|
<HEADER>
|
3 |
|
|
<RESOURCE_IDENTIFIER
|
4 |
|
|
value="732656e3-5ac6-4344-9d1f-f5c805f53a06_SGFkb29wSm9iQ29uZmlndXJhdGlvbkRTUmVzb3VyY2VzL0hhZG9vcEpvYkNvbmZpZ3VyYXRpb25EU1Jlc291cmNlVHlwZQ=="/>
|
5 |
|
|
<RESOURCE_TYPE value="HadoopJobConfigurationDSResourceType"/>
|
6 |
|
|
<RESOURCE_KIND value="HadoopJobConfigurationDSResources"/>
|
7 |
|
|
<RESOURCE_URI value=""/>
|
8 |
|
|
<DATE_OF_CREATION value="2001-12-31T12:00:00"/>
|
9 |
|
|
</HEADER>
|
10 |
|
|
<BODY>
|
11 |
|
|
<HADOOP_JOB name="iisPreprocessingJob" type="oozie">
|
12 |
|
|
<DESCRIPTION>IIS preprocessing</DESCRIPTION>
|
13 |
|
|
<STATIC_CONFIGURATION>
|
14 |
26600
|
sandro.lab
|
<!-- Cluster wide -->
|
15 |
39556
|
claudio.at
|
<PROPERTY key="queueName" value="default"/>
|
16 |
|
|
<PROPERTY key="user.name" value="dnet.beta"/>
|
17 |
26600
|
sandro.lab
|
|
18 |
|
|
<!-- Runtime -->
|
19 |
39556
|
claudio.at
|
<PROPERTY key="workingDir" value="/tmp/integration/working_dir/preprocessing"/>
|
20 |
|
|
<PROPERTY key="oozie.wf.application.path" value="/tmp/integration/apps/preprocessing"/>
|
21 |
|
|
<PROPERTY key="oozie.wf.validate.ForkJoin" value="false"/>
|
22 |
27525
|
claudio.at
|
<PROPERTY key="export_action_hbase_table_initialize" value="false"/>
|
23 |
40246
|
claudio.at
|
<!-- <PROPERTY key="metadataextraction_default_cache_location" value="/cache/metadataextraction"/> -->
|
24 |
|
|
<PROPERTY key="metadataextraction_default_cache_location" value="/cache/metadataextraction_updated_model"/>
|
25 |
39556
|
claudio.at
|
<PROPERTY key="metadataextraction_excluded_checksums"
|
26 |
|
|
value="1e5b574109da731f4918c7f91fc24864,bea4728578070c3d66774bf9454d41fe,da458477233b5561ae47042aa2a73086"/>
|
27 |
40510
|
alessia.ba
|
<PROPERTY key="export_trust_level_threshold_document_referencedDatasets" value="0.0"/>
|
28 |
|
|
<PROPERTY key="export_trust_level_threshold_document_referencedProjects" value="0.0"/>
|
29 |
43379
|
claudio.at
|
<PROPERTY key="output_remote_location" value="hdfs://namenode.hadoop.dm.openaire.eu/var/lib/dnet/actionManager_BETA"/>
|
30 |
39556
|
claudio.at
|
</STATIC_CONFIGURATION>
|
31 |
|
|
<JOB_INTERFACE>
|
32 |
|
|
<PARAM name="import_content_object_store_location" required="true" description="object store service location"/>
|
33 |
|
|
<PARAM name="import_mdstore_service_location" required="true" description="mdstore service location"/>
|
34 |
|
|
<PARAM name="import_dataset_mdstore_ids_csv" required="true" description="comma-separated mdstore ids for dataset records"/>
|
35 |
|
|
<PARAM name="import_wos_mdstore_id" required="true" description="mdstore id for WoS records"/>
|
36 |
|
|
<PARAM name="import_database_service_location" required="true" description="database service endpoint"/>
|
37 |
|
|
<PARAM name="import_content_datacite_objectstores_csv" required="true" description="objectstore ids subject to dataset reference extraction"/>
|
38 |
|
|
<PARAM name="import_content_wos_plaintext_objectstores_csv" required="true" description="objectstore ids for WoS plaintext"/>
|
39 |
|
|
<PARAM name="export_action_hbase_table_name" required="true" description="destination action manager table"/>
|
40 |
|
|
<PARAM name="export_action_hbase_remote_zookeeper_quorum" required="true" description="ZK quorum"/>
|
41 |
|
|
<PARAM name="export_action_hbase_remote_zookeeper_clientport" required="true" description="ZK port"/>
|
42 |
|
|
<PARAM name="nameNode" required="true" description="hdfs name node"/>
|
43 |
|
|
<PARAM name="jobTracker" required="true" description="job tracker name"/>
|
44 |
|
|
<PARAM name="oozie.wf.application.path" required="true" description="oozie job application absolute path"/>
|
45 |
|
|
<PARAM name="export_action_set_id_document_referencedProjects" required="true" description="target action set for project references"/>
|
46 |
|
|
<PARAM name="export_action_set_id_document_referencedDatasets" required="true" description="target action set for dataset references"/>
|
47 |
|
|
<PARAM name="export_action_set_id_entity_wos" required="true" description="target action set for WoS entities"/>
|
48 |
|
|
<PARAM name="export_action_set_id_entity_dataset" required="true" description="target action set for dataset entities"/>
|
49 |
|
|
</JOB_INTERFACE>
|
50 |
|
|
</HADOOP_JOB>
|
51 |
|
|
<STATUS>
|
52 |
|
|
<LAST_SUBMISSION_DATE value="2001-12-31T12:00:00"/>
|
53 |
|
|
<RUNNING_INSTANCES value="0"/>
|
54 |
|
|
<CUMULATIVE_RUN value="0"/>
|
55 |
|
|
</STATUS>
|
56 |
|
|
<SECURITY_PARAMETERS>SECURITY_PARAMETERS</SECURITY_PARAMETERS>
|
57 |
|
|
</BODY>
|
58 |
26600
|
sandro.lab
|
</RESOURCE_PROFILE>
|