Revision 30981
Added by Marek Horst about 10 years ago
modules/icm-iis-mainworkflows/trunk/src/main/resources/eu/dnetlib/iis/mainworkflows/importer/content_url/job.properties | ||
---|---|---|
1 |
objectstore_service_location=http://node6.t.openaire.research-infrastructures.eu:8280/is/services/objectStore
|
|
1 |
objectstore_service_location=http://openaire-services.vls.icm.edu.pl:8280/is/services/objectStore
|
|
2 | 2 |
|
3 | 3 |
#empty |
4 |
approved_objectstores_csv=$UNDEFINED$ |
|
4 |
#approved_objectstores_csv=$UNDEFINED$
|
|
5 | 5 |
#puma |
6 |
#approved_objectstores_csv=794e8173-8be3-4f51-a12e-b43d12ab3b7d_T2JqZWN0U3RvcmVEU1Jlc291cmNlcy9PYmplY3RTdG9yZURTUmVzb3VyY2VUeXBl
|
|
6 |
approved_objectstores_csv=794e8173-8be3-4f51-a12e-b43d12ab3b7d_T2JqZWN0U3RvcmVEU1Jlc291cmNlcy9PYmplY3RTdG9yZURTUmVzb3VyY2VUeXBl |
|
7 | 7 |
#arxiv |
8 | 8 |
#approved_objectstores_csv=258755af-0b48-41ee-9652-939c5bd2fca3_T2JqZWN0U3RvcmVEU1Jlc291cmNlcy9PYmplY3RTdG9yZURTUmVzb3VyY2VUeXBl |
9 | 9 |
#updated Europe PMC |
... | ... | |
13 | 13 |
#all 4 |
14 | 14 |
#approved_objectstores_csv=794e8173-8be3-4f51-a12e-b43d12ab3b7d_T2JqZWN0U3RvcmVEU1Jlc291cmNlcy9PYmplY3RTdG9yZURTUmVzb3VyY2VUeXBl,258755af-0b48-41ee-9652-939c5bd2fca3_T2JqZWN0U3RvcmVEU1Jlc291cmNlcy9PYmplY3RTdG9yZURTUmVzb3VyY2VUeXBl,b2b6fca5-ce18-498c-a375-b02df97998f0_T2JqZWN0U3RvcmVEU1Jlc291cmNlcy9PYmplY3RTdG9yZURTUmVzb3VyY2VUeXBl,a1a35f9d-dc12-44e0-8781-d8273f5ef017_T2JqZWN0U3RvcmVEU1Jlc291cmNlcy9PYmplY3RTdG9yZURTUmVzb3VyY2VUeXBl |
15 | 15 |
|
16 |
|
|
17 | 16 |
#approved_datasources_csv=$UNDEFINED$ |
18 | 17 |
#lookup_service_location=$UNDEFINED$ |
19 | 18 |
|
modules/icm-iis-mainworkflows/trunk/src/main/resources/eu/dnetlib/iis/mainworkflows/metadataextraction/cached_by_checksum/job.properties | ||
---|---|---|
1 | 1 |
#iis cluster |
2 |
input=/share/import/doc_content_url/puma/2014-06-19
|
|
3 |
default_cache_location=/cache/metadataextraction_test
|
|
2 |
input=/share/import/doc_content_url/puma/2014-09-26
|
|
3 |
default_cache_location=/cache/metadataextraction_2014-09-26
|
|
4 | 4 |
|
5 | 5 |
excluded_ids=$UNDEFINED$ |
6 | 6 |
|
modules/icm-iis-mainworkflows/trunk/src/main/resources/eu/dnetlib/iis/mainworkflows/preprocessing/main/job.properties | ||
---|---|---|
40 | 40 |
metadataextraction_default_cache_location=/cache/metadataextraction |
41 | 41 |
|
42 | 42 |
#export |
43 |
export_action_hbase_table_name=db_actions_preprocessing |
|
43 |
export_action_hbase_table_name=db_actions_preprocessing_test
|
|
44 | 44 |
export_action_hbase_table_initialize=true |
45 | 45 |
#export actionset id related |
46 | 46 |
#export_action_set_id=preprocessing |
modules/icm-iis-mainworkflows/trunk/src/main/resources/eu/dnetlib/iis/mainworkflows/primary/main/job.properties | ||
---|---|---|
37 | 37 |
|
38 | 38 |
#processing modes |
39 | 39 |
active_metadataextraction_export=false |
40 |
active_referenceextraction_project=true
|
|
41 |
active_referenceextraction_dataset=true
|
|
42 |
active_referenceextraction_researchinitiative=true
|
|
43 |
active_documentsclassification=true
|
|
44 |
active_documentssimilarity=true
|
|
40 |
active_referenceextraction_project=false
|
|
41 |
active_referenceextraction_dataset=false
|
|
42 |
active_referenceextraction_researchinitiative=false
|
|
43 |
active_documentsclassification=false
|
|
44 |
active_documentssimilarity=false
|
|
45 | 45 |
active_citationmatching=true |
46 | 46 |
active_statistics=false |
47 | 47 |
|
48 | 48 |
#export |
49 | 49 |
export_action_hbase_table_name=mainworkflows_primary_test |
50 | 50 |
export_action_hbase_table_initialize=true |
51 |
export_action_set_id=iis-default |
|
51 |
#export_action_set_id=iis-default
|
|
52 | 52 |
export_action_set_id_entity_dataset=iis-dataset-entities |
53 | 53 |
#exporting to external CNR cluster |
54 | 54 |
#export_action_hbase_remote_zookeeper_quorum=jobtracker.t.hadoop.research-infrastructures.eu:2182,quorum1.t.hadoop.research-infrastructures.eu:2182,quorum2.t.hadoop.research-infrastructures.eu:2182,quorum3.t.hadoop.research-infrastructures.eu:2182,quorum4.t.hadoop.research-infrastructures.eu:2182 |
modules/icm-iis-mainworkflows/trunk/src/main/resources/eu/dnetlib/iis/mainworkflows/common/import/job.properties | ||
---|---|---|
1 |
active_import_metadata=false
|
|
1 |
active_import_metadata=true
|
|
2 | 2 |
active_import_dataset=false |
3 | 3 |
|
4 |
hbase_input_table=information_space-2014-06-10
|
|
5 |
database_service_location=http://node6.t.openaire.research-infrastructures.eu:8280/is/services/database
|
|
4 |
hbase_input_table=information_space-2014-06-27
|
|
5 |
database_service_location=http://openaire-services.vls.icm.edu.pl:8280/is/services/database
|
|
6 | 6 |
|
7 |
objectstore_service_location=http://node6.t.openaire.research-infrastructures.eu:8280/is/services/objectStore
|
|
7 |
objectstore_service_location=http://openaire-services.vls.icm.edu.pl:8280/is/services/objectStore
|
|
8 | 8 |
#approved_objectstores_csv=$UNDEFINED$ |
9 | 9 |
#puma |
10 | 10 |
approved_objectstores_csv=794e8173-8be3-4f51-a12e-b43d12ab3b7d_T2JqZWN0U3RvcmVEU1Jlc291cmNlcy9PYmplY3RTdG9yZURTUmVzb3VyY2VUeXBl |
11 |
#arxiv content |
|
12 |
#approved_objectstores_csv=258755af-0b48-41ee-9652-939c5bd2fca3_T2JqZWN0U3RvcmVEU1Jlc291cmNlcy9PYmplY3RTdG9yZURTUmVzb3VyY2VUeXBl |
|
13 |
#pmc content |
|
14 |
#approved_objectstores_csv=b2b6fca5-ce18-498c-a375-b02df97998f0_T2JqZWN0U3RvcmVEU1Jlc291cmNlcy9PYmplY3RTdG9yZURTUmVzb3VyY2VUeXBl |
|
11 | 15 |
#wos |
12 | 16 |
#to be tested: whether WoS plaintexts are extracted correctly both in existence-checking mode and without that mode |
13 | 17 |
#approved_objectstores_csv=a1a35f9d-dc12-44e0-8781-d8273f5ef017_T2JqZWN0U3RvcmVEU1Jlc291cmNlcy9PYmplY3RTdG9yZURTUmVzb3VyY2VUeXBl |
14 | 18 |
|
15 |
metadataextraction_default_cache_location=/share/cache/metadataextraction/puma/2014-06-23
|
|
19 |
metadataextraction_default_cache_location=/cache/metadataextraction_2014-09-26
|
|
16 | 20 |
|
17 | 21 |
mimetypes_pdf=pdf,application/pdf |
18 | 22 |
mimetypes_text=text |
Also available in: Unified diff
updating job properties