Revision 31498
Added by Marek Horst about 10 years ago
modules/icm-iis-mainworkflows/trunk/src/main/resources/eu/dnetlib/iis/mainworkflows/common/import/job.properties | ||
---|---|---|
17 | 17 |
#przetestowac czy plaintexty wos sa prawidlowo wyciagane zarowno w trybie sprawdzania istnienia jak i bez tego trybu |
18 | 18 |
#approved_objectstores_csv=a1a35f9d-dc12-44e0-8781-d8273f5ef017_T2JqZWN0U3RvcmVEU1Jlc291cmNlcy9PYmplY3RTdG9yZURTUmVzb3VyY2VUeXBl |
19 | 19 |
|
20 |
metadataextraction_default_cache_location=/cache/metadataextraction_2014-09-26
|
|
20 |
metadataextraction_default_cache_location=/cache/metadataextraction |
|
21 | 21 |
|
22 | 22 |
mimetypes_pdf=pdf,application/pdf |
23 | 23 |
mimetypes_text=text |
modules/icm-iis-mainworkflows/trunk/src/main/resources/eu/dnetlib/iis/mainworkflows/common/import/oozie_app/import.txt | ||
---|---|---|
10 | 10 |
metadataextraction_cached classpath eu/dnetlib/iis/mainworkflows/metadataextraction/cached_by_checksum/oozie_app |
11 | 11 |
transformers_common_union3 classpath eu/dnetlib/iis/transformers/common/union3/oozie_app |
12 | 12 |
transformers_idextractor classpath eu/dnetlib/iis/transformers/importer/documentmetadata/idextractor/oozie_app |
13 |
transformers_externalidtooaid classpath eu/dnetlib/iis/transformers/importer/documentmetadata/externalidtooaid/oozie_app |
|
13 |
transformers_externalidtooaid classpath eu/dnetlib/iis/transformers/importer/documentmetadata/externalidtooaid/oozie_app |
|
14 |
ingest_pmc_idmapping_pmidtooaid classpath eu/dnetlib/iis/ingest/pmc/idmapping/pmidtooaid/oozie_app |
modules/icm-iis-mainworkflows/trunk/src/main/resources/eu/dnetlib/iis/mainworkflows/common/import/oozie_app/workflow.xml | ||
---|---|---|
691 | 691 |
</property> |
692 | 692 |
</configuration> |
693 | 693 |
</sub-workflow> |
694 |
<ok to="generate_pmid_to_oaid_mocked_input"/>
|
|
694 |
<ok to="ingest_pmc_idmapping_pmidtooaid"/>
|
|
695 | 695 |
<error to="fail"/> |
696 | 696 |
</action> |
697 | 697 |
|
698 |
<action name="generate_pmid_to_oaid_mocked_input"> |
|
699 |
<java> |
|
700 |
<job-tracker>${jobTracker}</job-tracker> |
|
701 |
<name-node>${nameNode}</name-node> |
|
702 |
<!-- The data generated by this node is deleted in this section --> |
|
703 |
<prepare> |
|
704 |
<delete path="${nameNode}${workingDir}/pmid_to_oaid_producer" /> |
|
705 |
<mkdir path="${nameNode}${workingDir}/pmid_to_oaid_producer" /> |
|
706 |
</prepare> |
|
698 |
<action name="ingest_pmc_idmapping_pmidtooaid"> |
|
699 |
<sub-workflow> |
|
700 |
<app-path>${wf:appPath()}/ingest_pmc_idmapping_pmidtooaid</app-path> |
|
701 |
<propagate-configuration/> |
|
707 | 702 |
<configuration> |
708 | 703 |
<property> |
709 |
<name>mapred.job.queue.name</name>
|
|
710 |
<value>${queueName}</value>
|
|
704 |
<name>workingDir</name>
|
|
705 |
<value>${workingDir}/ingest_pmc_idmapping_pmidtooaid/working_dir</value>
|
|
711 | 706 |
</property> |
707 |
<property> |
|
708 |
<name>input_document_nlm</name> |
|
709 |
<value>${workingDir}/import_plaintext_pmc/imported</value> |
|
710 |
</property> |
|
711 |
<property> |
|
712 |
<name>output</name> |
|
713 |
<value>${workingDir}/ingest_pmc_idmapping_pmidtooaid/out</value> |
|
714 |
</property> |
|
712 | 715 |
</configuration> |
713 |
<!-- This is simple wrapper for the Java code --> |
|
714 |
<main-class>eu.dnetlib.iis.core.java.ProcessWrapper</main-class> |
|
715 |
<!-- The business Java code that gets to be executed --> |
|
716 |
<arg>eu.dnetlib.iis.core.java.jsonworkflownodes.Producer</arg> |
|
717 |
<!-- Specification of the output ports --> |
|
718 |
<arg>-C{pmid_to_oaid, |
|
719 |
eu.dnetlib.iis.common.schemas.IdentifierMapping, |
|
720 |
eu/dnetlib/iis/mainworkflows/data/empty.json}</arg> |
|
721 |
<arg>-SworkingDir=${workingDir}/pmid_to_oaid_producer/working_dir</arg> |
|
722 |
<arg>-Opmid_to_oaid=${workingDir}/pmid_to_oaid_producer/pmid_to_oaid</arg> |
|
723 |
</java> |
|
716 |
</sub-workflow> |
|
724 | 717 |
<ok to="ingest_pmc_citations"/> |
725 | 718 |
<error to="fail"/> |
726 | 719 |
</action> |
... | ... | |
748 | 741 |
</property> |
749 | 742 |
<property> |
750 | 743 |
<name>input_pmid_to_oaid</name> |
751 |
<value>${workingDir}/pmid_to_oaid_producer/pmid_to_oaid</value>
|
|
744 |
<value>${workingDir}/ingest_pmc_idmapping_pmidtooaid/out</value>
|
|
752 | 745 |
</property> |
753 | 746 |
<property> |
754 | 747 |
<name>output_citation</name> |
Also available in: Unified diff
#757 Hook up the ingest_pmc_idmapping_pmidtooaid subworkflow to mainworkflows/common/import. From now on, citations are matched by PMID as well.