Project

General

Profile

1 33011 sandro.lab
 <!--
	SET_INFO: start node of the workflow (isStart="true"), type SetProviderInfo.
	Takes three required, system-managed string parameters filled from the
	$params.(...)$ expressions: the data provider id, its name and its interface.
	Its single unnamed arc leads to SELECT_DOWNLOAD.
	NOTE(review): the bare numbers and "revision author" lines interleaved with the
	XML look like blame-view residue, not workflow content; confirm before parsing.
 -->
 <NODE name="SET_INFO" isStart="true" type="SetProviderInfo">
2
	<DESCRIPTION>Set information about current provider</DESCRIPTION>
3
	<PARAMETERS>
4
		<PARAM required="true" type="string" name="providerId" managedBy="system">$params.("dataprovider:id")$</PARAM>
5
		<PARAM required="true" type="string" name="providerName" managedBy="system">$params.("dataprovider:name")$</PARAM>
6
		<PARAM required="true" type="string" name="api" managedBy="system">$params.("dataprovider:interface")$</PARAM>
7
	</PARAMETERS>
8
	<ARCS>
9 43608 claudio.at
		<ARC to="SELECT_DOWNLOAD"/>
10 33011 sandro.lab
	</ARCS>
11
</NODE>
12
13 43608 claudio.at
<!--
	SELECT_DOWNLOAD: Selection node asking whether the download branch should run.
	The user-managed "selection" parameter is restricted by validValues to YES or NO
	and is currently set to YES.
	Arcs: "NO" leads to SELECT_UPDATECACHE, "YES" leads to SELECT_MODE.
	Presumably the arc whose name equals the selection value is followed; verify
	against the Selection node implementation.
-->
<NODE name="SELECT_DOWNLOAD" type="Selection">
14
	<DESCRIPTION>Should download?</DESCRIPTION>
15
	<PARAMETERS>
16 43609 claudio.at
		<PARAM required="true" type="string" name="selection" managedBy="user" function="validValues(['YES', 'NO'])">YES</PARAM>
17 43608 claudio.at
	</PARAMETERS>
18
	<ARCS>
19
		<ARC name="NO" to="SELECT_UPDATECACHE"/>
20
		<ARC name="YES" to="SELECT_MODE"/>
21
	</ARCS>
22
</NODE>
23
24 41467 sandro.lab
<!--
	SELECT_MODE: Selection node choosing the download mode.
	The user-managed "selection" parameter is restricted by validValues to REFRESH
	or INCREMENTAL and is currently set to INCREMENTAL.
	Arcs: "REFRESH" leads to DropContentObjectStore (which then continues to
	findMdStore), "INCREMENTAL" leads directly to findMdStore.
-->
<NODE name="SELECT_MODE" type="Selection">
25 43775 alessia.ba
	<DESCRIPTION>Set download mode</DESCRIPTION>
26 41467 sandro.lab
	<PARAMETERS>
27
		<PARAM required="true" type="string" name="selection" managedBy="user" function="validValues(['REFRESH','INCREMENTAL'])">INCREMENTAL</PARAM>
28
	</PARAMETERS>
29
	<ARCS>
30
		<ARC to="DropContentObjectStore" name="REFRESH" />
31
		<ARC to="findMdStore" name="INCREMENTAL" />
32
	</ARCS>
33
</NODE>
34
35
<!--
	DropContentObjectStore: node of type DropContentObjectStore, reached from the
	"REFRESH" arc of SELECT_MODE.
	Takes one required, system-managed parameter filled from $params.("objs_id")$
	and tagged with category OBJECTSTORE_ID. Its single arc leads to findMdStore.
	NOTE(review): the parameter is spelled "objectstoreId" here, while other nodes in
	this file use "objectStoreID", "objectStoreIdParam" and "objectStoreId"; confirm
	each spelling matches the property expected by its node type.
-->
<NODE name="DropContentObjectStore" type="DropContentObjectStore">
36
	<DESCRIPTION>Drop content on the object Store</DESCRIPTION>
37
	<PARAMETERS>
38
		<PARAM required="true" type="string" name="objectstoreId" managedBy="system" category="OBJECTSTORE_ID">$params.("objs_id")$</PARAM>
39
	</PARAMETERS>
40
	<ARCS>
41
		<ARC to="findMdStore"/>
42
	</ARCS>
43
</NODE>
44
45 33011 sandro.lab
<!--
	findMdStore: node of type RetrieveMdStoreId, reached from SELECT_MODE
	("INCREMENTAL") and from DropContentObjectStore.
	Takes the required, system-managed "providerId" parameter, filled from
	$params.("dataprovider:id")$. Its single arc leads to fetchTransformed.
-->
<NODE name="findMdStore" type="RetrieveMdStoreId">
46
	<DESCRIPTION>Find MDStore</DESCRIPTION>
47
	<PARAMETERS>
48
		<PARAM required="true" type="string" name="providerId" managedBy="system">$params.("dataprovider:id")$</PARAM>
49
	</PARAMETERS>
50
	<ARCS>
51
		<ARC to="fetchTransformed"/>
52
	</ARCS>
53
</NODE>
54
55
<!--
	fetchTransformed: node of type FetchMultipleMDStoreRecords.
	Its required, system-managed "eprParam" is set to clean_epr, the same value the
	following retrieveURL node uses as its inputEprParam.
	Its single arc leads to retrieveURL.
-->
<NODE name="fetchTransformed" type="FetchMultipleMDStoreRecords">
56
	<DESCRIPTION>Fetch records from MDStore</DESCRIPTION>
57
	<PARAMETERS>
58
		<PARAM required="true" type="string" name="eprParam" managedBy="system">clean_epr</PARAM>
59
	</PARAMETERS>
60
	<ARCS>
61
		<ARC to="retrieveURL"/>
62
	</ARCS>
63
</NODE>
64
65
<!--
	retrieveURL: node of type RetrieveURLS.
	User-managed XPath parameters, all matching by local-name() under a "metadata"
	element (so element namespaces are ignored):
	  xpath            selects the text of "fulltext" elements
	  xpathOpenAccess  selects the text of "accessrights" elements
	  xpathEmbargoDate selects the text of "embargoenddate" elements
	System-managed parameters: inputEprParam is clean_epr (the value set by
	fetchTransformed) and outputEprParam is item_epr (the value read by
	downloadRecords). Its single arc leads to downloadRecords.
-->
<NODE name="retrieveURL" type="RetrieveURLS">
66
	<DESCRIPTION>Retrieve URL To Download from MDStore</DESCRIPTION>
67
	<PARAMETERS>
68 48139 alessia.ba
		<PARAM required="true" type="string" name="xpath" managedBy="user">//*[local-name()='metadata']//*[local-name()='fulltext']/text()</PARAM>
69 33011 sandro.lab
		<PARAM required="true" type="string" name="xpathOpenAccess" managedBy="user">//*[local-name()='metadata']//*[local-name()='accessrights']/text()</PARAM>
70
		<PARAM required="true" type="string" name="xpathEmbargoDate" managedBy="user">//*[local-name()='metadata']//*[local-name()='embargoenddate']/text()</PARAM>
71
		<PARAM required="true" type="string" name="inputEprParam" managedBy="system">clean_epr</PARAM>
72
		<PARAM required="true" type="string" name="outputEprParam" managedBy="system">item_epr</PARAM>
73
	</PARAMETERS>
74
	<ARCS>
75
		<ARC to="downloadRecords"/>
76
	</ARCS>
77
</NODE>
78
79
80
<!--
	downloadRecords: node of type DownloadFromMetadataOpenaire.
	System-managed parameters: inputeprParam is item_epr (the outputEprParam of
	retrieveURL) and objectStoreID is filled from $params.("objs_id")$.
	User-managed parameters:
	  plugin             required, empty here; choices come from obtainValues('listDownloadPlugins', {})
	  basepath           optional, empty here
	  protocol           required, empty here; one of HTTP, HTTPS, FTP, File_System, FTPS
	  mimeType           required, empty here; one of the values listed in validValues
	  regularExpression  optional, empty here
	  numberOfThreads    optional int, set to 1
	  connectTimeoutMs   optional int, set to 10000
	  readTimeoutMs      optional int, set to 10000
	  sleepTimeMs        optional int, set to 0
	Its single arc leads to updateSizeObjectStore.
	NOTE(review): the "plugin" function value ends with ";" while the validValues(...)
	functions in this file do not; confirm the trailing ";" is intended.
	NOTE(review): "inputeprParam" and "objectStoreID" are cased differently from
	"inputEprParam" (retrieveURL) and "objectStoreId" (UPDATE_CACHE); confirm they
	match the property names expected by this node type.
-->
<NODE name="downloadRecords" type="DownloadFromMetadataOpenaire">
81
	<DESCRIPTION>Download records</DESCRIPTION>
82
	<PARAMETERS>
83
		<PARAM required="true" type="string" name="inputeprParam" managedBy="system">item_epr</PARAM>
84 33445 sandro.lab
		<PARAM required="true" type="string" name="objectStoreID" managedBy="system" category="OBJECTSTORE_ID">$params.("objs_id")$</PARAM>
85 33011 sandro.lab
		<PARAM required="true" type="string" name="plugin" managedBy="user" function="obtainValues('listDownloadPlugins', {});"></PARAM>
86
		<PARAM required="false" type="string" name="basepath" managedBy="user"></PARAM>
87
		<PARAM required="true" type="string" name="protocol" managedBy="user" function="validValues(['HTTP', 'HTTPS', 'FTP', 'File_System', 'FTPS'])"></PARAM>
88 39991 sandro.lab
		<PARAM required="true" type="string" name="mimeType" managedBy="user" function="validValues(['pdf', 'application/pdf', 'xml', 'file::WoS', 'text', 'text/plain','text/html'])"></PARAM>
89 37568 sandro.lab
		<PARAM required="false" type="string" name="regularExpression" managedBy="user"></PARAM>
90 48139 alessia.ba
		<PARAM required="false" type="int" name="numberOfThreads" managedBy="user">1</PARAM>
91
		<PARAM required="false" type="int" name="connectTimeoutMs" managedBy="user">10000</PARAM>
92
		<PARAM required="false" type="int" name="readTimeoutMs" managedBy="user">10000</PARAM>
93 42135 alessia.ba
		<PARAM required="false" type="int" name="sleepTimeMs" managedBy="user">0</PARAM>
94 33011 sandro.lab
	</PARAMETERS>
95
	<ARCS>
96
		<ARC to="updateSizeObjectStore"/>
97
	</ARCS>
98
</NODE>
99
100
<!--
	updateSizeObjectStore: node of type UpdateObjectStoreSize, reached from
	downloadRecords.
	Takes the required, system-managed "objectStoreIdParam", filled from
	$params.("objs_id")$ and tagged with category OBJECTSTORE_ID.
	Its single arc leads to UPDATE_INFO.
	The DESCRIPTION previously read "Download records", copied from the
	downloadRecords node; it now describes this node.
-->
<NODE name="updateSizeObjectStore" type="UpdateObjectStoreSize">
101
	<DESCRIPTION>Update the size of the object store</DESCRIPTION>
102
	<PARAMETERS>
103 33445 sandro.lab
		<PARAM required="true" type="string" name="objectStoreIdParam" managedBy="system" category="OBJECTSTORE_ID">$params.("objs_id")$</PARAM>
104 33011 sandro.lab
	</PARAMETERS>
105
	<ARCS>
106
		<ARC to="UPDATE_INFO"/>
107
	</ARCS>
108
</NODE>
109
110
<!--
	UPDATE_INFO: node of type ObjectStoreToApiExtraField, reached from
	updateSizeObjectStore.
	All parameters are required and system-managed:
	  objId, datasourceId, datasourceInterface  filled from the $params.(...)$ expressions
	  extraFieldForTotal   last_download_total
	  extraFieldForDate    last_download_date
	  extraFieldForObjId   last_download_objId
	Presumably the three extraFieldFor* values name the API extra fields that get
	written; verify against the node implementation.
	Its single arc leads to SELECT_UPDATECACHE.
-->
<NODE name="UPDATE_INFO" type="ObjectStoreToApiExtraField">
111 43616 claudio.at
	<DESCRIPTION>Update datasource API extra fields</DESCRIPTION>
112 33011 sandro.lab
	<PARAMETERS>
113
		<PARAM required="true" type="string" name="objId" managedBy="system">$params.("objs_id")$</PARAM>
114
		<PARAM required="true" type="string" name="datasourceId" managedBy="system">$params.("dataprovider:id")$</PARAM>
115
		<PARAM required="true" type="string" name="datasourceInterface" managedBy="system">$params.("dataprovider:interface")$</PARAM>
116
		<PARAM required="true" type="string" name="extraFieldForTotal" managedBy="system">last_download_total</PARAM>
117
		<PARAM required="true" type="string" name="extraFieldForDate" managedBy="system">last_download_date</PARAM>
118
		<PARAM required="true" type="string" name="extraFieldForObjId" managedBy="system">last_download_objId</PARAM>
119
	</PARAMETERS>
120
	<ARCS>
121 43608 claudio.at
		<ARC to="SELECT_UPDATECACHE"/>
122 33011 sandro.lab
	</ARCS>
123
</NODE>
124 43591 claudio.at
125 43608 claudio.at
<!--
	SELECT_UPDATECACHE: Selection node asking whether the IIS cache should be
	updated. Reached from SELECT_DOWNLOAD ("NO") and from UPDATE_INFO.
	The user-managed "selection" parameter is restricted by validValues to YES or NO
	and is currently set to NO.
	Arcs: "NO" leads to "success", "YES" leads to UPDATE_CACHE.
	NOTE(review): no node named "success" is defined in the visible part of this
	file; presumably it is a built-in terminal node, to be confirmed.
-->
<NODE name="SELECT_UPDATECACHE" type="Selection">
126 43591 claudio.at
	<DESCRIPTION>Should update IIS cache?</DESCRIPTION>
127
	<PARAMETERS>
128 43592 claudio.at
		<PARAM required="true" type="string" name="selection" managedBy="user" function="validValues(['YES', 'NO'])">NO</PARAM>
129 43591 claudio.at
	</PARAMETERS>
130
	<ARCS>
131
		<ARC name="NO" to="success"/>
132
		<ARC name="YES" to="UPDATE_CACHE"/>
133
	</ARCS>
134
</NODE>
135
136
<!--
	UPDATE_CACHE: node of type IISCacheBuilder, reached from the "YES" arc of
	SELECT_UPDATECACHE.
	All parameters are required and system-managed:
	  hadoopJob      iisCacheBuilderJob
	  objectStoreId  filled from $params.("objs_id")$
	  cluster        IIS
	  simulation     boolean, set to false
	Its single arc leads to "success".
	Whitespace only was normalised: the PARAM lines now all use tab indentation and
	a single space separates the attributes of the "simulation" parameter.
-->
<NODE name="UPDATE_CACHE" type="IISCacheBuilder">
137
	<DESCRIPTION>Update IIS cache with latest objectStore content</DESCRIPTION>
138
	<PARAMETERS>
139
		<PARAM required="true" type="string" name="hadoopJob" managedBy="system">iisCacheBuilderJob</PARAM>
140
		<PARAM required="true" type="string" name="objectStoreId" managedBy="system">$params.("objs_id")$</PARAM>
141
		<PARAM required="true" type="string" name="cluster" managedBy="system">IIS</PARAM>
142
		<PARAM required="true" type="boolean" name="simulation" managedBy="system">false</PARAM>
143
	</PARAMETERS>
144
	<ARCS>
145
		<ARC to="success" />
146
	</ARCS>
147
</NODE>