<!--
  SET_INFO: entry point of the workflow (isStart="true").
  Hands the provider id, name and interface, each resolved from the
  dataprovider:* workflow parameters, to a SetProviderInfo node and then
  follows its single unnamed arc to SELECT_DOWNLOAD.
-->
<NODE name="SET_INFO" isStart="true" type="SetProviderInfo">
  <DESCRIPTION>Set information about current provider</DESCRIPTION>
  <PARAMETERS>
    <PARAM required="true" type="string" name="providerId" managedBy="system">$params.("dataprovider:id")$</PARAM>
    <PARAM required="true" type="string" name="providerName" managedBy="system">$params.("dataprovider:name")$</PARAM>
    <PARAM required="true" type="string" name="api" managedBy="system">$params.("dataprovider:interface")$</PARAM>
  </PARAMETERS>
  <ARCS>
    <ARC to="SELECT_DOWNLOAD"/>
  </ARCS>
</NODE>
<!--
  SELECT_DOWNLOAD: user-managed YES/NO switch (default YES).
  YES continues to SELECT_MODE; NO bypasses the download branch and goes
  directly to SELECT_UPDATECACHE.
-->
<NODE name="SELECT_DOWNLOAD" type="Selection">
  <DESCRIPTION>Should download?</DESCRIPTION>
  <PARAMETERS>
    <PARAM required="true" type="string" name="selection" managedBy="user" function="validValues(['YES', 'NO'])">YES</PARAM>
  </PARAMETERS>
  <ARCS>
    <ARC name="NO" to="SELECT_UPDATECACHE"/>
    <ARC name="YES" to="SELECT_MODE"/>
  </ARCS>
</NODE>
<!--
  SELECT_MODE: user-managed choice between REFRESH and INCREMENTAL
  (default INCREMENTAL).
  REFRESH routes through DropContentObjectStore before findMdStore;
  INCREMENTAL goes straight to findMdStore.
-->
<NODE name="SELECT_MODE" type="Selection">
  <DESCRIPTION>Set download mode</DESCRIPTION>
  <PARAMETERS>
    <PARAM required="true" type="string" name="selection" managedBy="user" function="validValues(['REFRESH','INCREMENTAL'])">INCREMENTAL</PARAM>
  </PARAMETERS>
  <ARCS>
    <ARC name="REFRESH" to="DropContentObjectStore"/>
    <ARC name="INCREMENTAL" to="findMdStore"/>
  </ARCS>
</NODE>
<!--
  DropContentObjectStore: reached only on the REFRESH arc of SELECT_MODE.
  Receives the object store id from the objs_id workflow parameter and then
  continues to findMdStore.
-->
<NODE name="DropContentObjectStore" type="DropContentObjectStore">
  <DESCRIPTION>Drop content on the object Store</DESCRIPTION>
  <PARAMETERS>
    <PARAM required="true" type="string" name="objectstoreId" managedBy="system" category="OBJECTSTORE_ID">$params.("objs_id")$</PARAM>
  </PARAMETERS>
  <ARCS>
    <ARC to="findMdStore"/>
  </ARCS>
</NODE>
<!--
  findMdStore: RetrieveMdStoreId node that receives the provider id from the
  dataprovider:id workflow parameter, then continues to fetchTransformed.
-->
<NODE name="findMdStore" type="RetrieveMdStoreId">
  <DESCRIPTION>Find MDStore</DESCRIPTION>
  <PARAMETERS>
    <PARAM required="true" type="string" name="providerId" managedBy="system">$params.("dataprovider:id")$</PARAM>
  </PARAMETERS>
  <ARCS>
    <ARC to="fetchTransformed"/>
  </ARCS>
</NODE>
<!--
  fetchTransformed: FetchMultipleMDStoreRecords node.
  eprParam is set to clean_epr, the same name that retrieveURL declares as
  its inputEprParam. NOTE(review): presumably this is the name under which
  the fetched result set is published for the next node; confirm against
  the node implementation.
-->
<NODE name="fetchTransformed" type="FetchMultipleMDStoreRecords">
  <DESCRIPTION>Fetch records from MDStore</DESCRIPTION>
  <PARAMETERS>
    <PARAM required="true" type="string" name="eprParam" managedBy="system">clean_epr</PARAM>
  </PARAMETERS>
  <ARCS>
    <ARC to="retrieveURL"/>
  </ARCS>
</NODE>
<!--
  retrieveURL: RetrieveURLS node.
  Three user-editable XPath expressions select, inside any element whose
  local name is "metadata", the text of the fulltext, accessrights and
  embargoenddate elements (matching on local-name() makes the expressions
  independent of namespace prefixes).
  Input is named clean_epr and output item_epr; downloadRecords declares
  item_epr as its input.
-->
<NODE name="retrieveURL" type="RetrieveURLS">
  <DESCRIPTION>Retrieve URL To Download from MDStore</DESCRIPTION>
  <PARAMETERS>
    <PARAM required="true" type="string" name="xpath" managedBy="user">//*[local-name()='metadata']//*[local-name()='fulltext']/text()</PARAM>
    <PARAM required="true" type="string" name="xpathOpenAccess" managedBy="user">//*[local-name()='metadata']//*[local-name()='accessrights']/text()</PARAM>
    <PARAM required="true" type="string" name="xpathEmbargoDate" managedBy="user">//*[local-name()='metadata']//*[local-name()='embargoenddate']/text()</PARAM>
    <PARAM required="true" type="string" name="inputEprParam" managedBy="system">clean_epr</PARAM>
    <PARAM required="true" type="string" name="outputEprParam" managedBy="system">item_epr</PARAM>
  </PARAMETERS>
  <ARCS>
    <ARC to="downloadRecords"/>
  </ARCS>
</NODE>
<!--
  downloadRecords: DownloadFromMetadataOpenaire node.
  Input is named item_epr (the outputEprParam of retrieveURL) and the target
  object store id comes from the objs_id workflow parameter.
  User-managed settings:
    plugin            required, no default; choices come from
                      obtainValues('listDownloadPlugins', {})
    protocol          required, no default; HTTP, HTTPS, FTP, File_System, FTPS
    mimeType          required, no default; see validValues list below
    basepath          optional, no default
    regularExpression optional, no default
    numberOfThreads   optional int, default 1
    connectTimeoutMs  optional int, default 10000
    readTimeoutMs     optional int, default 10000
    sleepTimeMs       optional int, default 0
  NOTE(review): the parameter is spelled "inputeprParam" here but
  "inputEprParam" on retrieveURL. It is left unchanged because the name
  presumably binds to a property of the node implementation; confirm before
  renaming.
-->
<NODE name="downloadRecords" type="DownloadFromMetadataOpenaire">
  <DESCRIPTION>Download records</DESCRIPTION>
  <PARAMETERS>
    <PARAM required="true" type="string" name="inputeprParam" managedBy="system">item_epr</PARAM>
    <PARAM required="true" type="string" name="objectStoreID" managedBy="system" category="OBJECTSTORE_ID">$params.("objs_id")$</PARAM>
    <PARAM required="true" type="string" name="plugin" managedBy="user" function="obtainValues('listDownloadPlugins', {});"></PARAM>
    <PARAM required="false" type="string" name="basepath" managedBy="user"></PARAM>
    <PARAM required="true" type="string" name="protocol" managedBy="user" function="validValues(['HTTP', 'HTTPS', 'FTP', 'File_System', 'FTPS'])"></PARAM>
    <PARAM required="true" type="string" name="mimeType" managedBy="user" function="validValues(['pdf', 'application/pdf', 'xml', 'file::WoS', 'text', 'text/plain','text/html'])"></PARAM>
    <PARAM required="false" type="string" name="regularExpression" managedBy="user"></PARAM>
    <PARAM required="false" type="int" name="numberOfThreads" managedBy="user">1</PARAM>
    <PARAM required="false" type="int" name="connectTimeoutMs" managedBy="user">10000</PARAM>
    <PARAM required="false" type="int" name="readTimeoutMs" managedBy="user">10000</PARAM>
    <PARAM required="false" type="int" name="sleepTimeMs" managedBy="user">0</PARAM>
  </PARAMETERS>
  <ARCS>
    <ARC to="updateSizeObjectStore"/>
  </ARCS>
</NODE>
<!--
  updateSizeObjectStore: UpdateObjectStoreSize node that runs after
  downloadRecords. Receives the object store id from the objs_id workflow
  parameter and then continues to UPDATE_INFO.
  The description previously read "Download records", duplicated from the
  downloadRecords node; it now describes this node.
-->
<NODE name="updateSizeObjectStore" type="UpdateObjectStoreSize">
  <DESCRIPTION>Update object store size</DESCRIPTION>
  <PARAMETERS>
    <PARAM required="true" type="string" name="objectStoreIdParam" managedBy="system" category="OBJECTSTORE_ID">$params.("objs_id")$</PARAM>
  </PARAMETERS>
  <ARCS>
    <ARC to="UPDATE_INFO"/>
  </ARCS>
</NODE>
<!--
  UPDATE_INFO: ObjectStoreToApiExtraField node.
  Receives the object store id (objs_id) plus the datasource id and interface
  (dataprovider:id, dataprovider:interface) and the names of three extra
  fields: last_download_total, last_download_date and last_download_objId.
  Continues to SELECT_UPDATECACHE.
-->
<NODE name="UPDATE_INFO" type="ObjectStoreToApiExtraField">
  <DESCRIPTION>Update datasource API extra fields</DESCRIPTION>
  <PARAMETERS>
    <PARAM required="true" type="string" name="objId" managedBy="system">$params.("objs_id")$</PARAM>
    <PARAM required="true" type="string" name="datasourceId" managedBy="system">$params.("dataprovider:id")$</PARAM>
    <PARAM required="true" type="string" name="datasourceInterface" managedBy="system">$params.("dataprovider:interface")$</PARAM>
    <PARAM required="true" type="string" name="extraFieldForTotal" managedBy="system">last_download_total</PARAM>
    <PARAM required="true" type="string" name="extraFieldForDate" managedBy="system">last_download_date</PARAM>
    <PARAM required="true" type="string" name="extraFieldForObjId" managedBy="system">last_download_objId</PARAM>
  </PARAMETERS>
  <ARCS>
    <ARC to="SELECT_UPDATECACHE"/>
  </ARCS>
</NODE>
<!--
  SELECT_UPDATECACHE: user-managed YES/NO switch (default NO).
  Reached from UPDATE_INFO and from the NO arc of SELECT_DOWNLOAD.
  YES continues to UPDATE_CACHE; NO goes to "success".
-->
<NODE name="SELECT_UPDATECACHE" type="Selection">
  <DESCRIPTION>Should update IIS cache?</DESCRIPTION>
  <PARAMETERS>
    <PARAM required="true" type="string" name="selection" managedBy="user" function="validValues(['YES', 'NO'])">NO</PARAM>
  </PARAMETERS>
  <ARCS>
    <ARC name="NO" to="success"/>
    <ARC name="YES" to="UPDATE_CACHE"/>
  </ARCS>
</NODE>
<!--
  UPDATE_CACHE: IISCacheBuilder node, reached only on the YES arc of
  SELECT_UPDATECACHE.
  System-managed settings: hadoopJob=iisCacheBuilderJob, cluster=IIS,
  simulation=false, and the object store id from the objs_id workflow
  parameter.
  NOTE(review): the arc target "success" is not defined as a NODE in this
  part of the file; presumably it is a terminal node provided by the
  workflow engine. Confirm.
-->
<NODE name="UPDATE_CACHE" type="IISCacheBuilder">
  <DESCRIPTION>Update IIS cache with latest objectStore content</DESCRIPTION>
  <PARAMETERS>
    <PARAM required="true" type="string" name="hadoopJob" managedBy="system">iisCacheBuilderJob</PARAM>
    <PARAM required="true" type="string" name="objectStoreId" managedBy="system">$params.("objs_id")$</PARAM>
    <PARAM required="true" type="string" name="cluster" managedBy="system">IIS</PARAM>
    <PARAM required="true" type="boolean" name="simulation" managedBy="system">false</PARAM>
  </PARAMETERS>
  <ARCS>
    <ARC to="success"/>
  </ARCS>
</NODE>