Revision 47563
Added by Marek Horst almost 7 years ago
modules/icm-iis-schemas/trunk/pom.xml.disabled | ||
---|---|---|
1 |
<?xml version="1.0" encoding="UTF-8"?> |
|
2 |
<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/maven-v4_0_0.xsd"> |
|
3 |
<parent> |
|
4 |
<groupId>eu.dnetlib</groupId> |
|
5 |
<artifactId>dnet-hadoop-parent</artifactId> |
|
6 |
<version>1.0.0</version> |
|
7 |
</parent> |
|
8 |
<modelVersion>4.0.0</modelVersion> |
|
9 |
<artifactId>icm-iis-schemas</artifactId> |
|
10 |
<packaging>jar</packaging> |
|
11 |
<version>1.0.1-SNAPSHOT</version> |
|
12 |
|
|
13 |
<scm> |
|
14 |
<developerConnection> |
|
15 |
scm:svn:https://svn.driver.research-infrastructures.eu/driver/dnet40/modules/icm-iis-schemas/trunk |
|
16 |
</developerConnection> |
|
17 |
</scm> |
|
18 |
|
|
19 |
<properties> |
|
20 |
<project.build.sourceEncoding>UTF-8</project.build.sourceEncoding> |
|
21 |
</properties> |
|
22 |
<dependencies> |
|
23 |
<dependency> |
|
24 |
<groupId>org.apache.avro</groupId> |
|
25 |
<artifactId>avro</artifactId> |
|
26 |
<version>${iis.avro.version}</version> |
|
27 |
</dependency> |
|
28 |
</dependencies> |
|
29 |
<build> |
|
30 |
<plugins> |
|
31 |
<!-- Plugin that generates Java classes from Avro schemas --> |
|
32 |
<plugin> |
|
33 |
<groupId>org.apache.avro</groupId> |
|
34 |
<artifactId>avro-maven-plugin</artifactId> |
|
35 |
<version>${iis.avro.version}</version> |
|
36 |
<executions> |
|
37 |
<execution> |
|
38 |
<phase>generate-sources</phase> |
|
39 |
<goals> |
|
40 |
<goal>schema</goal> |
|
41 |
<goal>idl-protocol</goal> |
|
42 |
</goals> |
|
43 |
<configuration> |
|
44 |
<excludes> |
|
45 |
<exclude>**/schemas/avro/**</exclude> |
|
46 |
<exclude>**/schemas/protobuf/**</exclude> |
|
47 |
</excludes> |
|
48 |
<sourceDirectory>${project.basedir}/src/main/resources/eu/dnetlib/iis/</sourceDirectory> |
|
49 |
<outputDirectory>${project.basedir}/target/generated-sources/java/</outputDirectory> |
|
50 |
</configuration> |
|
51 |
</execution> |
|
52 |
</executions> |
|
53 |
</plugin> |
|
54 |
<!-- This plugin makes the Maven->Update Project Configuration |
|
55 |
not forget about the "target/generated-sources/java" source path--> |
|
56 |
<plugin> |
|
57 |
<groupId>org.codehaus.mojo</groupId> |
|
58 |
<artifactId>build-helper-maven-plugin</artifactId> |
|
59 |
<executions> |
|
60 |
<execution> |
|
61 |
<id>add-source</id> |
|
62 |
<phase>generate-sources</phase> |
|
63 |
<goals> |
|
64 |
<goal>add-source</goal> |
|
65 |
</goals> |
|
66 |
<configuration> |
|
67 |
<sources> |
|
68 |
<source>${project.build.directory}/generated-sources/java/</source> |
|
69 |
</sources> |
|
70 |
</configuration> |
|
71 |
</execution> |
|
72 |
</executions> |
|
73 |
</plugin> |
|
74 |
</plugins> |
|
75 |
<pluginManagement> |
|
76 |
<plugins> |
|
77 |
<!--This plugin's configuration is used to store Eclipse m2e settings only. It has no influence on the Maven build itself.--> |
|
78 |
<plugin> |
|
79 |
<groupId>org.eclipse.m2e</groupId> |
|
80 |
<artifactId>lifecycle-mapping</artifactId> |
|
81 |
<version>1.0.0</version> |
|
82 |
<configuration> |
|
83 |
<lifecycleMappingMetadata> |
|
84 |
<pluginExecutions> |
|
85 |
<pluginExecution> |
|
86 |
<pluginExecutionFilter> |
|
87 |
<groupId> |
|
88 |
org.apache.avro |
|
89 |
</groupId> |
|
90 |
<artifactId> |
|
91 |
avro-maven-plugin |
|
92 |
</artifactId> |
|
93 |
<versionRange> |
|
94 |
[1.7.4,) |
|
95 |
</versionRange> |
|
96 |
<goals> |
|
97 |
<goal>idl-protocol</goal> |
|
98 |
<goal>schema</goal> |
|
99 |
</goals> |
|
100 |
</pluginExecutionFilter> |
|
101 |
<action> |
|
102 |
<ignore /> |
|
103 |
</action> |
|
104 |
</pluginExecution> |
|
105 |
<pluginExecution> |
|
106 |
<pluginExecutionFilter> |
|
107 |
<groupId> |
|
108 |
org.codehaus.mojo |
|
109 |
</groupId> |
|
110 |
<artifactId> |
|
111 |
build-helper-maven-plugin |
|
112 |
</artifactId> |
|
113 |
<versionRange> |
|
114 |
[1.7,) |
|
115 |
</versionRange> |
|
116 |
<goals> |
|
117 |
<goal>add-source</goal> |
|
118 |
</goals> |
|
119 |
</pluginExecutionFilter> |
|
120 |
<action> |
|
121 |
<ignore /> |
|
122 |
</action> |
|
123 |
</pluginExecution> |
|
124 |
</pluginExecutions> |
|
125 |
</lifecycleMappingMetadata> |
|
126 |
</configuration> |
|
127 |
</plugin> |
|
128 |
</plugins> |
|
129 |
</pluginManagement> |
|
130 |
</build> |
|
131 |
<repositories> |
|
132 |
</repositories> |
|
133 |
</project> |
|
0 | 134 |
modules/icm-iis-schemas/trunk/src/main/java/helloworld/HelloWorld.java | ||
---|---|---|
1 |
package helloworld; |
|
2 |
|
|
3 |
/** |
|
4 |
* This class is here only to make Sonar happy, since when the project |
|
5 |
* does not contain any Java code, Sonar complains. If currently there is some |
|
6 |
* other code in the project, feel free to delete this class along with its |
|
7 |
* package. |
|
8 |
* @author Mateusz Kobos |
|
9 |
* |
|
10 |
*/ |
|
11 |
public class HelloWorld { |
|
12 |
|
|
13 |
public static void main(String[] args){ |
|
14 |
System.out.println("Hello world!"); |
|
15 |
} |
|
16 |
|
|
17 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/metadataextraction/ReferenceMetadata.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.metadataextraction.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "ReferenceBasicMetadata.avdl"; |
|
5 |
|
|
6 |
record ReferenceMetadata { |
|
7 |
ReferenceBasicMetadata basicMetadata; |
|
8 |
// reference position in bibliography, starting with '1' |
|
9 |
union { null , int } position = null; |
|
10 |
// raw citation string held here just in case - maybe we will be able to use it |
|
11 |
// instead of basicMetadata if the latter one turns out to be of a low quality |
|
12 |
union { null , string } text = null; |
|
13 |
} |
|
14 |
|
|
15 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/metadataextraction/ExtractedDocumentMetadataEnvelope.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.metadataextraction.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "ExtractedDocumentMetadata.avdl"; |
|
5 |
|
|
6 |
record ExtractedDocumentMetadataEnvelope { |
|
7 |
eu.dnetlib.iis.metadataextraction.schemas.ExtractedDocumentMetadata data; |
|
8 |
string origin; |
|
9 |
} |
|
10 |
|
|
11 |
} |
|
12 |
|
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/metadataextraction/ReferenceBasicMetadata.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.metadataextraction.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record Range { |
|
5 |
union { null , string } start = null; |
|
6 |
union { null , string } end = null; |
|
7 |
} |
|
8 |
|
|
9 |
record ReferenceBasicMetadata { |
|
10 |
union { null , string } title = null; |
|
11 |
// author names (a single string corresponds to a single author) |
|
12 |
union { null , array<string> } authors = null; |
|
13 |
union { null , Range } pages = null; |
|
14 |
// the name of a journal, a book or anything that the article comes from |
|
15 |
union { null , string } source = null; |
|
16 |
union { null , string } volume = null; |
|
17 |
union { null , string } year = null; |
|
18 |
|
|
19 |
union { null , string } edition = null; |
|
20 |
union { null , string } publisher = null; |
|
21 |
union { null , string } location = null; |
|
22 |
union { null , string } series = null; |
|
23 |
union { null , string } issue = null; |
|
24 |
union { null , string } url = null; |
|
25 |
union { null , map<string> } externalIds = null; |
|
26 |
} |
|
27 |
|
|
28 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/metadataextraction/DocumentText.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.metadataextraction.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record DocumentText { |
|
5 |
// document identifier |
|
6 |
// foreign key: DocumentMetadata.id ("raw document metadata" data store) |
|
7 |
string id; |
|
8 |
// document fulltext |
|
9 |
union { null , string } text = null; |
|
10 |
} |
|
11 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/metadataextraction/ExtractedDocumentMetadata.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.metadataextraction.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "Affiliation.avdl"; |
|
5 |
import idl "ReferenceBasicMetadata.avdl"; |
|
6 |
import idl "ReferenceMetadata.avdl"; |
|
7 |
|
|
8 |
record Author { |
|
9 |
// author name extracted from pdf document |
|
10 |
union { null , string } authorFullName = null; |
|
11 |
// position on affiliations list |
|
12 |
union { null , array<int> } affiliationPositions = null; |
|
13 |
} |
|
14 |
|
|
15 |
record ExtractedDocumentMetadata { |
|
16 |
// ID of the document, foreign key: Document.id ("document" data store) |
|
17 |
string id; |
|
18 |
|
|
19 |
// moved from DocumentBasicMetadata |
|
20 |
// title |
|
21 |
union { null , string } title = null; |
|
22 |
// abstract or description |
|
23 |
union { null , string } abstract = null; |
|
24 |
union { null , string } language = null; |
|
25 |
// list of keywords (free form) |
|
26 |
union { null , array<string> } keywords = null; |
|
27 |
// alternative identifier (e.g. internal publisher's identifiers) |
|
28 |
union { null , map<string> } externalIdentifiers = null; |
|
29 |
// name of journal in which the article is published |
|
30 |
union { null , string } journal = null; |
|
31 |
// year of publication |
|
32 |
union { null , int } year = null; |
|
33 |
// publisher name |
|
34 |
union { null , string } publisher = null; |
|
35 |
// end of: moved from DocumentBasicMetadata |
|
36 |
|
|
37 |
// references extracted from pdf document |
|
38 |
union { null , array<ReferenceMetadata> } references = null; |
|
39 |
// author names extracted from pdf document |
|
40 |
// union { null , array<string> } authorFullNames = null; |
|
41 |
// authors extracted from PDF document along with position of affiliations list |
|
42 |
union { null , array<Author> } authors = null; |
|
43 |
|
|
44 |
// affiliations extracted from PDF document |
|
45 |
union { null , array<Affiliation> } affiliations = null; |
|
46 |
|
|
47 |
// additional fields supplementing basicMetadata |
|
48 |
// journal volume in which the article is published |
|
49 |
union { null , string } volume = null; |
|
50 |
// journal issue in which the article is published |
|
51 |
union { null , string } issue = null; |
|
52 |
// page range in which the article is published |
|
53 |
union { null , Range } pages = null; |
|
54 |
|
|
55 |
// propagated from pmc ExtractedDocumentMetadata#entityType |
|
56 |
union { null , string } publicationTypeName = null; |
|
57 |
} |
|
58 |
|
|
59 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/metadataextraction/Affiliation.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.metadataextraction.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record Affiliation { |
|
5 |
|
|
6 |
// organization name |
|
7 |
union { null , string } organization = null; |
|
8 |
// country name |
|
9 |
union { null , string } countryName = null; |
|
10 |
// country ISO 3166-1 alpha-2 uppercased code |
|
11 |
union { null , string } countryCode = null; |
|
12 |
// address |
|
13 |
union { null , string } address = null; |
|
14 |
// raw affiliation text |
|
15 |
string rawText; |
|
16 |
} |
|
17 |
|
|
18 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/export/SimilarToPerson.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.export.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "../websiteusage/PersonWebsiteUsageSimilarities.avdl"; |
|
5 |
|
|
6 |
record SimilarToPerson { |
|
7 |
// foreign key: PersonWithInferencedData.id ("person with inferenced data" data store) |
|
8 |
string personId; |
|
9 |
union { null , eu.dnetlib.iis.websiteusage.schemas.PersonWebsiteUsageSimilarities } similarities = null; |
|
10 |
} |
|
11 |
|
|
12 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/export/Citations.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.export.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "../common/citations/CitationEntry.avdl"; |
|
5 |
|
|
6 |
record Citations { |
|
7 |
// citing document OA+ identifier |
|
8 |
string documentId; |
|
9 |
array<eu.dnetlib.iis.common.citations.schemas.CitationEntry> citations; |
|
10 |
} |
|
11 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/export/DocumentToConceptIds.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.export.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record Concept { |
|
5 |
// concept identifier |
|
6 |
string id; |
|
7 |
// Find more details on `confidenceLevel` constraints in eu/dnetlib/iis/README.markdown file. |
|
8 |
union { null , float } confidenceLevel = null; |
|
9 |
} |
|
10 |
|
|
11 |
record DocumentToConceptIds { |
|
12 |
// document ID, foreign key: DocumentText.id |
|
13 |
string documentId; |
|
14 |
array<Concept> concepts; |
|
15 |
} |
|
16 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/export/IdWithText.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.export.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record IdWithText { |
|
5 |
string id; |
|
6 |
string text; |
|
7 |
} |
|
8 |
|
|
9 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/export/IdWithConfidenceLevel.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.export.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record IdWithConfidenceLevel { |
|
5 |
string id; |
|
6 |
// Find more details on `confidenceLevel` constraints in eu/dnetlib/iis/README.markdown file. |
|
7 |
union { null , float } confidenceLevel = null; |
|
8 |
} |
|
9 |
|
|
10 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/export/DocumentMetadata.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.export.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "../metadataextraction/Affiliation.avdl"; |
|
5 |
|
|
6 |
record DocumentMetadata { |
|
7 |
// ID of the document, foreign key: Document.id ("document" data store) |
|
8 |
string id; |
|
9 |
|
|
10 |
// affiliations extracted from PDF document |
|
11 |
union { null , array<eu.dnetlib.iis.metadataextraction.schemas.Affiliation> } affiliations = null; |
|
12 |
|
|
13 |
} |
|
14 |
|
|
15 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/export/SimilarToDocument.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.export.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record SimilarToDocument { |
|
5 |
// foreign key: DocumentWithInferencedData.id ("document with inferenced data" data store) |
|
6 |
string documentId; |
|
7 |
union { null , float } covisitedSimilarity = null; |
|
8 |
} |
|
9 |
|
|
10 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/export/auxiliary/Identifier.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.export.auxiliary.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record Identifier { |
|
5 |
string id; |
|
6 |
} |
|
7 |
|
|
8 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/export/SimilarToDataSet.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.export.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "../websiteusage/DataSetWebsiteUsageSimilarities.avdl"; |
|
5 |
|
|
6 |
record SimilarToDataSet { |
|
7 |
// foreign key: DataSetWithInferencedData.id ("data set with inferenced data" data store) |
|
8 |
string dataSetId; |
|
9 |
union { null , eu.dnetlib.iis.websiteusage.schemas.DataSetWebsiteUsageSimilarities } similarities = null; |
|
10 |
} |
|
11 |
|
|
12 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/citationmatching/Citation.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.citationmatching.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record Citation { |
|
5 |
// citing document identifier |
|
6 |
string sourceDocumentId; |
|
7 |
// position of citation in the bibliography of the source document |
|
8 |
int position; |
|
9 |
// cited document identifier |
|
10 |
string destinationDocumentId; |
|
11 |
// A number from [0, 1] range. The greater the value, the greater the |
|
12 |
// confidence that the document->document citation link is correct. |
|
13 |
// Find more details on `confidenceLevel` constraints in eu/dnetlib/iis/README.markdown file. |
|
14 |
float confidenceLevel; |
|
15 |
} |
|
16 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/citationmatching/DocumentMetadata.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.citationmatching.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record BasicMetadata { |
|
5 |
array<string> authors; |
|
6 |
union { null , string } title = null; |
|
7 |
union { null , string } journal = null; |
|
8 |
union { null , string } pages = null; |
|
9 |
union { null , string } year = null; |
|
10 |
} |
|
11 |
|
|
12 |
record ReferenceMetadata { |
|
13 |
// reference position in the bibliography |
|
14 |
int position; |
|
15 |
BasicMetadata basicMetadata; |
|
16 |
union { null , string } rawText = null; |
|
17 |
} |
|
18 |
|
|
19 |
record DocumentMetadata { |
|
20 |
string id; |
|
21 |
BasicMetadata basicMetadata; |
|
22 |
array<ReferenceMetadata> references; |
|
23 |
} |
|
24 |
} |
|
25 |
|
|
26 |
|
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/citationmatching/direct/Citation.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.citationmatching.direct.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record Citation { |
|
5 |
// citing document OA+ identifier |
|
6 |
string sourceDocumentId; |
|
7 |
// position of citation in the bibliography of the source document |
|
8 |
int position; |
|
9 |
// cited document OA+ identifier |
|
10 |
string destinationDocumentId; |
|
11 |
} |
|
12 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/citationmatching/direct/DocumentMetadata.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.citationmatching.direct.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record ReferenceMetadata { |
|
5 |
// reference position in the bibliography |
|
6 |
int position; |
|
7 |
// external identifiers |
|
8 |
union { null , map<string> } externalIds = null; |
|
9 |
} |
|
10 |
|
|
11 |
record DocumentMetadata { |
|
12 |
string id; |
|
13 |
// alternative identifier (e.g. internal publisher's identifiers) |
|
14 |
union { null , map<string> } externalIdentifiers = null; |
|
15 |
// detailed publication type name, originates from extracted metadata |
|
16 |
union { null , string } publicationTypeName = null; |
|
17 |
array<ReferenceMetadata> references; |
|
18 |
} |
|
19 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/citationmatching/PartialCitation.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.citationmatching.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record PartialCitation { |
|
5 |
// citing document identifier |
|
6 |
string sourceDocumentId; |
|
7 |
// position of citation in the bibliography of the source document |
|
8 |
int position; |
|
9 |
// cited document identifier |
|
10 |
string destinationDocumentId; |
|
11 |
// A number from [0, 1] range. The greater the value, the greater the |
|
12 |
// confidence that the document->document citation link is correct. |
|
13 |
// Find more details on `confidenceLevel` constraints in eu/dnetlib/iis/README.markdown file. |
|
14 |
float confidenceLevel; |
|
15 |
} |
|
16 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/transformers/metadatamerger/ExtractedDocumentMetadataMergedWithOriginal.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.transformers.metadatamerger.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "../../metadataextraction/ReferenceMetadata.avdl"; |
|
5 |
|
|
6 |
record PublicationType { |
|
7 |
boolean article = false; |
|
8 |
boolean dataset = false; |
|
9 |
} |
|
10 |
|
|
11 |
record ExtractedDocumentMetadataMergedWithOriginal { |
|
12 |
// ID of the document, foreign key: Document.id ("document" data store) |
|
13 |
string id; |
|
14 |
// original metadata merged with extracted from pdf document |
|
15 |
|
|
16 |
// moved from DocumentBasicMetadata |
|
17 |
// title |
|
18 |
union { null , string } title = null; |
|
19 |
// abstract or description |
|
20 |
union { null , string } abstract = null; |
|
21 |
union { null , string } language = null; |
|
22 |
// list of keywords (free form) |
|
23 |
union { null , array<string> } keywords = null; |
|
24 |
// alternative identifier (e.g. internal publisher's identifiers) |
|
25 |
union { null , map<string> } externalIdentifiers = null; |
|
26 |
// name of journal in which the article is published |
|
27 |
union { null , string } journal = null; |
|
28 |
// year of publication |
|
29 |
union { null , int } year = null; |
|
30 |
// publisher name |
|
31 |
union { null , string } publisher = null; |
|
32 |
// end of: moved from DocumentBasicMetadata |
|
33 |
// publication type, originates from metadata |
|
34 |
PublicationType publicationType; |
|
35 |
|
|
36 |
// references extracted from pdf document |
|
37 |
union { null , array<eu.dnetlib.iis.metadataextraction.schemas.ReferenceMetadata> } references = null; |
|
38 |
// author names extracted from pdf document |
|
39 |
union { null , array<string> } extractedAuthorFullNames = null; |
|
40 |
// author ids retrieved from "document" datastore |
|
41 |
union { null , array<string> } authorIds = null; |
|
42 |
|
|
43 |
// additional fields extracted from PDF document |
|
44 |
// journal volume in which the article is published |
|
45 |
union { null , string } volume = null; |
|
46 |
// journal issue in which the article is published |
|
47 |
union { null , string } issue = null; |
|
48 |
// page range in which the article is published |
|
49 |
union { null , eu.dnetlib.iis.metadataextraction.schemas.Range } pages = null; |
|
50 |
|
|
51 |
// detailed publication type name, originates from extracted metadata |
|
52 |
union { null , string } publicationTypeName = null; |
|
53 |
} |
|
54 |
|
|
55 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/websiteusage/DataSetsWithWebsiteUsageSimilarities.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.websiteusage.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "DataSetWebsiteUsageSimilarities.avdl"; |
|
5 |
|
|
6 |
record DataSetsWithWebsiteUsageSimilarities { |
|
7 |
// foreign key: DataSetReference.id ("data set" data store) |
|
8 |
string dataSetId; |
|
9 |
// foreign key: DataSetReference.id ("data set" data store) |
|
10 |
string otherDataSetId; |
|
11 |
union { null , DataSetWebsiteUsageSimilarities } similarities = null; |
|
12 |
} |
|
13 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/websiteusage/DataSetWebsiteUsageSimilarities.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.websiteusage.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record DataSetWebsiteUsageSimilarities { |
|
5 |
// coefficient from [0, 1] range, |
|
6 |
// the greater the number, the more similar the datasets w.r.t |
|
7 |
// being visited together |
|
8 |
union { null , float } covisitedSimilarity = null; |
|
9 |
// some other similarity metrics, to be specified by NKUA |
|
10 |
} |
|
11 |
|
|
12 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/websiteusage/PersonsWithWebsiteUsageSimilarities.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.websiteusage.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "PersonWebsiteUsageSimilarities.avdl"; |
|
5 |
|
|
6 |
record PersonsWithWebsiteUsageSimilarities { |
|
7 |
// foreign key: Person.id ("person" data store) |
|
8 |
string personId; |
|
9 |
// foreign key: Person.id ("person" data store) |
|
10 |
string otherPersonId; |
|
11 |
union { null , PersonWebsiteUsageSimilarities } similarities = null; |
|
12 |
} |
|
13 |
|
|
14 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/websiteusage/PersonWebsiteUsageSimilarities.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.websiteusage.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record PersonWebsiteUsageSimilarities { |
|
5 |
// coefficient from [0, 1] range, |
|
6 |
// the greater the number, the more similar the persons w.r.t being visited together |
|
7 |
union { null , float } covisitedSimilarity = null; |
|
8 |
// some other similarity metrics, to be specified by NKUA |
|
9 |
} |
|
10 |
|
|
11 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/websiteusage/LogEntry.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.websiteusage.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record LogEntry { |
|
5 |
// WARNING: the records in data store conforming to this schema have to be ordered by 'timestamp' field from the oldest to the newest. |
|
6 |
string timestamp; |
|
7 |
string action; |
|
8 |
union { null , string } user = null; |
|
9 |
union { null , string } session = null; |
|
10 |
union { null , string } data = null; |
|
11 |
} |
|
12 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/websiteusage/DocumentsWithWebsiteUsageSimilarities.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.websiteusage.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record DocumentsWithWebsiteUsageSimilarities { |
|
5 |
// foreign key: Document.id ("document" data store) |
|
6 |
string documentId; |
|
7 |
// foreign key: Document.id ("document" data store) |
|
8 |
string otherDocumentId; |
|
9 |
union { null , float } covisitedSimilarity = null; |
|
10 |
} |
|
11 |
|
|
12 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/websiteusage/DocumentToCommunity.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.websiteusage.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record DocumentToCommunity { |
|
5 |
// document identifier, foreign key: DocumentMetadata.id ("document metadata" data store) |
|
6 |
string SimilarDocid; |
|
7 |
// community identifier |
|
8 |
string cid; |
|
9 |
} |
|
10 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/common/DocumentId.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.common.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record DocumentId { |
|
5 |
// document identifier |
|
6 |
string id; |
|
7 |
} |
|
8 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/common/IdentifierMapping.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.common.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record IdentifierMapping { |
|
5 |
// original document identifier |
|
6 |
string originalId; |
|
7 |
// new document identifier |
|
8 |
string newId; |
|
9 |
} |
|
10 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/common/citations/Citation.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.common.citations.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "CitationEntry.avdl"; |
|
5 |
|
|
6 |
record Citation { |
|
7 |
// citing document OA+ identifier |
|
8 |
string sourceDocumentId; |
|
9 |
eu.dnetlib.iis.common.citations.schemas.CitationEntry entry; |
|
10 |
} |
|
11 |
} |
|
12 |
|
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/common/citations/CitationEntry.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.common.citations.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
// At least one of rawText, destinationDocumentId, externalDestinationDocumentIds fields is not empty. |
|
5 |
record CitationEntry { |
|
6 |
// position of citation in the bibliography of the source document |
|
7 |
int position; |
|
8 |
// raw citation text |
|
9 |
union { null , string } rawText = null; |
|
10 |
// cited document OA+ identifier (if referenced document is present in OA+) |
|
11 |
union { null , string } destinationDocumentId = null; |
|
12 |
// A number from [0, 1] range. The greater the value, the greater the |
|
13 |
// confidence that the document->document citation link is correct. |
|
14 |
// The `confidenceLevel` field is null if and only if the `destinationDocumentId` is null. |
|
15 |
// Find more details on `confidenceLevel` constraints in eu/dnetlib/iis/README.markdown file. |
|
16 |
union { null , float } confidenceLevel = null; |
|
17 |
// cited document identifiers (id type -> id) |
|
18 |
// WARNING: Id types are extracted from PMC data without any processing thus are subject to change without notice. |
|
19 |
// Currently (2014-05-12), the most popular types are "pmid" (PubMed ID) and "doi". |
|
20 |
map<string> externalDestinationDocumentIds; |
|
21 |
} |
|
22 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/common/citations/CitationEnvelope.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.common.citations.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "Citation.avdl"; |
|
5 |
|
|
6 |
|
|
7 |
record CitationEnvelope { |
|
8 |
eu.dnetlib.iis.common.citations.schemas.Citation data; |
|
9 |
string origin; |
|
10 |
} |
|
11 |
|
|
12 |
} |
|
13 |
|
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/ingest/pmc/metadata/ReferenceMetadata.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.ingest.pmc.metadata.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "ReferenceBasicMetadata.avdl"; |
|
5 |
|
|
6 |
record ReferenceMetadata { |
|
7 |
ReferenceBasicMetadata basicMetadata; |
|
8 |
// reference position in bibliography, starting with '1' |
|
9 |
union { null , int } position = null; |
|
10 |
// raw citation string held here just in case - maybe we will be able to use it |
|
11 |
// instead of basicMetadata if the latter one turns out to be of a low quality |
|
12 |
union { null , string } text = null; |
|
13 |
} |
|
14 |
|
|
15 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/ingest/pmc/metadata/ReferenceBasicMetadata.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.ingest.pmc.metadata.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record Range { |
|
5 |
union { null , string } start = null; |
|
6 |
union { null , string } end = null; |
|
7 |
} |
|
8 |
|
|
9 |
record ReferenceBasicMetadata { |
|
10 |
union { null , string } title = null; |
|
11 |
// author names (a single string corresponds to a single author) |
|
12 |
union { null , array<string> } authors = null; |
|
13 |
union { null , Range } pages = null; |
|
14 |
// the name of a journal, a book or anything that the article comes from |
|
15 |
union { null , string } source = null; |
|
16 |
union { null , string } volume = null; |
|
17 |
union { null , string } year = null; |
|
18 |
union { null , string } issue = null; |
|
19 |
map<string> externalIds; |
|
20 |
} |
|
21 |
|
|
22 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/ingest/pmc/metadata/ExtractedDocumentMetadata.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.ingest.pmc.metadata.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "ReferenceMetadata.avdl"; |
|
5 |
import idl "../../../metadataextraction/Affiliation.avdl"; |
|
6 |
|
|
7 |
record ExtractedDocumentMetadata { |
|
8 |
// OpenAIRE identifier of the document |
|
9 |
string id; |
|
10 |
// alternative identifier (e.g. pubmed identifier) |
|
11 |
union { null , map<string> } externalIdentifiers = null; |
|
12 |
// pubmed entity type |
|
13 |
string entityType; |
|
14 |
// name of journal in which the article is published |
|
15 |
union { null , string } journal = null; |
|
16 |
// references extracted from XML document |
|
17 |
union { null , array<ReferenceMetadata> } references = null; |
|
18 |
|
|
19 |
// affiliations extracted from XML document |
|
20 |
union { null , array<eu.dnetlib.iis.metadataextraction.schemas.Affiliation> } affiliations = null; |
|
21 |
|
|
22 |
// page range in which the article is published |
|
23 |
union { null , Range } pages = null; |
|
24 |
} |
|
25 |
|
|
26 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/documentssimilarity_with_fulltext/DocumentMetadata.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.documentssimilarity_with_fulltext.schemas") |
|
2 |
protocol IIS{ |
|
3 |
import idl "../importer/Person.avdl"; |
|
4 |
|
|
5 |
record DocumentMetadata { |
|
6 |
string id; |
|
7 |
union { null , string } title = null; |
|
8 |
union { null , string } abstract = null; |
|
9 |
// document fulltext |
|
10 |
// warning: may be raw, non-normalised text, |
|
11 |
// i.e. may contain non-alphanumeric characters, page numbers, etc. |
|
12 |
union { null , string } text = null; |
|
13 |
union { null , array<string> } keywords = null; |
|
14 |
union { null , array<eu.dnetlib.iis.importer.schemas.Person> } authors = null; |
|
15 |
} |
|
16 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/documentssimilarity_with_fulltext/DocumentSimilarity.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.documentssimilarity_with_fulltext.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record DocumentSimilarity { |
|
5 |
// document identifier |
|
6 |
// foreign key: Document.id ("updated document" data store) |
|
7 |
string documentId; |
|
8 |
// identifier of a similar document, |
|
9 |
// foreign key: Document.id ("updated document" data store) |
|
10 |
string otherDocumentId; |
|
11 |
// level of similarity: coefficient from [0, 1] range, |
|
12 |
// the greater the number, the more similar the documents |
|
13 |
union { null , float } similarity = null; |
|
14 |
} |
|
15 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/statistics/DocumentToDocumentStatistics.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.statistics.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "CommonBasicCitationStatistics.avdl"; |
|
5 |
|
|
6 |
record DocumentToDocumentStatistics { |
|
7 |
// ID of the document, foreign key: Document.id ("document" data store) |
|
8 |
string documentId; |
|
9 |
|
|
10 |
CommonBasicCitationStatistics statistics; |
|
11 |
} |
|
12 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/statistics/ExtendedStatistics.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.statistics.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "BasicCitationStatistics.avdl"; |
|
5 |
|
|
6 |
// extended statistics for a group of documents; |
|
7 |
// for example documents of a given author, |
|
8 |
// documents of a given project or all documents in the system |
|
9 |
record ExtendedStatistics { |
|
10 |
|
|
11 |
BasicCitationStatistics basic; |
|
12 |
|
|
13 |
float averageNumberOfCitationsPerPaper; |
|
14 |
|
|
15 |
// keys: the thresholds X, i.e. 1, 10, 50, 100, 250, 500 |
|
16 |
map<int> numberOfPapersCitedAtLeastXTimes; |
|
17 |
|
|
18 |
} |
|
19 |
|
|
20 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/statistics/ProjectToProjectStatistics.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.statistics.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "CommonCoreStatistics.avdl"; |
|
5 |
|
|
6 |
record ProjectToProjectStatistics { |
|
7 |
// ID of the project, foreign key: Project.id ("project" data store) |
|
8 |
string projectId; |
|
9 |
|
|
10 |
CommonCoreStatistics statistics; |
|
11 |
} |
|
12 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/statistics/CommonCoreStatistics.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.statistics.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "CoreStatistics.avdl"; |
|
5 |
|
|
6 |
// core statistics of two kinds: |
|
7 |
// - counted for all papers in the group |
|
8 |
// - counted only for published papers |
|
9 |
record CommonCoreStatistics { |
|
10 |
|
|
11 |
// core statistics for all papers |
|
12 |
CoreStatistics allPapers; |
|
13 |
|
|
14 |
// core statistics for published papers |
|
15 |
CoreStatistics publishedPapers; |
|
16 |
|
|
17 |
} |
|
18 |
|
|
19 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/statistics/AuthorStatistics.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.statistics.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "CommonCoreStatistics.avdl"; |
|
5 |
|
|
6 |
record CoAuthor { |
|
7 |
string id; |
|
8 |
int coauthoredPapersCount; |
|
9 |
} |
|
10 |
|
|
11 |
record AuthorStatistics { |
|
12 |
|
|
13 |
CommonCoreStatistics core; |
|
14 |
|
|
15 |
array<CoAuthor> coAuthors; |
|
16 |
} |
|
17 |
|
|
18 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/statistics/CommonBasicCitationStatistics.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.statistics.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "BasicCitationStatistics.avdl"; |
|
5 |
|
|
6 |
// basic statistics of two kinds: |
|
7 |
// - counted for all incoming citations |
|
8 |
// - counted only for citations coming from published papers |
|
9 |
record CommonBasicCitationStatistics { |
|
10 |
|
|
11 |
// basic statistics containing |
|
12 |
// counts of citations FROM all papers |
|
13 |
BasicCitationStatistics citationsFromAllPapers; |
|
14 |
|
|
15 |
// basic statistics containing |
|
16 |
// counts of citations FROM published papers |
|
17 |
BasicCitationStatistics citationsFromPublishedPapers; |
|
18 |
|
|
19 |
} |
|
20 |
|
|
21 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/statistics/DocumentWithAuthorsAndCitations.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.statistics.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record DocumentWithAuthorsAndCitations { |
|
5 |
string documentId; |
|
6 |
|
|
7 |
boolean isPublished; |
|
8 |
|
|
9 |
string year; |
|
10 |
|
|
11 |
array<string> authorIds; |
|
12 |
|
|
13 |
array<string> referencedDocumentsIds; |
|
14 |
|
|
15 |
array<string> projectIds; |
|
16 |
} |
|
17 |
} |
|
18 |
|
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/statistics/AuthorToAuthorStatistics.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.statistics.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "AuthorStatistics.avdl"; |
|
5 |
|
|
6 |
record AuthorToAuthorStatistics { |
|
7 |
// ID of the author, foreign key: Person.id ("person" data store) |
|
8 |
string authorId; |
|
9 |
|
|
10 |
AuthorStatistics statistics; |
|
11 |
} |
|
12 |
|
|
13 |
} |
|
14 |
|
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/statistics/CoreStatistics.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.statistics.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "ExtendedStatistics.avdl"; |
|
5 |
|
|
6 |
// core statistics for a group of documents; |
|
7 |
// for example documents of a given author, |
|
8 |
// documents of a given project or all documents in the system |
|
9 |
record CoreStatistics { |
|
10 |
|
|
11 |
int numberOfPapers; |
|
12 |
|
|
13 |
// extended statistics containing |
|
14 |
// counts of citations FROM all papers |
|
15 |
ExtendedStatistics citationsFromAllPapers; |
|
16 |
|
|
17 |
// extended statistics containing |
|
18 |
// counts of citations FROM published papers |
|
19 |
ExtendedStatistics citationsFromPublishedPapers; |
|
20 |
|
|
21 |
} |
|
22 |
|
|
23 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/statistics/PersonId.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.statistics.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record PersonId { |
|
5 |
string id; |
|
6 |
} |
|
7 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/statistics/ProjectId.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.statistics.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record ProjectId { |
|
5 |
string id; |
|
6 |
} |
|
7 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/statistics/BasicCitationStatistics.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.statistics.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
// statistics containing total citation counts |
|
5 |
// suitable for a single document, person, project or global |
|
6 |
record BasicCitationStatistics { |
|
7 |
|
|
8 |
int numberOfCitations; |
|
9 |
|
|
10 |
// keys: years |
|
11 |
map<int> numberOfCitationsPerYear; |
|
12 |
|
|
13 |
} |
|
14 |
|
|
15 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/referenceextraction/researchinitiative/DocumentToConceptId.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.referenceextraction.researchinitiative.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record DocumentToConceptId { |
|
5 |
// document ID, foreign key: DocumentText.id |
|
6 |
string documentId; |
|
7 |
string conceptId; |
|
8 |
// Find more details on `confidenceLevel` constraints in eu/dnetlib/iis/README.markdown file. |
|
9 |
union { null , float } confidenceLevel = null; |
|
10 |
} |
|
11 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/referenceextraction/dataset/DocumentToDataSet.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.referenceextraction.dataset.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record DocumentToDataSet { |
|
5 |
// document ID, foreign key: DocumentText.id |
|
6 |
string documentId; |
|
7 |
// dataset ID, foreign key: DataSetReference.id |
|
8 |
string datasetId; |
|
9 |
// Find more details on `confidenceLevel` constraints in eu/dnetlib/iis/README.markdown file. |
|
10 |
union { null , float } confidenceLevel = null; |
|
11 |
} |
|
12 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/referenceextraction/project/DocumentToProject.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.referenceextraction.project.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record DocumentToProject { |
|
5 |
// document identifier, foreign key: DocumentWithBasicMetadata.id ("document basic metadata" data store) |
|
6 |
string documentId; |
|
7 |
// identifier of the project that is the funding source of this document, |
|
8 |
// foreign key: Project.id |
|
9 |
string projectId; |
|
10 |
// Find more details on `confidenceLevel` constraints in eu/dnetlib/iis/README.markdown file. |
|
11 |
union { null , float } confidenceLevel = null; |
|
12 |
} |
|
13 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/importer/Concept.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.importer.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record Concept { |
|
5 |
string id; |
|
6 |
string label; |
|
7 |
map<string> params; |
|
8 |
} |
|
9 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/importer/DocumentRelation.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.importer.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record DocumentRelation { |
|
5 |
// document identifier |
|
6 |
// foreign key: DocumentMetadata.id ("raw document metadata" data store) |
|
7 |
string id; |
|
8 |
// document or dataset ids linked with 'resultResult' relation |
|
9 |
array<string> referencedIds; |
|
10 |
} |
|
11 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/importer/DocumentMetadata.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.importer.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record PublicationType { |
|
5 |
boolean article = false; |
|
6 |
boolean dataset = false; |
|
7 |
} |
|
8 |
|
|
9 |
record DocumentMetadata { |
|
10 |
// document identifier |
|
11 |
string id; |
|
12 |
|
|
13 |
// moved from DocumentBasicMetadata |
|
14 |
// title |
|
15 |
union { null , string } title = null; |
|
16 |
// abstract or description |
|
17 |
union { null , string } abstract = null; |
|
18 |
union { null , string } language = null; |
|
19 |
// list of keywords (free form) |
|
20 |
union { null , array<string> } keywords = null; |
|
21 |
// alternative identifiers (e.g. publisher's internal identifiers) |
|
22 |
union { null , map<string> } externalIdentifiers = null; |
|
23 |
// name of journal in which the article is published |
|
24 |
union { null , string } journal = null; |
|
25 |
// year of publication |
|
26 |
union { null , int } year = null; |
|
27 |
// publisher name |
|
28 |
union { null , string } publisher = null; |
|
29 |
// end of: moved from DocumentBasicMetadata |
|
30 |
// publication type |
|
31 |
PublicationType publicationType; |
|
32 |
|
|
33 |
// foreign key: Person.id ("raw person" data store) |
|
34 |
union { null , array<string> } authorIds = null; |
|
35 |
|
|
36 |
// identifiers of the datasources the given document originates from |
|
37 |
union { null , array<string> } datasourceIds = null; |
|
38 |
|
|
39 |
} |
|
40 |
|
|
41 |
} |
|
42 |
|
|
43 |
|
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/importer/DocumentToMDStore.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.importer.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record DocumentToMDStore { |
|
5 |
// document identifier, foreign key: DocumentMetadata.id ("document metadata" data store) |
|
6 |
string documentId; |
|
7 |
// identifier of the mdstore holding the document identified by documentId |
|
8 |
string mdStoreId; |
|
9 |
} |
|
10 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/importer/WebsiteUserAction.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.importer.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
enum ActionType { |
|
5 |
CLICK, MODIFY |
|
6 |
} |
|
7 |
|
|
8 |
record WebsiteUserAction { |
|
9 |
// ID of the action |
|
10 |
int id; |
|
11 |
// type of action performed |
|
12 |
ActionType actionType; |
|
13 |
// identifier of a user's session |
|
14 |
union { null , string } sessionKey = null; |
|
15 |
// identifier of the user performing the action |
|
16 |
union { null , string } userId = null; |
|
17 |
// IP address from which the action was performed |
|
18 |
union { null , string } ipAddress = null; |
|
19 |
union { null , int } timestamp = null; |
|
20 |
union { null , string } referrer = null; |
|
21 |
union { null , string } details = null; |
|
22 |
// some other properties to be specified by NKUA |
|
23 |
} |
|
24 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/importer/auxiliary/DocumentContentUrl.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.importer.auxiliary.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record DocumentContentUrl { |
|
5 |
// document identifier |
|
6 |
string id; |
|
7 |
string url; |
|
8 |
union { null , string } mimeType = null; |
|
9 |
union { null , string } contentChecksum = null; |
|
10 |
union { null , long } contentSizeKB = null; |
|
11 |
} |
|
12 |
|
|
13 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/importer/auxiliary/PersonDuplicate.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.importer.auxiliary.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
import idl "../Person.avdl"; |
|
5 |
|
|
6 |
record PersonDuplicate { |
|
7 |
// pointer to an appropriate representative object of |
|
8 |
// this duplicate in the "raw person" data store |
|
9 |
string representativeId; |
|
10 |
// Information about person held by the duplicate object. |
|
11 |
// The data.id identifier is unique among all IDs stored in |
|
12 |
// the "raw person" and "raw person duplicate" data stores. |
|
13 |
union { null , eu.dnetlib.iis.importer.schemas.Person } data = null; |
|
14 |
} |
|
15 |
} |
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/importer/DataSetReference.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.importer.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record DataSetReference { |
|
5 |
// a technical ID of a data set reference (primary key) |
|
6 |
string id; |
|
7 |
// type name of the referenced id, e.g. doi |
|
8 |
string referenceType; |
|
9 |
// Data set identifier. Its definition follows the convention of a given data set |
|
10 |
// reference type defined by "referenceType" |
|
11 |
string idForGivenType; |
|
12 |
// Note that the ("referenceType", "idForGivenType") pair unambiguously identifies a data |
|
13 |
// set; this is also true for the "id" field, i.e. ("referenceType", "idForGivenType") is |
|
14 |
// a candidate key; "id" is also a candidate key. |
|
15 |
|
|
16 |
// additional fields |
|
17 |
union { null , array<string> } creatorNames = null; |
|
18 |
union { null , array<string> } titles = null; |
|
19 |
union { null , string } description = null; |
|
20 |
union { null , string } publisher = null; |
|
21 |
union { null , string } publicationYear = null; |
|
22 |
union { null , array<string> } formats = null; |
|
23 |
union { null , string } resourceTypeClass = null; |
|
24 |
union { null , string } resourceTypeValue = null; |
|
25 |
} |
|
26 |
} |
|
27 |
|
modules/icm-iis-schemas/trunk/src/main/resources/eu/dnetlib/iis/importer/Person.avdl | ||
---|---|---|
1 |
@namespace("eu.dnetlib.iis.importer.schemas") |
|
2 |
protocol IIS{ |
|
3 |
|
|
4 |
record Person { |
|
5 |
// person identifier |
Also available in: Unified diff
introducing dnet45 version of IIS CDH4 legacy libs