Project

General

Profile

1
{ 
2
	"wf" : { 
3
        "threshold" : "0.99", 
4
        "run" : "001", 
5
        "entityType" : "result", 
6
        "orderField" : "title", 
7
        "queueMaxSize" : "2000",
8
        "groupMaxSize" : "10",
9
        "slidingWindowSize" : "200",
10
        "rootBuilder" : [ "result" ],
11
        "includeChildren" : "true" 
12
    },
13
	"pace" : {		
14
		"clustering" : [
15
			{ "name" : "acronyms", "fields" : [ "title" ], "params" : { "max" : "1", "minLen" : "2", "maxLen" : "4"} },
16
			{ "name" : "ngrampairs", "fields" : [ "title" ], "params" : { "max" : "1", "ngramLen" : "3"} },
17
			{ "name" : "suffixprefix", "fields" : [ "title" ], "params" : { "max" : "1", "len" : "3" } } 
18
		],		
19
		"conditions" : [
20
  			{ "name" : "yearMatch", "fields" : [ "dateofacceptance" ] },
21
  			{ "name" : "titleVersionMatch", "fields" : [ "title" ] },
22
  			{ "name" : "sizeMatch", "fields" : [ "authors" ] } ,
23
				{ "name" : "pidMatch", "fields" : [ "pid" ] }
24
  		],		
25
		"model" : [
26
			{ "name" : "pid", "algo" : "Null", "type" : "JSON", "weight" : "0.0", "ignoreMissing" : "true", "path" : "pid", "overrideMatch" : "true" },
27
			{ "name" : "title", "algo" : "JaroWinkler", "type" : "String", "weight" : "1.0", "ignoreMissing" : "false", "path" : "publication/metadata/title[qualifier#classid = {main title}]/value" },
28
			{ "name" : "dateofacceptance", "algo" : "Null", "type" : "String", "weight" : "0.0", "ignoreMissing" : "true", "path" : "publication/metadata/dateofacceptance/value" } ,
29
			{ "name" : "authors", "algo" : "Null", "type" : "String", "weight" : "0.0", "ignoreMissing" : "true", "path" : "publication/author/metadata/fullname/value" }
30
		],
31
		"blacklists" : {
32
			"title" : [
33
				"^(Corpus Oral Dialectal \\(COD\\)\\.).*$",
34
				"^(Kiri Karl Morgensternile).*$",
35
				"^(\\[Eksliibris Aleksandr).*\\]$",
36
				"^(\\[Eksliibris Aleksandr).*$",
37
				"^(Eksliibris Aleksandr).*$",
38
				"^(Kiri A\\. de Vignolles).*$",
39
				"^(2 kirja Karl Morgensternile).*$",
40
				"^(Pirita kloostri idaosa arheoloogilised).*$",
41
				"^(Kiri tundmatule).*$",
42
				"^(Kiri Jenaer Allgemeine Literaturzeitung toimetusele).*$",
43
				"^(Eksliibris Nikolai Birukovile).*$",
44
				"^(Eksliibris Nikolai Issakovile).*$",
45
				"^(WHP Cruise Summary Information of section).*$",
46
				"^(Measurement of the top quark\\-pair production cross section with ATLAS in pp collisions at).*$",
47
				"^(Measurement of the spin\\-dependent structure function).*$"
48
			] } 		
49
	}
50

    
51
}
(4-4/7)