Project

General

Profile

{
	"wf" : {
		"threshold" : "0.99",
		"run" : "001",
		"entityType" : "result",
		"orderField" : "title",
		"queueMaxSize" : "2000",
		"groupMaxSize" : "10",
		"slidingWindowSize" : "200",
		"rootBuilder" : [ "result" ],
		"includeChildren" : "true"
	},
	"pace" : {
		"clustering" : [
			{ "name" : "acronyms", "fields" : [ "title" ], "params" : { "max" : "1", "minLen" : "2", "maxLen" : "4"} },
			{ "name" : "ngrampairs", "fields" : [ "title" ], "params" : { "max" : "1", "ngramLen" : "3"} },
			{ "name" : "suffixprefix", "fields" : [ "title" ], "params" : { "max" : "1", "len" : "3" } }
		],
		"strictConditions" : [
			{ "name" : "doiExactMatch", "fields" : [ "pid" ] }
		],
		"conditions" : [
			{ "name" : "yearMatch", "fields" : [ "dateofacceptance" ] },
			{ "name" : "titleVersionMatch", "fields" : [ "title" ] },
			{ "name" : "sizeMatch", "fields" : [ "authors" ] }
		],
		"model" : [
			{ "name" : "pid", "algo" : "Null", "type" : "String", "weight" : "0.0", "ignoreMissing" : "true", "path" : "pid[qualifier#classid = {doi}]/value", "overrideMatch" : "true" },
			{ "name" : "title", "algo" : "JaroWinkler", "type" : "String", "weight" : "1.0", "ignoreMissing" : "false", "path" : "result/metadata/title[qualifier#classid = {main title}]/value" },
			{ "name" : "dateofacceptance", "algo" : "Null", "type" : "String", "weight" : "0.0", "ignoreMissing" : "true", "path" : "result/metadata/dateofacceptance/value" },
			{ "name" : "authors", "algo" : "Null", "type" : "String", "weight" : "0.0", "ignoreMissing" : "true", "path" : "result/author/metadata/fullname/value" }
		],
		"blacklists" : {
			"title" : [
				"^(Corpus Oral Dialectal \\(COD\\)\\.).*$",
				"^(Kiri Karl Morgensternile).*$",
				"^(\\[Eksliibris Aleksandr).*\\]$",
				"^(\\[Eksliibris Aleksandr).*$",
				"^(Eksliibris Aleksandr).*$",
				"^(Kiri A\\. de Vignolles).*$",
				"^(2 kirja Karl Morgensternile).*$",
				"^(Pirita kloostri idaosa arheoloogilised).*$",
				"^(Kiri tundmatule).*$",
				"^(Kiri Jenaer Allgemeine Literaturzeitung toimetusele).*$",
				"^(Eksliibris Nikolai Birukovile).*$",
				"^(Eksliibris Nikolai Issakovile).*$",
				"^(WHP Cruise Summary Information of section).*$",
				"^(Measurement of the top quark\\-pair production cross section with ATLAS in pp collisions at).*$",
				"^(Measurement of the spin\\-dependent structure function).*"
			]
		}
	}
}
(4-4/7)