Revision 53267
Added by Miriam Baglioni over 5 years ago
BulkTaggingMapper.java | ||
---|---|---|
1 | 1 |
package eu.dnetlib.data.mapreduce.hbase.bulktag; |
2 | 2 |
|
3 |
import com.google.common.base.Splitter; |
|
4 |
import com.google.common.collect.Lists; |
|
3 | 5 |
import eu.dnetlib.data.bulktag.CommunityConfiguration; |
4 | 6 |
import eu.dnetlib.data.bulktag.CommunityConfigurationFactory; |
5 | 7 |
import eu.dnetlib.data.proto.FieldTypeProtos; |
... | ... | |
36 | 38 |
System.out.println("conf = " + conf); |
37 | 39 |
cc = CommunityConfigurationFactory.fromJson(conf); |
38 | 40 |
tagger = new ResultTagger(); |
41 |
tagger.setTrust(context.getConfiguration().get("bulktagging.trust", "0.85")); |
|
39 | 42 |
} |
40 | 43 |
|
41 | 44 |
@Override |
... | ... | |
57 | 60 |
long tagged = oaf.getEntity().getResult().getMetadata().getContextList().stream() |
58 | 61 |
.flatMap(c -> c.getDataInfoList().stream()) |
59 | 62 |
.map(FieldTypeProtos.DataInfo::getInferenceprovenance) |
60 |
.filter(infProv -> "bulktagging::community".equals(infProv))
|
|
63 |
.filter(infProv -> "bulktagging".equals(infProv)) |
|
61 | 64 |
.count(); |
62 | 65 |
context.getCounter("Bulk Tagging", " bulktagged ").increment(tagged); |
63 | 66 |
|
Also available in: Unified diff
Modification to use trust as a parameter of the Hadoop job configuration, and a change in the provenance value.