/modules/dli-service-portal/trunk/eu/dnetlib/es_connector.py - Diff - D-Net - D-Net project tracking tool

« Previous | Next »

Revision 50035

Added by Sandro La Bruzzo over 6 years ago

made a new look

     from os import path
     def get_property():
     # Lookup table from a lowercase identifier type to a URL template.
     # Every template contains exactly one "%s" placeholder; resolveIdentifier
     # looks up pid_type.lower() here and fills the placeholder with the pid.
     # NOTE(review): the entries from "genbank" through "sra" all share the
     # same nucest/genbank template -- confirm this is intended for the types
     # that are not GenBank.
     pid_resolver = {
         "pdb": "http://www.rcsb.org/pdb/explore/explore.do?structureId=%s",
         "ncbi-n": "http://www.ncbi.nlm.nih.gov/gquery/?term=%s",
         "pmid": "http://www.ncbi.nlm.nih.gov/pubmed/%s",
         "pmcid": "http://www.ncbi.nlm.nih.gov/pmc/articles/%s",
         "pubmedid": "http://www.ncbi.nlm.nih.gov/pubmed/%s",
         "doi": "http://dx.doi.org/%s",
         "genbank": "http://www.ncbi.nlm.nih.gov/nucest/%s?report=genbank",
         "nuccore": "http://www.ncbi.nlm.nih.gov/nucest/%s?report=genbank",
         "swiss-prot": "http://www.ncbi.nlm.nih.gov/nucest/%s?report=genbank",
         "arrayexpress": "http://www.ncbi.nlm.nih.gov/nucest/%s?report=genbank",
         "biomodels": "http://www.ncbi.nlm.nih.gov/nucest/%s?report=genbank",
         "bmrb": "http://www.ncbi.nlm.nih.gov/nucest/%s?report=genbank",
         "ena": "http://www.ncbi.nlm.nih.gov/nucest/%s?report=genbank",
         "geo": "http://www.ncbi.nlm.nih.gov/nucest/%s?report=genbank",
         "ensembl": "http://www.ncbi.nlm.nih.gov/nucest/%s?report=genbank",
         "mgi": "http://www.ncbi.nlm.nih.gov/nucest/%s?report=genbank",
         "bind": "http://www.ncbi.nlm.nih.gov/nucest/%s?report=genbank",
         "pride": "http://www.ncbi.nlm.nih.gov/nucest/%s?report=genbank",
         "ddbj": "http://www.ncbi.nlm.nih.gov/nucest/%s?report=genbank",
         "bioproject": "http://www.ncbi.nlm.nih.gov/nucest/%s?report=genbank",
         "embl": "http://www.ncbi.nlm.nih.gov/nucest/%s?report=genbank",
         "sra": "http://www.ncbi.nlm.nih.gov/nucest/%s?report=genbank",
+    }
     def resolveIdentifier(pid, pid_type):
         """Return a URL at which the identifier ``pid`` can be resolved.

         Resolution order:

         1. ``pid_type`` is ``None``: return the empty string.
         2. The lowercased ``pid_type`` is a key of ``pid_resolver``: return
            the matching template with ``pid`` substituted.
         3. The lowercased ``pid_type`` is ``'openaire'``: return the OpenAIRE
            publication search URL, with any ``'oai:dnet:'`` removed from
            ``pid``.
         4. Otherwise: fall back to an identifiers.org URL built from
            ``pid_type`` (original casing) and ``pid``.

         :param pid: the identifier value.
         :param pid_type: the identifier type, or ``None`` when unknown.
         :return: the resolved URL, or ``""`` when ``pid_type`` is ``None``.
         """
         # Identity check is the idiomatic (and safer) way to test for None.
         if pid_type is None:
             return ""

         # Normalise the type once instead of lowercasing it on every test.
         normalized_type = pid_type.lower()

         if normalized_type in pid_resolver:
             return pid_resolver[normalized_type] % pid

         if normalized_type == 'openaire':
             return "https://www.openaire.eu/search/publication?articleId=%s" % pid.replace('oai:dnet:', '')

         # The fallback deliberately keeps the caller's casing of pid_type.
         return "http://identifiers.org/%s:%s" % (pid_type, pid)
     def get_property():
         f = open(path.join(os.path.dirname(os.path.realpath(__file__)), '../../api.properties'))
         p = {}
         for line in f:
-...
             hits = []
             for index_result in response.hits:
                 hits.append(index_result.__dict__['_d_'])
                 input_source = index_result.__dict__['_d_']
                 fixed_titles = []
                 for ids in  input_source.get('localIdentifier',[]):
                     ds = resolveIdentifier(ids['id'], ids['type'])
                     ids['url'] = ds
                 for t in input_source.get('title',[]):
                     if len(t) > 0 and t[0] == '"' and t[-1] == '"':
                         fixed_titles.append(t[1:-1])
                     else:
                         fixed_titles.append(t)
                 input_source['title'] = fixed_titles
                 hits.append(input_source)
             pid_types = []
             for tag in response.aggs.all_pids.all_types.buckets:
                 pid_types.append(dict(key=tag.key, count=tag.doc_count))
-...
             return hits
         def fix_collectedFrom(self, source, relation):
             if relation is None:
                 return
             relSource = relation.get('source')
             collectedFrom = relSource['collectedFrom']
             for coll in collectedFrom:
-...
                 res = self.client.get(index=self.index_name, doc_type='object', id=id)
                 hits = []
                 input_source = res['_source']
                 fixed_titles = []
                 for t in input_source.get('title'):
                     if len(t) >0 and t[0]=='"' and t[-1]=='"':
                         fixed_titles.append(t[1:-1])
                     else:
                         fixed_titles.append(t)
                 input_source['title'] = fixed_titles
                 for ids in  input_source.get('localIdentifier',[]):
                     ds = resolveIdentifier(ids['id'], ids['type'])
                     ids['url'] = ds
                 related_publications = []
                 related_dataset = []
                 related_unknown = []
-...
                         related_publications = self.related_type(id, 'publication', start)
                     else:
                         related_publications = self.related_type(id, 'publication')
                     rel_source = related_publications[0]
                     if len(related_publications) >0 :
                         rel_source = related_publications[0]
                     else:
                         rel_source = {}
                 if input_source.get('relatedDatasets') > 0:
                     if 'dataset' == type:
                         related_dataset = self.related_type(id, 'dataset', start)

Also available in: Unified diff

Project

General

Profile

D-Net

Revision 50035

Added by Sandro La Bruzzo over 6 years ago