/ - Diff - BIEN 3 - NCEAS Projects

« Previous | Next »

Revision 14540

Added by Aaron Marcuse-Kubitza over 10 years ago

lib/tnrs.py: Added an option (use_tnrs_export) to avoid using TNRS's TSV export feature, which currently returns incorrect selected matches (vegpath.org/issues/943). The non-export path has so far been implemented only up through the GWT/JSON decoding; after that step it raises NotImplementedError.

     # TNRS
     import json
     import os.path
     import re
     import sys
-...
                 +response)
         return match.groups()
     def single_tnrs_request(names, debug=False, cumulative_profiler=None):
     def single_tnrs_request(names, debug=False, cumulative_profiler=None,
         use_tnrs_export=True):
         '''
         Note that names containing only whitespace characters (after gwt_encode())
         are ignored by TNRS and do not receive a response row. Thus, you should
         always match up the Name_submitted returned by TNRS with the actual
         submitted name to determine the corresponding TNRS response row.
         @param use_tnrs_export whether to use TNRS's TSV export feature, which
             currently returns incorrect selected matches (vegpath.org/issues/943)
         '''
         name_ct = len(names)
         assert name_ct <= max_names
-...
             # lengths depending on the taxonomic ranks present in the provided taxon
             # name. the extra download step is therefore necessary.
             debug_log('Prepare download')
             request = download_request_template.replace('[key]', key_enc)
             response, response_info = do_request(request)
             csv_url, = parse_response('download', download_response_pattern,
                 response, response, response_info)
             csv_url += download_url_suffix
             debug_log('csv_url', csv_url)
             debug_log('Download')
             request_obj = urllib2.Request(csv_url)
             debug_log('request URL', str(csv_url))
             debug_log('request info', str(request_obj.header_items()))
             debug_log('request str', str(request_obj.get_data()))
             response = urllib2.urlopen(request_obj)
             response_info = str(response.info())
             debug_log('response info', response_info)
             return TnrsOutputStream(response)
             if use_tnrs_export:
                 debug_log('Prepare download')
                 request = download_request_template.replace('[key]', key_enc)
                 response, response_info = do_request(request)
                 csv_url, = parse_response('download', download_response_pattern,
                     response, response, response_info)
                 csv_url += download_url_suffix
                 debug_log('csv_url', csv_url)
                 debug_log('Download')
                 request_obj = urllib2.Request(csv_url)
                 debug_log('request URL', str(csv_url))
                 debug_log('request info', str(request_obj.header_items()))
                 debug_log('request str', str(request_obj.get_data()))
                 response = urllib2.urlopen(request_obj)
                 response_info = str(response.info())
                 debug_log('response info', response_info)
                 return TnrsOutputStream(response)
             else:
                 debug_log('Expand')
                 request = ('7|0|6|http://tnrs.iplantcollaborative.org/tnrsdemo/|\
 E87C78041CEFBF0992F46BDF84D7D60|org.iplantc.tnrs.demo.client.SearchService|\
     requestGroupMembers|java.lang.String/2004016611|{"group":"0", \
     "email":"tnrs@lka5jjs.orv", "key":"[key]", "source_sorting":"false", \
     "taxonomic_constraint":"false"}|1|2|3|4|1|5|6|'.replace('[key]', key_enc))
                 response, response_info = do_request(request)
                 data_gwt, = parse_response('expand', r'^//OK\[1,\["(.*)"\],0,7\]$',
                     response, response, response_info)
                 data_json = json.loads(gwt_decode(data_gwt))
                 raise NotImplementedError()
         finally:
             profiler.stop(name_ct)
             sys.stderr.write(profiler.msg()+'\n')

Also available in: Unified diff

Project

General

Profile

Revision 14540

Added by Aaron Marcuse-Kubitza over 10 years ago