diff --git a/coordinator/ProcessorSurveysnewODK2.py b/coordinator/ProcessorSurveysnewODK2.py index 8591c47b57c51f8ede47d8eee91feffec5915cc8..02533a361babc6bcd434d6de976652e95850698e 100644 --- a/coordinator/ProcessorSurveysnewODK2.py +++ b/coordinator/ProcessorSurveysnewODK2.py @@ -27,6 +27,27 @@ logger = logging.getLogger('Processor.Surveys.kobotoolbox') add_filters_to_sublogger(logger) +# Downloads of the ODK form reports country descriptions as two letter codes. +# The reason is unclear, as viewing online shows full country names. To be +# consistent across all form types, this function is available for translating +# two letter codes to full string names. +# Only some have these have been checked explicitly against downloaded surveys. +# Assuming the code is based on ISO 3166-1 alpha-2 +COUNTRY_ABBREVIATIONS_DICT = { + 'AF' : 'Afghanistan', + 'BD' : 'Bangladesh', + 'BT' : 'Bhutan', + 'ET' : 'Ethiopia', + 'IN' : 'India', + 'KE' : 'Kenya', + 'NP' : 'Nepal', + 'PK' : 'Pakistan', + 'TZ' : 'Tanzania', + 'UG' : 'Uganda', + 'ZM' : 'Zambia', + 'ZW' : 'Zimbabwe', + } + def get_newODK2_form_as_csv(form_credentials: dict, jobPath: str, config: dict, status): '''Given a dict with a single kobotoolbox form to download from a kobotoolbox server, obtains it and converts to csv.''' @@ -54,7 +75,7 @@ def get_newODK2_form_as_csv(form_credentials: dict, jobPath: str, config: dict, #'phonenumber' : 'None', 'username' : 'username', 'surveyor_information/region' : 'None', - 'surveyor_information/country' : 'surveyor_infromation-country', + 'surveyor_information/country' : ('parse_cases',(('name_out','surveyor_infromation-country'),('cases', COUNTRY_ABBREVIATIONS_DICT))), 'surveyor_information/surveyor' : 'surveyor_infromation-surveyor_name', 'surveyor_information/institution' : 'surveyor_infromation-institution', 'survey_information/admin_level_1' : 'None',