# Source code for bradata.tse.utils_tse

import os
import glob
import pandas as pd
import bradata.connection
from bradata.utils import  _unzip, _set_download_directory


def unzip_tse(result, current_path):
    """Write a zip payload to disk, extract it in place and delete the archive.

    Args:
        result: Content of the zip archive; it is written through a file
            opened in binary mode, so it is expected to be bytes.
        current_path: Directory that receives the extracted files. It is
            created when it does not exist yet.
    """
    if not os.path.exists(current_path):
        os.makedirs(current_path)

    # os.path.join adds the separator when current_path has no trailing one,
    # so the temporary archive always lands inside the target directory.
    zip_path = os.path.join(current_path, 'temp.zip')

    with open(zip_path, 'wb') as f:
        f.write(result)

    try:
        _unzip(zip_path, current_path)
    finally:
        # Do not leave the temporary archive behind when extraction fails.
        os.remove(zip_path)

def aggregate_tse(path, type, year):
    """Merge the per-file TSE text dumps of one year into a single CSV.

    Every file matching ``<path>/*_<year>_*.txt`` is read as a
    semicolon-separated, latin1-encoded table without a header row. Column
    names are taken from the matching column of ``headersTSE.csv``. The
    concatenated table is written to ``<path>/<type>/<type>_<year>.csv``.

    Args:
        path: Directory that holds the ``.txt`` files.
        type: Dataset kind. Only ``'candidatos'`` is handled.
        year: Year used in the file pattern, in the choice of header layout
            and in the output file name. Anything ``int()`` accepts works.

    Raises:
        ValueError: If ``type`` is not supported or no input file matches.
    """
    if type != 'candidatos':
        raise ValueError("Unsupported type: {!r}".format(type))

    files = sorted(glob.glob("{}/*_{}_*.txt".format(path, year)))
    print(files)
    if not files:
        raise ValueError(
            "No files matching '*_{}_*.txt' found in {}".format(year, path))

    # NOTE(review): the headers file is located relative to the current
    # working directory, so this only works when run from the project root.
    headers = pd.read_csv(os.getcwd() + '/bradata/tse/headersTSE.csv')

    # Three header layouts are known. Open-ended ranges make sure that every
    # year maps to one of them instead of leaving the name unassigned.
    year_number = int(year)
    if year_number >= 2014:
        header = 'CONSULTA_CAND_2014'
    elif year_number >= 2012:
        header = 'CONSULTA_CAND_2012'
    else:
        header = 'CONSULTA_CAND_2010'

    # The column list is the same for every file, so build it only once.
    columns = headers[header].dropna().tolist()

    full_df = pd.concat(
        [pd.read_csv(filename, sep=';', names=columns, encoding='latin1')
         for filename in files])

    # to_csv does not create missing directories.
    output_dir = '{}/{}'.format(path, type)
    if not os.path.exists(output_dir):
        os.makedirs(output_dir)

    full_df.to_csv('{}/{}_{}.csv'.format(output_dir, type, year))

def download_headers():
    """Request the headers gist and unzip the response.

    The content of a successful response is handed to ``unzip_tse`` together
    with the directory returned by ``_set_download_directory()``. When the
    request does not report status ``'ok'`` a message is printed and nothing
    is written to disk.
    """
    # NOTE(review): the URL points at the gist page itself; confirm that the
    # server really answers with a zip archive for this address.
    result = bradata.connection.Connection().perform_request(
        'https://gist.github.com/JoaoCarabetta/e2bf8437007efec84c3110cb93941850',
        binary=True)

    if result['status'] != 'ok':
        print('File was not dowloaded')
        # Stop here: there is no archive content to write and extract.
        return

    unzip_tse(result['content'], _set_download_directory())