-
-
Save edson-github/52f0c5b523eb29a72d52aa12f2b4faa8 to your computer and use it in GitHub Desktop.
Exemplo de código para acessar dados do Brasil.IO
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| import csv | |
| import gzip | |
| import io | |
| import json | |
| from urllib.parse import urlencode, urljoin | |
| from urllib.request import Request, urlopen | |
| class BrasilIO: | |
| base_url = "https://api.brasil.io/v1/" | |
| def __init__(self, auth_token): | |
| self.__auth_token = auth_token | |
| @property | |
| def headers(self): | |
| return { | |
| "User-Agent": "python-urllib/brasilio-client-0.1.0", | |
| } | |
| @property | |
| def api_headers(self): | |
| data = self.headers | |
| data.update({"Authorization": f"Token {self.__auth_token}"}) | |
| return data | |
| def api_request(self, path, query_string=None): | |
| url = urljoin(self.base_url, path) | |
| if query_string: | |
| url += "?" + urlencode(query_string) | |
| request = Request(url, headers=self.api_headers) | |
| response = urlopen(request) | |
| return json.load(response) | |
| def data(self, dataset_slug, table_name, filters=None): | |
| url = f"dataset/{dataset_slug}/{table_name}/data/" | |
| filters = filters or {} | |
| filters["page"] = 1 | |
| finished = False | |
| while not finished: | |
| response = self.request(url, filters) | |
| next_page = response.get("next", None) | |
| for row in response["results"]: | |
| yield row | |
| filters = {} | |
| url = next_page | |
| finished = next_page is None | |
| def download(self, dataset, table_name): | |
| url = f"https://data.brasil.io/dataset/{dataset}/{table_name}.csv.gz" | |
| request = Request(url, headers=self.headers) | |
| response = urlopen(request) | |
| return response | |
| if __name__ == "__main__": | |
| api = BrasilIO("meu-api-token") | |
| dataset_slug = "covid19" | |
| table_name = "caso_full" | |
| # Para baixar o arquivo completo: | |
| # Após fazer o download, você salvá-lo no disco ou percorrer o arquivo em | |
| # memória. Para salvá-lo no disco: | |
| response = api.download(dataset_slug, table_name) | |
| with open(f"{dataset_slug}_{table_name}.csv.gz", mode="wb") as fobj: | |
| fobj.write(response.read()) | |
| # TODO: o código acima pode ser melhorado de forma a não utilizar | |
| # `response.read()` para não colocar todo oarquivo em memória e sim fazer | |
| # streaming da resposta HTTP e salvar cada chunk diretamente no `fobj`. | |
| # Caso queira percorrer o CSV em memória: | |
| response = api.download(dataset_slug, table_name) | |
| fobj = io.TextIOWrapper(gzip.GzipFile(fileobj=response), encoding="utf-8") | |
| reader = csv.DictReader(fobj) | |
| for row in reader: | |
| pass # faça algo com `row` | |
| # Para navegar pela API: | |
| filters = {"state": "PR", "is_last": True} | |
| data = api.data(dataset_slug, table_name, filters) | |
| for row in data: | |
| pass # faça algo com `row` |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment