51 lines
1.5 KiB
Python
51 lines
1.5 KiB
Python
|
from io import BytesIO
|
||
|
import os
|
||
|
|
||
|
import pytest
|
||
|
|
||
|
import pandas.util._test_decorators as td
|
||
|
|
||
|
from pandas import read_csv
|
||
|
import pandas._testing as tm
|
||
|
|
||
|
|
||
|
def test_streaming_s3_objects():
|
||
|
# GH17135
|
||
|
# botocore gained iteration support in 1.10.47, can now be used in read_*
|
||
|
pytest.importorskip("botocore", minversion="1.10.47")
|
||
|
from botocore.response import StreamingBody
|
||
|
|
||
|
data = [b"foo,bar,baz\n1,2,3\n4,5,6\n", b"just,the,header\n"]
|
||
|
for el in data:
|
||
|
body = StreamingBody(BytesIO(el), content_length=len(el))
|
||
|
read_csv(body)
|
||
|
|
||
|
|
||
|
@td.skip_if_no("s3fs")
|
||
|
@pytest.mark.network
|
||
|
@tm.network
|
||
|
def test_read_without_creds_from_pub_bucket():
|
||
|
# GH 34626
|
||
|
# Use Amazon Open Data Registry - https://registry.opendata.aws/gdelt
|
||
|
result = read_csv("s3://gdelt-open-data/events/1981.csv", nrows=3)
|
||
|
assert len(result) == 3
|
||
|
|
||
|
|
||
|
@td.skip_if_no("s3fs")
|
||
|
@pytest.mark.network
|
||
|
@tm.network
|
||
|
def test_read_with_creds_from_pub_bucket():
|
||
|
# Ensure we can read from a public bucket with credentials
|
||
|
# GH 34626
|
||
|
# Use Amazon Open Data Registry - https://registry.opendata.aws/gdelt
|
||
|
|
||
|
with tm.ensure_safe_environment_variables():
|
||
|
# temporary workaround as moto fails for botocore >= 1.11 otherwise,
|
||
|
# see https://github.com/spulec/moto/issues/1924 & 1952
|
||
|
os.environ.setdefault("AWS_ACCESS_KEY_ID", "foobar_key")
|
||
|
os.environ.setdefault("AWS_SECRET_ACCESS_KEY", "foobar_secret")
|
||
|
df = read_csv(
|
||
|
"s3://gdelt-open-data/events/1981.csv", nrows=5, sep="\t", header=None
|
||
|
)
|
||
|
assert len(df) == 5
|