forked from mozilla/bigquery-etl
-
Notifications
You must be signed in to change notification settings - Fork 0
/
conftest.py
105 lines (75 loc) · 2.59 KB
/
conftest.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
"""PyTest configuration."""
import os
import random
import string
import subprocess
from pathlib import Path
import pytest
from google.cloud import bigquery, storage
TEST_BUCKET = "bigquery-etl-integration-test-bucket"
pytest_plugins = [
"bigquery_etl.pytest_plugin.sql",
"bigquery_etl.pytest_plugin.routine",
"bigquery_etl.pytest_plugin.script_lint.black",
"bigquery_etl.pytest_plugin.script_lint.docstyle",
"bigquery_etl.pytest_plugin.script_lint.flake8",
"bigquery_etl.pytest_plugin.script_lint.mypy",
]
def pytest_collection_modifyitems(config, items):
    """Skip integration tests unless a test selection was given.

    If the run was started with a keyword or marker expression (pytest's
    ``-k`` / ``-m`` options), the collected items are left untouched.
    Otherwise every item that carries the ``integration`` keyword receives a
    skip marker.
    """
    options = config.option
    selection = (options.keyword, options.markexpr)
    if any(selection):
        # An explicit selection was made; leave the collected items alone.
        return

    skip_marker = pytest.mark.skip(reason="integration marker not selected")
    integration_items = (item for item in items if "integration" in item.keywords)
    for item in integration_items:
        item.add_marker(skip_marker)
@pytest.fixture
def project_id():
    """Return the BigQuery project ID read from the environment.

    The ``GOOGLE_PROJECT_ID`` environment variable needs to be set for
    integration tests to run; a ``KeyError`` is raised when it is missing.
    """
    return os.environ["GOOGLE_PROJECT_ID"]
@pytest.fixture
def bigquery_client():
    """Return a BigQuery client for the project in ``GOOGLE_PROJECT_ID``.

    A ``KeyError`` is raised when the environment variable is not set.
    """
    return bigquery.Client(os.environ["GOOGLE_PROJECT_ID"])
@pytest.fixture
def temporary_dataset():
    """Create a randomly named BigQuery dataset and delete it afterwards.

    Yields the dataset name: ``test_`` followed by 12 random lowercase ASCII
    letters. The random name avoids conflicts when tests run in parallel.
    The project is taken from the ``GOOGLE_PROJECT_ID`` environment variable.
    """
    suffix = "".join(random.choice(string.ascii_lowercase) for _ in range(12))
    dataset_name = "test_" + suffix

    bq_client = bigquery.Client(os.environ["GOOGLE_PROJECT_ID"])
    bq_client.create_dataset(dataset_name)

    yield dataset_name

    # Teardown: drop the dataset together with its contents; a dataset that
    # is already gone is not treated as an error.
    bq_client.delete_dataset(dataset_name, delete_contents=True, not_found_ok=True)
@pytest.fixture
def test_bucket():
    """Yield a bucket object for the bucket named by ``TEST_BUCKET``."""
    yield storage.Client().bucket(TEST_BUCKET)
@pytest.fixture
def temporary_gcs_folder():
    """Yield a random folder prefix and clean it up in the GCS test bucket.

    The prefix has the form ``test_<12 random lowercase letters>/``. Nothing
    is created before the test runs; afterwards every blob listed under that
    prefix in ``TEST_BUCKET`` is deleted.
    """
    suffix = "".join(random.choice(string.ascii_lowercase) for _ in range(12))
    folder_prefix = f"test_{suffix}/"

    yield folder_prefix

    # Teardown: delete whatever was stored under the prefix during the test.
    gcs_bucket = storage.Client().bucket(TEST_BUCKET)
    for leftover_blob in gcs_bucket.list_blobs(prefix=folder_prefix):
        leftover_blob.delete()
@pytest.fixture
def storage_client():
    """Yield a newly created Cloud Storage client."""
    gcs_client = storage.Client()
    yield gcs_client