* Connector health: source hubspot, gitlab, snapchat-marketing: fix builds
* Add stream ShippingRates
* #2363 source mixpanel: reimplement backoff strategy
* #2363 source mixpanel: upd changelog
* #2363 source mixpanel: revert v0.1.32
* rework rate limits
* wait only when running CAT + increase timeouts
* #2363 return backoff time
* code format
* use env variable instead of a hidden field in the config
* review comments
* review fixes
* fix reading env var
* Resolve conflicts, Bump version
* Attempt to bump version to avoid caching
* split test config into two projects
* rollback version
* undo non related changes
* remove non related changes
* revert new line
* fix funnel slice patching
* fix funnel slice patching
* do not use stream state for generating request params!
* fix updating state
* Revert "do not use stream state for generating request params!"
This reverts commit 443781eaa9.
* revert prev commits
* fix timestamp filtering
---------
Co-authored-by: btkcodedev <btk.codedev@gmail.com>
Co-authored-by: Augustin <augustin@airbyte.io>
Co-authored-by: maxi297 <maxime@airbyte.io>
138 lines
6.0 KiB
Python
138 lines
6.0 KiB
Python
#
|
|
# Copyright (c) 2023 Airbyte, Inc., all rights reserved.
|
|
#
|
|
|
|
import base64
|
|
import json
|
|
import logging
|
|
import os
|
|
from typing import Any, List, Mapping, Tuple
|
|
|
|
import pendulum
|
|
import requests
|
|
from airbyte_cdk.logger import AirbyteLogger
|
|
from airbyte_cdk.sources import AbstractSource
|
|
from airbyte_cdk.sources.streams import Stream
|
|
from airbyte_cdk.sources.streams.http.auth import BasicHttpAuthenticator, TokenAuthenticator
|
|
|
|
from .streams import Annotations, CohortMembers, Cohorts, Engage, Export, Funnels, Revenue
|
|
from .testing import adapt_streams_if_testing, adapt_validate_if_testing
|
|
from .utils import read_full_refresh
|
|
|
|
|
|
class TokenAuthenticatorBase64(TokenAuthenticator):
    """Token authenticator that base64-encodes the given token and uses the ``Basic`` auth method."""

    def __init__(self, token: str):
        # Encode the UTF-8 bytes of the raw token, then hand the textual form to the parent class.
        encoded = base64.b64encode(token.encode("utf8"))
        super().__init__(token=encoded.decode("utf8"), auth_method="Basic")
|
|
|
|
|
|
class SourceMixpanel(AbstractSource):
    """Mixpanel source: builds the authenticator, normalises the config, checks the connection and creates streams."""

    # Stream classes probed by check_connection() and instantiated by streams(), in this order.
    STREAMS = [Cohorts, CohortMembers, Funnels, Revenue, Export, Annotations, Engage]

    def get_authenticator(self, config: Mapping[str, Any]) -> TokenAuthenticator:
        """
        Build the authenticator matching the credentials found in the config.

        :param config: connector config; may carry a "credentials" mapping or a top-level "api_secret"
        :return: a BasicHttpAuthenticator when both "username" and "secret" are present in "credentials",
            otherwise a TokenAuthenticatorBase64 built from "api_secret"
        :raises KeyError: if no "api_secret" is available for the token-based fallback
        """
        credentials = config.get("credentials")
        if credentials:
            username = credentials.get("username")
            secret = credentials.get("secret")
            if username and secret:
                return BasicHttpAuthenticator(username=username, password=secret)
            return TokenAuthenticatorBase64(token=credentials["api_secret"])
        # No "credentials" section: fall back to the top-level "api_secret" key.
        return TokenAuthenticatorBase64(token=config["api_secret"])

    @adapt_validate_if_testing
    def _validate_and_transform(self, config: Mapping[str, Any]):
        """
        Fill in defaults and convert raw config values into the objects the streams work with.

        The mapping is modified in place and also returned.

        :param config: the user-input config object
        :return: the same config with "project_timezone" as a pendulum timezone, "start_date"/"end_date" as dates
            and spec defaults applied for the optional settings
        :raises ValueError: if basic (username/secret) authentication is used without "project_id"
        """
        logger = logging.getLogger("airbyte")
        source_spec = self.spec(logger)
        default_project_timezone = source_spec.connectionSpecification["properties"]["project_timezone"]["default"]
        config["project_timezone"] = pendulum.timezone(config.get("project_timezone", default_project_timezone))

        # "today" is evaluated in the project timezone and drives both date defaults below.
        today = pendulum.today(tz=config["project_timezone"]).date()
        start_date = config.get("start_date")
        if start_date:
            config["start_date"] = pendulum.parse(start_date).date()
        else:
            # Default start date: 365 days before today.
            config["start_date"] = today.subtract(days=365)

        end_date = config.get("end_date")
        if end_date:
            config["end_date"] = pendulum.parse(end_date).date()
        else:
            config["end_date"] = today

        # Remaining optional settings take their defaults straight from the connector spec.
        for k in ["attribution_window", "select_properties_by_default", "region", "date_window_size"]:
            if k not in config:
                config[k] = source_spec.connectionSpecification["properties"][k]["default"]

        auth = self.get_authenticator(config)
        if isinstance(auth, TokenAuthenticatorBase64) and "project_id" in config:
            # "project_id" is dropped when the token-based authenticator is in use.
            config.pop("project_id")
        elif isinstance(auth, BasicHttpAuthenticator) and "project_id" not in config:
            raise ValueError("missing required parameter 'project_id'")

        return config

    def check_connection(self, logger: AirbyteLogger, config: Mapping[str, Any]) -> Tuple[bool, Any]:
        """
        Check whether the config can be used to read from the API.

        Every stream class in STREAMS is tried in turn until one can be read. A 402 response moves on to
        the next stream; any other failure ends the check immediately.

        :param logger: logger object
        :param config: the user-input config object conforming to the connector's spec.json
        :return Tuple[bool, Any]: (True, None) if the input config can be used to connect to the API successfully,
            (False, error) otherwise.
        """
        try:
            config = self._validate_and_transform(config)
            auth = self.get_authenticator(config)
        except Exception as e:
            return False, e

        # https://github.com/airbytehq/airbyte/pull/27252#discussion_r1228356872
        # temporary solution, testing access for all streams to avoid 402 error
        stream_kwargs = {"authenticator": auth, "reqs_per_hour_limit": 0, **config}
        reason = None
        for stream_class in self.STREAMS:
            try:
                stream = stream_class(**stream_kwargs)
                next(read_full_refresh(stream), None)
                return True, None
            except requests.HTTPError as e:
                try:
                    reason = e.response.json()["error"]
                except (ValueError, KeyError, TypeError):
                    # ValueError is the base of every JSON decoding error; KeyError/TypeError cover a JSON
                    # body without an "error" field. In all these cases report the raw response body.
                    reason = e.response.content
                if e.response.status_code != 402:
                    return False, reason
                # Reuse the reason extracted above instead of parsing the body again, which would
                # raise from inside this handler for a non-JSON response.
                logger.info(f"Stream {stream_class.__name__}: {reason}")
            except Exception as e:
                return False, str(e)
        # Every stream answered 402: report the last reason seen.
        return False, reason

    @adapt_streams_if_testing
    def streams(self, config: Mapping[str, Any]) -> List[Stream]:
        """
        Instantiate the streams that are available for this config.

        Each stream class is created with rate limiting disabled, then probed by loading its JSON schema
        and attempting a first read. Streams that answer 402 are skipped with a warning.

        :param config: A Mapping of the user input configuration as defined in the connector spec.
        :return: the list of streams whose probe succeeded
        :raises requests.HTTPError: if a probe fails with a status code other than 402
        """
        config = self._validate_and_transform(config)
        logger = logging.getLogger("airbyte")
        logger.info(f"Using start_date: {config['start_date']}, end_date: {config['end_date']}")

        auth = self.get_authenticator(config)
        stream_kwargs = {"authenticator": auth, "reqs_per_hour_limit": 0, **config}
        streams = []
        for stream_cls in self.STREAMS:
            stream = stream_cls(**stream_kwargs)
            try:
                stream.get_json_schema()
                next(read_full_refresh(stream), None)
            except requests.HTTPError as e:
                if e.response.status_code != 402:
                    raise
                logger.warning("Stream '%s' - is disabled, reason: 402 Payment Required", stream.name)
            else:
                # We preserve sleeping between requests in case this is not a running acceptance test.
                # Otherwise, we do not want to wait as each API call is followed by sleeping ~60 seconds.
                reqs_per_hour_limit = int(os.environ.get("REQS_PER_HOUR_LIMIT", stream.DEFAULT_REQS_PER_HOUR_LIMIT))
                stream.reqs_per_hour_limit = reqs_per_hour_limit
                streams.append(stream)
        return streams
|