12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976 |
import gzip
import json
import logging
import shutil
import time
from pathlib import Path
from typing import Iterable, Iterator, List, Literal, Optional
from urllib.parse import urljoin

import requests
import s3fs
from cachetools import TTLCache
from requests.adapters import HTTPAdapter
from s3fs import S3FileSystem
from urllib3.util.retry import Retry
# Login with Amazon (LWA) token endpoint; a refresh token is exchanged here
# for a short-lived access token.
URL_AUTH = "https://api.amazon.com/auth/o2/token"
# Base URL that every Advertising API path is joined onto.
URL_AD_API = "https://advertising-api.amazon.com"
# Process-wide access-token cache, keyed by refresh token.
# NOTE(review): ttl=3200 is presumably seconds (cachetools' default timer) and
# chosen to expire before the access token does - confirm.
cache = TTLCache(maxsize=10, ttl=3200)
logger = logging.getLogger(__name__)
class RateLimitError(Exception):
    """Raised when the Advertising API answers a request with HTTP 429.

    Attributes:
        retry_after: Raw value of the ``Retry-After`` response header, or
            ``None`` when the server did not send one.
    """

    def __init__(self, retry_after: Optional[str] = None):
        # Give the exception a real message so logs and tracebacks are
        # informative regardless of how the argument was passed.
        message = "rate limit exceeded"
        if retry_after is not None:
            message = f"{message}; retry after {retry_after}"
        super().__init__(message)
        self.retry_after = retry_after
def gz_decompress(file_path: str, chunk_size: int = 1024 * 1024):
    """Decompress a gzip file to a sibling file and return the new path.

    Args:
        file_path: Path of the gzip-compressed input file.
        chunk_size: Number of bytes copied per read.

    Returns:
        The path of the decompressed file. For an input ending in ``.gz``
        this is the input path without that suffix; otherwise
        ``.decompressed`` is appended so the input is never overwritten.
    """
    suffix = ".gz"
    # str.rstrip(".gz") strips *characters*, not a suffix ("log.gz" -> "lo"),
    # so the suffix is removed explicitly.
    if file_path.endswith(suffix) and len(file_path) > len(suffix):
        decompressed_file = file_path[:-len(suffix)]
    else:
        decompressed_file = file_path + ".decompressed"
    # Both handles are closed even if the copy fails part-way.
    with gzip.open(file_path, mode="rb") as src, open(decompressed_file, "wb") as dst:
        shutil.copyfileobj(src, dst, chunk_size)
    return decompressed_file
class BaseClient:
    """Shared HTTP plumbing for the Amazon Advertising API clients.

    Holds the Login with Amazon (LWA) credentials, a ``requests`` session
    with automatic retries, and the helpers that build auth headers and
    send requests relative to ``URL_AD_API``.
    """

    def __init__(
        self, lwa_client_id: str, lwa_client_secret: str, refresh_token: str = None, profile_id: str = None,
        data_path: str = "./"
    ):
        """Store credentials, create ``data_path`` and set up the session.

        Args:
            lwa_client_id: LWA application client id.
            lwa_client_secret: LWA application client secret.
            refresh_token: LWA refresh token used to obtain access tokens.
            profile_id: Advertising profile sent as the API scope header.
            data_path: Local directory; created if it does not exist.
        """
        self.lwa_client_id = lwa_client_id
        self.lwa_client_secret = lwa_client_secret
        self.refresh_token = refresh_token
        self.profile_id = profile_id
        self.data_path = Path(data_path)
        if not self.data_path.exists():
            # exist_ok closes the race with another process creating it.
            self.data_path.mkdir(parents=True, exist_ok=True)
        retry_strategy = Retry(
            total=5,  # number of retries
            allowed_methods=["GET", "POST"],
            # Status codes that force a retry; only requests whose method
            # is listed in allowed_methods are retried.
            status_forcelist=[429, 500, 502, 503, 504],
            # Do not raise once retries for a status_forcelist code are
            # exhausted; the last response is returned instead.
            raise_on_status=False,
            # Exponential back-off between attempts.
            backoff_factor=2,
        )
        adapter = HTTPAdapter(max_retries=retry_strategy)
        self.session = requests.session()
        self.session.mount("https://", adapter)

    @property
    def access_token(self) -> str:
        """Return a cached access token, fetching a new one when needed.

        Raises:
            Exception: If the token endpoint does not answer with HTTP 200;
                the message is the response body.
        """
        cached = cache.get(self.refresh_token)
        if cached is not None:
            return cached
        resp = requests.post(URL_AUTH, data={
            "grant_type": "refresh_token",
            "client_id": self.lwa_client_id,
            "refresh_token": self.refresh_token,
            "client_secret": self.lwa_client_secret,
        })
        if resp.status_code != 200:
            raise Exception(resp.text)
        js = resp.json()
        token = js["access_token"]
        # Adopt a rotated refresh token first, then cache under the token
        # that the next lookup will actually use. Keep the current one if
        # the response carries none.
        self.refresh_token = js.get("refresh_token") or self.refresh_token
        cache[self.refresh_token] = token
        return token

    @property
    def auth_headers(self):
        """Return the client-id, scope and bearer-token request headers."""
        return {
            "Amazon-Advertising-API-ClientId": self.lwa_client_id,
            "Amazon-Advertising-API-Scope": self.profile_id,
            "Authorization": f"Bearer {self.access_token}",
        }

    def _request(self, url_path: str, method: str = "GET", headers: dict = None, params: dict = None,
                 body: dict = None):
        """Send an authenticated request and return the decoded JSON body.

        Args:
            url_path: Path joined onto ``URL_AD_API``.
            method: HTTP method.
            headers: Extra headers; they override the auth headers on clash.
            params: Query-string parameters.
            body: Payload sent as JSON.

        Raises:
            RateLimitError: On HTTP 429 (after the session's own retries).
            Exception: On any other status >= 400; the message is the
                response body.
        """
        head = self.auth_headers
        if headers:
            head.update(headers)
        resp = self.session.request(
            method=method,
            url=urljoin(URL_AD_API, url_path),
            headers=head,
            params=params,
            json=body,
        )
        if resp.status_code == 429:
            raise RateLimitError(resp.headers.get("Retry-After"))
        if resp.status_code >= 400:
            raise Exception(resp.text)
        return resp.json()

    def get_profilesInfo(self):
        """Return the response of ``GET /v2/profiles``."""
        url_path = "/v2/profiles"
        return self._request(url_path)
class SPClient(BaseClient):
    """Sponsored Products (SP) endpoints of the Amazon Advertising API.

    All calls go through ``self._request``. Finished reports are streamed
    to S3 and, by default, read back and parsed as gzip-compressed JSON.
    """

    # Report states treated as terminal errors. The code originally tested
    # only "FAILURE"; "FAILED" is accepted too so a failed v3 report raises
    # instead of falling through to a download without a URL.
    _FAILED_STATES = ("FAILURE", "FAILED")

    def _post_typed(self, url_path, media_type, body):
        """POST ``body`` using ``media_type`` for both Accept and Content-Type."""
        headers = {"Accept": media_type, "Content-Type": media_type}
        return self._request(url_path, method="POST", headers=headers, body=body)

    def _iter_pages(self, fetch, items_key, body):
        """Yield items from every page of a ``nextToken``-paginated list call."""
        body.setdefault("maxResults", 100)
        while True:
            info: dict = fetch(**body)
            yield from info[items_key]
            if not info.get("nextToken"):
                break
            body["nextToken"] = info["nextToken"]
        logger.info(f"总共数量:{info.get('totalResults')}")

    def get_campaigns(self, **body):
        """Return one page of ``POST /sp/campaigns/list``."""
        return self._post_typed("/sp/campaigns/list", "application/vnd.spcampaign.v3+json", body)

    def iter_campaigns(self, **body) -> Iterator[dict]:
        """Yield every campaign, following ``nextToken`` (100 per page by default)."""
        return self._iter_pages(self.get_campaigns, "campaigns", body)

    def get_budgetrecommendation(self, campaign_ids):
        """Return budget recommendations for ``campaign_ids``."""
        return self._post_typed(
            "/sp/campaigns/budgetRecommendations",
            "application/vnd.budgetrecommendation.v3+json",
            {"campaignIds": campaign_ids},
        )

    def iter_budgetrecommendation(self, campaign_ids):
        """Yield successful budget recommendations, querying 100 ids per call."""
        for start in range(0, len(campaign_ids), 100):
            info: dict = self.get_budgetrecommendation(campaign_ids[start:start + 100])
            yield from info["budgetRecommendationsSuccessResults"]

    def get_ad_groups(self, **body):
        """Return one page of ``POST /sp/adGroups/list``."""
        return self._post_typed("/sp/adGroups/list", "application/vnd.spadGroup.v3+json", body)

    def iter_adGroups(self, **body) -> Iterator[dict]:
        """Yield every ad group, following ``nextToken``."""
        return self._iter_pages(self.get_ad_groups, "adGroups", body)

    def get_ads(self, **body):
        """Return one page of ``POST /sp/productAds/list``."""
        return self._post_typed("/sp/productAds/list", "application/vnd.spproductAd.v3+json", body)

    def iter_ads(self, **body) -> Iterator[dict]:
        """Yield every product ad, following ``nextToken``."""
        return self._iter_pages(self.get_ads, "productAds", body)

    def get_keywords(self, **body):
        """Return one page of ``POST /sp/keywords/list``."""
        return self._post_typed("/sp/keywords/list", "application/vnd.spKeyword.v3+json", body)

    def iter_keywords(self, **body) -> Iterator[dict]:
        """Yield every keyword, following ``nextToken``."""
        return self._iter_pages(self.get_keywords, "keywords", body)

    def get_targets(self, **body):
        """Return one page of ``POST /sp/targets/list``."""
        return self._post_typed("/sp/targets/list", "application/vnd.sptargetingClause.v3+json", body)

    def iter_targets(self, **body) -> Iterator[dict]:
        """Yield every targeting clause, following ``nextToken``."""
        return self._iter_pages(self.get_targets, "targetingClauses", body)

    def get_budget(self, campaign_ids: list):
        """Return budget usage for ``campaign_ids``."""
        return self._request("/sp/campaigns/budget/usage", method="POST", body={"campaignIds": campaign_ids})

    def get_adgroup_bidrecommendation(
            self, campaignId: str, adGroupId: str, targetingExpressions: list,
            recommendationType: str = "BIDS_FOR_EXISTING_AD_GROUP"):
        """Return theme-based bid recommendations for an ad group's targets."""
        body = {
            "campaignId": campaignId,
            "adGroupId": adGroupId,
            "recommendationType": recommendationType,
            "targetingExpressions": targetingExpressions
        }
        return self._post_typed(
            "/sp/targets/bid/recommendations",
            "application/vnd.spthemebasedbidrecommendation.v3+json",
            body,
        )

    def get_keyword_bidrecommendation(self, adGroupId: str, keyword: list, matchType: list):
        """Return v2 bid recommendations for keywords paired with match types.

        ``keyword`` and ``matchType`` are zipped position by position; extra
        entries in the longer list are ignored.
        """
        keywords = [{"keyword": kw, "matchType": mt} for kw, mt in zip(keyword, matchType)]
        body = {"adGroupId": adGroupId, "keywords": keywords}
        return self._request("/v2/sp/keywords/bidRecommendations", method="POST", body=body)

    def get_targets_bid_recommendations(self, campaignId: str = None,
                                        adGroupId: str = None,
                                        asins: list = None,
                                        bid: float = None,
                                        keyword: str = None,
                                        userSelectedKeyword: bool = False,
                                        matchType: Literal["BROAD", "EXACT", "PHRASE"] = "BROAD",
                                        recommendationType: Literal['KEYWORDS_FOR_ASINS', 'KEYWORDS_FOR_ADGROUP'] = "KEYWORDS_FOR_ASINS",
                                        sortDimension: Literal["CLICKS", "CONVERSIONS", "DEFAULT"] = "DEFAULT",
                                        locale: Literal["ar_EG", "de_DE", "en_AE", "en_AU", "en_CA", "en_GB", "en_IN", "en_SA", "en_SG", "en_US",
                                                        "es_ES", "es_MX", "fr_FR", "it_IT", "ja_JP", "nl_NL", "pl_PL", "pt_BR", "sv_SE", "tr_TR", "zh_CN"] = "en_US"):
        """Return keyword recommendations from ``/sp/targets/keywords/recommendations``.

        When ``adGroupId`` is given the request is scoped to that campaign
        and ad group; otherwise ``asins`` is sent instead.
        """
        body = {
            "recommendationType": recommendationType,
            "targets": [
                {
                    "matchType": matchType,
                    "keyword": keyword,
                    "bid": bid,
                    "userSelectedKeyword": userSelectedKeyword
                }
            ],
            "maxRecommendations": "200",
            "sortDimension": sortDimension,
            "locale": locale
        }
        if adGroupId is not None:
            body["campaignId"] = campaignId
            body["adGroupId"] = adGroupId
        else:
            body['asins'] = asins
        return self._request("/sp/targets/keywords/recommendations", method="POST", body=body)

    def _wait_for_report(self, ret):
        """Poll a v3 report until it leaves PROCESSING/PENDING; return the last status payload."""
        report_id = ret["reportId"]
        status = ret["status"]
        if status in self._FAILED_STATES:
            raise Exception(ret)
        logger.info(f"创建报告成功:{ret}")
        while status in ("PROCESSING", "PENDING"):
            logger.debug(f"报告{report_id}正在处理中...")
            time.sleep(4)
            try:
                ret = self._request(f"/reporting/reports/{report_id}")
            except Exception:
                # One slower second attempt; a second failure propagates.
                time.sleep(15)
                ret = self._request(f"/reporting/reports/{report_id}")
            logger.debug("%s", ret)
            status = ret["status"]
        if status in self._FAILED_STATES:
            raise Exception(ret)
        logger.info(f"报告处理完成:{ret}")
        return ret

    def get_v3_report(self,
                      groupby: list,
                      columns: list,
                      startDate: str,
                      endDate: str,
                      reportType: Literal['spCampaigns', 'spAdvertisedProduct', 'spPurchasedProduct', 'spTargeting', 'spSearchTerm'],
                      timeUnit="DAILY",
                      download=True):
        """Create a v3 SP report, wait for it and optionally download it.

        @param groupby: aggregation dimensions, [campaign,adGroup,
            searchTerm,purchasedAsin,campaignPlacement,targeting,searchTerm,advertiser,asin]
        @param columns: fields to fetch
        @param startDate: first day of the report
        @param endDate: last day of the report
        @param reportType: report type id
        @param timeUnit: time unit sent as ``timeUnit``
        @param download: when true, store the report on S3 and return the
            result of ``download_v3_report``; otherwise return the final
            status payload
        @raise Exception: if the report ends in a failed state
        """
        headers = {
            "Content-Type": "application/vnd.createasyncreportrequest.v3+json"
        }
        body = {
            "name": "SP campaigns report",
            "startDate": startDate,
            "endDate": endDate,
            "configuration": {
                "adProduct": "SPONSORED_PRODUCTS",
                "groupBy": groupby,
                "columns": columns,
                "reportTypeId": reportType,
                "timeUnit": timeUnit,
                "format": "GZIP_JSON"
            }
        }
        ret = self._request("/reporting/reports", method="POST", headers=headers, body=body)
        ret = self._wait_for_report(ret)
        if not download:
            return ret
        pid = self.profile_id
        # Kept so a failed download can re-request the same report.
        report_info = {'groupby': groupby,
                       'columns': columns,
                       'startDate': startDate,
                       'endDate': endDate,
                       'reportType': reportType,
                       'timeUnit': timeUnit,
                       'download': download}
        return self.download_v3_report(
            report_info, ret['url'],
            f"s3://reportforspsbsd/zosi/us/sp/{str(groupby)}_{startDate}_{endDate}_{reportType}_{str(pid)}.json.gz")

    def download_v3_report(self, report_info, url, file_path: str, decompress: bool = True):
        """Stream a finished report to S3 and optionally parse it.

        Args:
            report_info: Arguments of the originating ``get_v3_report`` call,
                used to request the report again if the download fails.
            url: Download URL from the report status payload.
            file_path: Destination ``s3://`` path.
            decompress: When false, return ``file_path`` after upload.

        Returns:
            ``file_path`` or the parsed JSON content. On a non-200/207
            download status, the result of a fresh ``get_v3_report`` call.
        """
        resp = requests.get(url, stream=True, allow_redirects=True)
        if resp.status_code not in (200, 207):
            logger.info(f"状态码{resp.status_code},开始重试")
            # The result is returned so the caller gets the retried report
            # rather than None. NOTE(review): the retry is unbounded.
            return self.get_v3_report(report_info['groupby'], report_info['columns'], report_info['startDate'],
                                      report_info['endDate'],
                                      report_info['reportType'], report_info['timeUnit'], report_info['download'])
        # No credentials are embedded here: botocore resolves them from the
        # environment, shared config or an instance role.
        s3_ = S3FileSystem(client_kwargs={'region_name': 'us-east-1',
                                          'endpoint_url': "https://s3.amazonaws.com"})
        with s3_.open(file_path, 'wb') as f:
            for data in resp.iter_content(chunk_size=10 * 1024):
                f.write(data)
        if not decompress:
            return file_path
        # Read the object back from S3 and parse it.
        with s3_.open(file_path, 'rb') as f, gzip.GzipFile(fileobj=f, mode='rb') as data:
            de_file = json.load(data)
        logger.info(f"解压完成:{de_file}")
        return de_file
class SBClient(BaseClient):
    """Sponsored Brands (SB) endpoints of the Amazon Advertising API.

    All calls go through ``self._request``. Finished reports are streamed
    to S3 and, by default, read back and parsed as gzip-compressed JSON.
    """

    # Report states treated as terminal errors. The code originally tested
    # only "FAILURE"; "FAILED" is accepted too so a failed v3 report raises
    # instead of falling through to a download without a URL.
    _FAILED_STATES = ("FAILURE", "FAILED")

    def _post_typed(self, url_path, media_type, body):
        """POST ``body`` using ``media_type`` for both Accept and Content-Type."""
        headers = {"Accept": media_type, "Content-Type": media_type}
        return self._request(url_path, method="POST", headers=headers, body=body)

    @staticmethod
    def _iter_pages(fetch, items_key, body):
        """Yield items from every page of a ``nextToken``-paginated list call."""
        body.setdefault("maxResults", 100)
        while True:
            info: dict = fetch(**body)
            yield from info[items_key]
            if not info.get("nextToken"):
                break
            body["nextToken"] = info["nextToken"]

    def get_campaigns(self, **body):
        """Return one page of ``POST /sb/v4/campaigns/list``."""
        # NOTE(review): "resouce" looks like a typo for "resource"; kept
        # byte-identical because it is sent on the wire - confirm.
        return self._post_typed("/sb/v4/campaigns/list", "application/vnd.sbcampaignresouce.v4+json", body)

    def get_campaign_v3(self, campaignId):
        """Return one v3 campaign, or the campaign list when ``campaignId`` is None."""
        if campaignId is None:
            url_path = '/sb/campaigns'
        else:
            url_path = f'/sb/campaigns/{campaignId}'
        return self._request(url_path, method="GET")

    def iter_campaigns(self, **body) -> Iterator[dict]:
        """Yield every campaign, following ``nextToken`` (100 per page by default)."""
        return self._iter_pages(self.get_campaigns, "campaigns", body)

    def get_ad_groups(self, **body):
        """Return one page of ``POST /sb/v4/adGroups/list``."""
        return self._post_typed("/sb/v4/adGroups/list", "application/vnd.sbadgroupresource.v4+json", body)

    def iter_adGroups(self, **body) -> Iterator[dict]:
        """Yield every ad group, following ``nextToken``."""
        return self._iter_pages(self.get_ad_groups, "adGroups", body)

    def get_ads(self, **body):
        """Return one page of ``POST /sb/v4/ads/list``."""
        return self._post_typed("/sb/v4/ads/list", "application/vnd.sbadresource.v4+json", body)

    def iter_ads(self, **body):
        """Yield every ad, following ``nextToken``."""
        return self._iter_pages(self.get_ads, "ads", body)

    def get_keywords(self, **param):
        """Return the response of ``GET /sb/keywords`` for the given query parameters."""
        return self._request("/sb/keywords", method="GET", params=param)

    def get_keyword(self, keywordid):
        """Return a single keyword by id."""
        return self._request(f'/sb/keywords/{keywordid}', method="GET")

    def iter_keywords(self, **param):
        """Yield keyword *pages* (lists) using ``startIndex``/``count`` paging.

        Defaults to ``startIndex=0`` and ``count=5000``. The index advances
        by the page size actually requested, so a caller-supplied ``count``
        neither skips nor repeats rows. Stops at the first empty page.
        """
        param.setdefault("startIndex", 0)
        param.setdefault("count", 5000)
        while True:
            info: list = self.get_keywords(**param)
            if not info:
                break
            param["startIndex"] += param["count"]
            yield info

    def get_targets(self, **body):
        """Return one page of ``POST /sb/targets/list``."""
        return self._request("/sb/targets/list", method="POST", body=body)

    def iter_targets(self, **body):
        """Yield every target, following ``nextToken``."""
        return self._iter_pages(self.get_targets, "targets", body)

    def get_budget(self, campaignIds: list):
        """Return budget usage for ``campaignIds``."""
        return self._request("/sb/campaigns/budget/usage", method="POST", body={"campaignIds": campaignIds})

    def get_keyword_bidrecommendation(self, **body):
        """Return the response of ``POST /sb/recommendations/bids``."""
        return self._request("/sb/recommendations/bids", method="POST", body=body)

    def _wait_for_report(self, ret, status_path, pending_states):
        """Poll ``status_path + reportId`` while the status is pending; return the last payload."""
        report_id = ret["reportId"]
        status = ret["status"]
        if status in self._FAILED_STATES:
            raise Exception(ret)
        logger.info(f"创建报告成功:{ret}")
        while status in pending_states:
            logger.debug(f"报告{report_id}正在处理中...")
            time.sleep(4)
            try:
                ret = self._request(f"{status_path}{report_id}")
            except Exception:
                # One slower second attempt; a second failure propagates.
                time.sleep(15)
                ret = self._request(f"{status_path}{report_id}")
            logger.debug("%s", ret)
            status = ret["status"]
        if status in self._FAILED_STATES:
            raise Exception(ret)
        logger.info(f"报告处理完成:{ret}")
        return ret

    @staticmethod
    def _upload_to_s3(resp, file_path):
        """Stream ``resp`` to ``file_path`` on S3 and return the filesystem used."""
        # No credentials are embedded here: botocore resolves them from the
        # environment, shared config or an instance role.
        s3_ = S3FileSystem(client_kwargs={'region_name': 'us-east-1',
                                          'endpoint_url': "https://s3.amazonaws.com"})
        with s3_.open(file_path, 'wb') as f:
            for data in resp.iter_content(chunk_size=10 * 1024):
                f.write(data)
        return s3_

    @staticmethod
    def _load_gzip_json(s3_, file_path):
        """Read ``file_path`` back from S3 and parse it as gzip-compressed JSON."""
        with s3_.open(file_path, 'rb') as f, gzip.GzipFile(fileobj=f, mode='rb') as data:
            de_file = json.load(data)
        logger.info(f"解压完成:{de_file}")
        return de_file

    def get_v3_report(self,
                      groupby: list,
                      columns: list,
                      startDate: str,
                      endDate: str,
                      reportType: Literal['sbCampaigns', 'sbPurchasedProduct', 'sbTargeting', 'sbSearchTerm'],
                      timeUnit="DAILY",
                      download=True):
        """Create a v3 SB report, wait for it and optionally download it.

        Now about reportType is only sbPurchasedProduct available.
        @param groupby: aggregation dimensions
        @param columns: fields to fetch [campaign,purchasedAsin,targeting,searchTerm]
        @param startDate: first day of the report
        @param endDate: last day of the report
        @param reportType: report type id
        @param timeUnit: time unit - [DAILY, SUMMARY]
        @param download: when true, store the report on S3 and return the
            result of ``download_v3_report``; otherwise return the final
            status payload
        @raise Exception: if the report ends in a failed state
        """
        headers = {
            "Content-Type": "application/vnd.createasyncreportrequest.v3+json"
        }
        body = {
            "name": "SB campaigns report",
            "startDate": startDate,
            "endDate": endDate,
            "configuration": {
                "adProduct": "SPONSORED_BRANDS",
                "groupBy": groupby,
                "columns": columns,
                "reportTypeId": reportType,
                "timeUnit": timeUnit,
                "format": "GZIP_JSON"
            }
        }
        ret = self._request("/reporting/reports", method="POST", headers=headers, body=body)
        ret = self._wait_for_report(ret, "/reporting/reports/", ("PROCESSING", "PENDING"))
        if not download:
            return ret
        pid = self.profile_id
        # Kept so a failed download can re-request the same report.
        report_info = {'groupby': groupby,
                       'columns': columns,
                       'startDate': startDate,
                       'endDate': endDate,
                       'reportType': reportType,
                       'timeUnit': timeUnit,
                       'download': download}
        return self.download_v3_report(
            report_info, ret['url'],
            f"s3://reportforspsbsd/zosi/us/sb/{startDate}_{endDate}_{reportType}_{str(groupby)}_{str(pid)}.json.gz")

    def download_v3_report(self, report_info, url, file_path: str, decompress: bool = True):
        """Stream a finished v3 report to S3 and optionally parse it.

        Returns ``file_path`` when ``decompress`` is false, otherwise the
        parsed JSON. On a non-200/207 download status the report is
        requested again and that result is returned.
        """
        resp = requests.get(url, stream=True, allow_redirects=True)
        if resp.status_code not in (200, 207):
            logger.info(f"状态码{resp.status_code},开始重试")
            # The result is returned so the caller gets the retried report
            # rather than None. NOTE(review): the retry is unbounded.
            return self.get_v3_report(report_info['groupby'], report_info['columns'], report_info['startDate'],
                                      report_info['endDate'],
                                      report_info['reportType'], report_info['timeUnit'], report_info['download'])
        s3_ = self._upload_to_s3(resp, file_path)
        if not decompress:
            return file_path
        return self._load_gzip_json(s3_, file_path)

    def get_v2_report(
            self,
            record_type: Literal['campaigns', 'adGroups', 'ads', 'targets', 'keywords'],
            report_date: str,
            metrics: List[str],
            segment: Literal['placement', 'query'] = None,
            creative_type: Literal['video', 'all'] = "all",
            download: bool = True
    ):
        """Create a v2 SB (``/v2/hsa``) report, wait for it and optionally download it.

        @param download: whether to download the file
        @param record_type: record type placed in the request path
        @param report_date: YYYYMMDD, in the timezone of the requested
            seller marketplace; reports older than 60 days are unavailable
        @param metrics: metric names, sent comma-joined
        @param segment: optional segment
        @param creative_type:
            None: non-video ads only
            'video': video ads only
            'all': video and non-video ads
            (always sent as "all" when ``record_type`` is "ads")
        @return: the final status payload, or the result of
            ``download_v2_report`` when ``download`` is true
        @raise Exception: if the report ends in a failed state
        """
        body = {
            "reportDate": report_date,
            "metrics": ",".join(metrics),
            "creativeType": creative_type,
            "segment": segment
        }
        if record_type == "ads":
            body["creativeType"] = "all"
        ret = self._request(f"/v2/hsa/{record_type}/report", method="POST", body=body)
        report_id = ret["reportId"]
        ret = self._wait_for_report(ret, "/v2/reports/", ("IN_PROGRESS",))
        if not download:
            return ret
        pid = self.profile_id
        report_info = {"record_type": record_type, "report_date": report_date, "metrics": metrics,
                       "segment": segment, "creative_type": creative_type, "download": download}
        return self.download_v2_report(
            report_info, report_id,
            f"s3://reportforspsbsd/zosi/us/sb/{str(report_date)}_{record_type}_{creative_type}_{segment}_{str(pid)}.gz")

    def download_v2_report(self, report_info, report_id: str, file_path: str, decompress: bool = True):
        """Download a finished v2 report to S3 and optionally parse it.

        Returns ``file_path`` when ``decompress`` is false, otherwise the
        parsed JSON. On a non-200/207 download status the report is
        requested again and that result is returned.
        """
        url = urljoin(URL_AD_API, f"/v2/reports/{report_id}/download")
        resp = requests.get(url, headers=self.auth_headers, stream=True, allow_redirects=True)
        if resp.status_code not in (200, 207):
            logger.info(f"状态码{resp.status_code},开始重试")
            # The result is returned so the caller gets the retried report
            # rather than None. NOTE(review): the retry is unbounded.
            return self.get_v2_report(report_info['record_type'], report_info['report_date'],
                                      report_info['metrics'],
                                      report_info['segment'], report_info['creative_type'],
                                      report_info['download'])
        logger.info(f"开始下载报告:{report_id}")
        s3_ = self._upload_to_s3(resp, file_path)
        logger.info(f"报告{report_id}下载完成:{file_path}")
        if not decompress:
            return file_path
        return self._load_gzip_json(s3_, file_path)
class SDClient(BaseClient):
    """Sponsored Display (SD) endpoints of the Amazon Advertising API.

    All calls go through ``self._request``. Finished reports are streamed
    to S3 and, by default, read back and parsed as gzip-compressed JSON.
    """

    # Report states treated as terminal errors. The code originally tested
    # only "FAILURE"; "FAILED" is accepted too so a failed v3 report raises
    # instead of falling through to a download without a URL.
    _FAILED_STATES = ("FAILURE", "FAILED")

    @staticmethod
    def _iter_index_pages(fetch, param):
        """Yield non-empty pages (lists) using ``startIndex``/``count`` paging.

        Defaults to ``startIndex=0`` and ``count=5000``. The index advances
        by the page size actually requested, so a caller-supplied ``count``
        neither skips nor repeats rows.
        """
        param.setdefault("startIndex", 0)
        param.setdefault("count", 5000)
        while True:
            info: list = fetch(**param)
            if not info:
                break
            param["startIndex"] += param["count"]
            yield info

    def get_campaigns(self, **params) -> List[dict]:
        """Return the response of ``GET /sd/campaigns``."""
        return self._request("/sd/campaigns", params=params)

    def get_campaigns_extended(self, **params) -> List[dict]:
        """Return the response of ``GET /sd/campaigns/extended``."""
        return self._request("/sd/campaigns/extended", params=params)

    def get_adGroups(self, **params):
        """Return the response of ``GET /sd/adGroups``."""
        return self._request('/sd/adGroups', params=params)

    def iter_adGroups(self, **param):
        """Yield ad-group pages (lists) until an empty page is returned."""
        return self._iter_index_pages(self.get_adGroups, param)

    def get_ads(self, **params):
        """Return the response of ``GET /sd/productAds``."""
        return self._request('/sd/productAds', params=params)

    def iter_ads(self, **param):
        """Yield product-ad pages (lists) until an empty page is returned."""
        return self._iter_index_pages(self.get_ads, param)

    def get_targets(self, **params):
        """Return the response of ``GET /sd/targets``."""
        return self._request('/sd/targets', params=params)

    def iter_targets(self, **param):
        """Yield target pages (lists) until an empty page is returned."""
        return self._iter_index_pages(self.get_targets, param)

    def get_budget(self, campaignIds: list):
        """Return budget usage for ``campaignIds``."""
        return self._request("/sd/campaigns/budget/usage", method="POST", body={"campaignIds": campaignIds})

    def get_target_bidrecommendation(self, tactic: str, products: list, typeFilter: list, themes: dict,
                                     locale: str = 'en_US'):
        """Return targeting recommendations from ``/sd/targets/recommendations``.

        Example argument values:
            tactic: "T00020"
            products: [{"asin": "B00MP57IOY"}]
            typeFilter: ["PRODUCT"]
            themes: {"product": [{"name": "TEST",
                                  "expression": [{"type": "asinBrandSameAs"}]}]}
        ``locale`` is sent as a query parameter.
        """
        headers = {
            'Content-Type': "application/vnd.sdtargetingrecommendations.v3.3+json",
            'Accept': "application/vnd.sdtargetingrecommendations.v3.3+json"
        }
        body = {
            "tactic": tactic,
            "products": products,
            "typeFilter": typeFilter,
            "themes": themes
        }
        return self._request('/sd/targets/recommendations', method="POST", headers=headers, body=body,
                             params={"locale": locale})

    def _wait_for_report(self, ret, status_path, pending_states):
        """Poll ``status_path + reportId`` while the status is pending; return the last payload."""
        report_id = ret["reportId"]
        status = ret["status"]
        logger.debug("%s", ret)
        if status in self._FAILED_STATES:
            raise Exception(ret)
        logger.info(f"创建报告成功:{ret}")
        while status in pending_states:
            logger.debug(f"报告{report_id}正在处理中...")
            time.sleep(4)
            try:
                ret = self._request(f"{status_path}{report_id}")
            except Exception:
                # One slower second attempt; a second failure propagates.
                time.sleep(15)
                ret = self._request(f"{status_path}{report_id}")
            logger.debug("%s", ret)
            status = ret["status"]
        if status in self._FAILED_STATES:
            raise Exception(ret)
        logger.info(f"报告处理完成:{ret}")
        return ret

    @staticmethod
    def _upload_to_s3(resp, file_path):
        """Stream ``resp`` to ``file_path`` on S3 and return the filesystem used."""
        # No credentials are embedded here: botocore resolves them from the
        # environment, shared config or an instance role.
        s3_ = S3FileSystem(client_kwargs={'region_name': 'us-east-1',
                                          'endpoint_url': "https://s3.amazonaws.com"})
        with s3_.open(file_path, 'wb') as f:
            for data in resp.iter_content(chunk_size=10 * 1024):
                f.write(data)
        return s3_

    @staticmethod
    def _load_gzip_json(s3_, file_path):
        """Read ``file_path`` back from S3 and parse it as gzip-compressed JSON."""
        with s3_.open(file_path, 'rb') as f, gzip.GzipFile(fileobj=f, mode='rb') as data:
            de_file = json.load(data)
        logger.info(f"解压完成:{de_file}")
        return de_file

    def get_v3_report(self,
                      groupby: list,
                      columns: list,
                      startDate: str,
                      endDate: str,
                      reportType: Literal['sdCampaigns', 'sdPurchasedProduct', 'sdTargeting', 'sdSearchTerm'],
                      timeUnit="DAILY",
                      download=True):
        """Create a v3 SD report, wait for it and optionally download it.

        Now about reportType is only sbPurchasedProduct available.
        @param groupby: aggregation dimensions
        @param columns: fields to fetch [campaign,purchasedAsin,targeting,searchTerm]
        @param startDate: first day of the report
        @param endDate: last day of the report
        @param reportType: report type id
        @param timeUnit: time unit - [DAILY, SUMMARY]
        @param download: when true, store the report on S3 and return the
            result of ``download_v3_report``; otherwise return the final
            status payload
        @raise Exception: if the report ends in a failed state
        """
        headers = {
            "Content-Type": "application/vnd.createasyncreportrequest.v3+json"
        }
        body = {
            "name": "SD campaigns report",
            "startDate": startDate,
            "endDate": endDate,
            "configuration": {
                "adProduct": "SPONSORED_DISPLAY",
                "groupBy": groupby,
                "columns": columns,
                "reportTypeId": reportType,
                "timeUnit": timeUnit,
                "format": "GZIP_JSON"
            }
        }
        ret = self._request("/reporting/reports", method="POST", headers=headers, body=body)
        ret = self._wait_for_report(ret, "/reporting/reports/", ("PROCESSING", "PENDING"))
        if not download:
            return ret
        pid = self.profile_id
        # Kept so a failed download can re-request the same report.
        report_info = {'groupby': groupby,
                       'columns': columns,
                       'startDate': startDate,
                       'endDate': endDate,
                       'reportType': reportType,
                       'timeUnit': timeUnit,
                       'download': download}
        return self.download_v3_report(
            report_info, ret['url'],
            f"s3://reportforspsbsd/zosi/us/sd/{startDate}_{endDate}_{reportType}_{str(groupby)}_{str(pid)}.json.gz")

    def download_v3_report(self, report_info, url, file_path: str, decompress: bool = True):
        """Stream a finished v3 report to S3 and optionally parse it.

        Returns ``file_path`` when ``decompress`` is false, otherwise the
        parsed JSON. On a non-200/207 download status the report is
        requested again and that result is returned.
        """
        resp = requests.get(url, stream=True, allow_redirects=True)
        if resp.status_code not in (200, 207):
            logger.info(f"状态码{resp.status_code},开始重试")
            # The result is returned so the caller gets the retried report
            # rather than None. NOTE(review): the retry is unbounded.
            return self.get_v3_report(report_info['groupby'], report_info['columns'], report_info['startDate'],
                                      report_info['endDate'],
                                      report_info['reportType'], report_info['timeUnit'], report_info['download'])
        s3_ = self._upload_to_s3(resp, file_path)
        if not decompress:
            return file_path
        return self._load_gzip_json(s3_, file_path)

    def get_v2_report(
            self,
            record_type: Literal['campaigns', 'adGroups', 'productAds', 'targets', 'asins'],
            report_date: str,
            metrics: List[str],
            segment: Literal['matchedTarget'] = None,
            tactic: Literal['T00020', 'T00030'] = None,
            download: bool = True
    ):
        """Create a v2 SD report, wait for it and optionally download it.

        @param download: whether to download the file
        @param record_type: record type placed in the request path
        @param report_date: YYYYMMDD, in the timezone of the requested
            seller marketplace; reports older than 60 days are unavailable
        @param metrics: metric names, sent comma-joined
        @param segment: optional segment
        @param tactic:
            T00020: contextual targeting
            T00030: audience targeting
        @return: the final status payload, or the result of
            ``download_v2_report`` when ``download`` is true
        @raise Exception: if the report ends in a failed state
        """
        body = {
            "reportDate": report_date,
            "metrics": ",".join(metrics),
            "tactic": tactic,
            "segment": segment
        }
        ret = self._request(f"/sd/{record_type}/report", method="POST", body=body)
        report_id = ret["reportId"]
        ret = self._wait_for_report(ret, "/v2/reports/", ("IN_PROGRESS",))
        if not download:
            return ret
        pid = self.profile_id
        report_info = {"record_type": record_type, "report_date": report_date, "metrics": metrics,
                       "segment": segment, "tactic": tactic, "download": download}
        return self.download_v2_report(
            report_info, report_id,
            f"s3://reportforspsbsd/zosi/us/sd/{str(report_date)}_{record_type}_{tactic}_{segment}_{str(pid)}.gz")

    def download_v2_report(self, report_info, report_id: str, file_path: str, decompress: bool = True):
        """Download a finished v2 report to S3 and optionally parse it.

        Returns ``file_path`` when ``decompress`` is false, otherwise the
        parsed JSON. On a non-200/207 download status the report is
        requested again and that result is returned.
        """
        url = urljoin(URL_AD_API, f"/v2/reports/{report_id}/download")
        resp = requests.get(url, headers=self.auth_headers, stream=True, allow_redirects=True)
        if resp.status_code not in (200, 207):
            logger.info(f"状态码{resp.status_code},开始重试")
            # The result is returned so the caller gets the retried report
            # rather than None. NOTE(review): the retry is unbounded.
            return self.get_v2_report(report_info['record_type'], report_info['report_date'],
                                      report_info['metrics'],
                                      report_info['segment'], report_info['tactic'], report_info['download'])
        logger.info(f"开始下载报告:{report_id}")
        s3_ = self._upload_to_s3(resp, file_path)
        logger.info(f"报告{report_id}下载完成:{file_path}")
        if not decompress:
            return file_path
        return self._load_gzip_json(s3_, file_path)
class Account(BaseClient):
    """Account-level endpoints of the Amazon Advertising API (portfolios)."""

    def get_portfolios(self):
        """Return the response of ``GET /v2/portfolios/extended``."""
        return self._request("/v2/portfolios/extended")

    def iter_portfolios(self):
        """Yield each entry of the ``get_portfolios`` response."""
        yield from self.get_portfolios()


# Alias so the class can be imported under the same ``*Client`` naming as
# the other clients in this module.
AccountClient = Account
if __name__ == '__main__':
    # Manual smoke-test entry point.
    #
    # SECURITY: the LWA client secret and refresh token that used to be
    # hard-coded here must be treated as leaked and rotated. They are now
    # read from the environment so that no secret lives in source control.
    # A missing variable raises KeyError immediately instead of failing later
    # with an opaque authentication error.
    import os

    AWS_CREDENTIALS = {
        'lwa_client_id': os.environ['AD_API_LWA_CLIENT_ID'],
        'refresh_token': os.environ['AD_API_REFRESH_TOKEN'],
        'lwa_client_secret': os.environ['AD_API_LWA_CLIENT_SECRET'],
        # The profile id is an identifier rather than a secret, so the
        # previous value stays as the default.
        'profile_id': os.environ.get('AD_API_PROFILE_ID', "3006125408623189"),
    }

    sb = SDClient(**AWS_CREDENTIALS)

    # Example calls (uncomment as needed):
    # sb.get_v3_report(groupby=["campaign"], columns=["impressions", "date"],
    #                  startDate="2023-10-28", endDate="2023-10-28",
    #                  reportType="sdCampaigns", timeUnit="DAILY")
    # print(list(sb.iter_budgetrecommendation(["<campaignId>", "<campaignId>"])))
    # print(list(sb.iter_campaigns(**{"stateFilter": {
    #     "include": ["ARCHIVED", "PAUSED", "ENABLED"]
    # }})))
    # a = list(sb.iter_targets(**{"campaignIdFilter": "257424912382921"}))
    # print(a, len(a))
    # print(sb.get_v2_report(record_type="campaigns", report_date="20231020",
    #                        tactic="T00030", metrics=['impressions']))
|