Skip to content

Commit 4b0d8b3

Browse files
committed
Try smaller chunk size
1 parent 9dd2757 commit 4b0d8b3

File tree

1 file changed

+4
-4
lines changed

1 file changed

+4
-4
lines changed

adscrawler/app_stores/scrape_stores.py

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -130,7 +130,7 @@ def update_app_details(
     df = df.sort_values("country_code").reset_index(drop=True)
     logger.info(f"{log_info} start {len(df)} apps")
 
-    max_chunk_size = 3000
+    max_chunk_size = 1000
     chunks = []
     # Try keeping countries together for larger end S3 files
     for _country, country_df in df.groupby("country_code"):
@@ -644,9 +644,9 @@ def save_developer_info(
     apps_df: pd.DataFrame,
     database_connection: PostgresCon,
 ) -> pd.DataFrame:
-    assert apps_df["developer_id"].to_numpy()[0], (
-        f"{apps_df['store_id']} Missing Developer ID"
-    )
+    assert apps_df["developer_id"].to_numpy()[
+        0
+    ], f"{apps_df['store_id']} Missing Developer ID"
     df = (
         apps_df[["store", "developer_id", "developer_name"]]
         .rename(columns={"developer_name": "name"})

0 commit comments

Comments
 (0)