|
2 | 2 |
|
3 | 3 | import logging |
4 | 4 |
|
5 | | -import pandas as pd |
6 | | - |
7 | 5 | from download_analytics.metrics import compute_metrics |
8 | | -from download_analytics.output import create_csv, get_path, load_csv |
| 6 | +from download_analytics.output import create_csv, get_path |
9 | 7 | from download_analytics.pypi import get_pypi_downloads |
| 8 | +from download_analytics.summarize import get_previous_pypi_downloads |
10 | 9 |
|
11 | 10 | LOGGER = logging.getLogger(__name__) |
12 | 11 |
|
@@ -49,27 +48,28 @@ def collect_downloads( |
49 | 48 | if not projects: |
50 | 49 | raise ValueError('No projects have been passed') |
51 | 50 |
|
52 | | - LOGGER.info(f'Collecting downloads for projects={projects}') |
| 51 | + LOGGER.info(f'Collecting new downloads for projects={projects}') |
53 | 52 |
|
54 | 53 | csv_path = get_path(output_folder, 'pypi.csv') |
55 | | - read_csv_kwargs = { |
56 | | - 'parse_dates': ['timestamp'], |
57 | | - 'dtype': { |
58 | | - 'country_code': pd.CategoricalDtype(), |
59 | | - 'project': pd.CategoricalDtype(), |
60 | | - 'version': pd.CategoricalDtype(), |
61 | | - 'type': pd.CategoricalDtype(), |
62 | | - 'installer_name': pd.CategoricalDtype(), |
63 | | - 'implementation_name': pd.CategoricalDtype(), |
64 | | - 'implementation_version': pd.CategoricalDtype(), |
65 | | - 'distro_name': pd.CategoricalDtype(), |
66 | | - 'distro_version': pd.CategoricalDtype(), |
67 | | - 'system_name': pd.CategoricalDtype(), |
68 | | - 'system_release': pd.CategoricalDtype(), |
69 | | - 'cpu': pd.CategoricalDtype(), |
70 | | - }, |
71 | | - } |
72 | | - previous = load_csv(csv_path, dry_run=dry_run, read_csv_kwargs=read_csv_kwargs) |
| 54 | + # read_csv_kwargs = { |
| 55 | + # 'parse_dates': ['timestamp'], |
| 56 | + # 'dtype': { |
| 57 | + # 'country_code': pd.CategoricalDtype(), |
| 58 | + # 'project': pd.CategoricalDtype(), |
| 59 | + # 'version': pd.CategoricalDtype(), |
| 60 | + # 'type': pd.CategoricalDtype(), |
| 61 | + # 'installer_name': pd.CategoricalDtype(), |
| 62 | + # 'implementation_name': pd.CategoricalDtype(), |
| 63 | + # 'implementation_version': pd.CategoricalDtype(), |
| 64 | + # 'distro_name': pd.CategoricalDtype(), |
| 65 | + # 'distro_version': pd.CategoricalDtype(), |
| 66 | + # 'system_name': pd.CategoricalDtype(), |
| 67 | + # 'system_release': pd.CategoricalDtype(), |
| 68 | + # 'cpu': pd.CategoricalDtype(), |
| 69 | + # }, |
| 70 | + # } |
| 71 | + previous = get_previous_pypi_downloads(input_file=None, output_folder=output_folder) |
| 72 | + # previous = load_csv(csv_path, read_csv_kwargs=read_csv_kwargs) |
73 | 73 |
|
74 | 74 | pypi_downloads = get_pypi_downloads( |
75 | 75 | projects=projects, |
|
0 commit comments