repository-statistics / python-app /update_metrics.py
LysandreJik's picture
Initial commit
38e70c4
raw
history blame
1.21 kB
import pypistats
from huggingface_hub import list_datasets
from datasets import load_dataset, concatenate_datasets, Dataset
def update_pip_installs():
    """Fetch PyPI download statistics for every pip-install metrics dataset.

    Lists the Hub datasets authored by ``open-source-metrics``, keeps the ones
    whose id contains ``pip``, and for each of them queries pypistats for the
    library named in the dataset id. The result is reshaped into a ``Dataset``
    that only holds the ``day`` and ``num_downloads`` columns.

    NOTE(review): the dataset loaded from the Hub and the extracted ``days``
    are not used further and nothing is written back; the function looks
    unfinished.
    """
    metrics_datasets = [
        d.id for d in list_datasets(author='open-source-metrics', use_auth_token=True)
    ]
    pip_installs_datasets = [d for d in metrics_datasets if 'pip' in d]

    for dataset_name in pip_installs_datasets:
        dataset = load_dataset(dataset_name, use_auth_token=True)

        # The library name comes from the dataset *id* (a string), not from the
        # loaded dataset object: take the part after the author prefix, up to
        # the first dash.
        # presumably ids look like "<author>/<library>-pip-..." -- TODO confirm
        library_name = dataset_name.split('/')[1].split('-')[0]

        data = pypistats.overall(library_name, total=True, format="pandas")
        data = data.groupby("category").get_group("without_mirrors").sort_values("date")
        data = data.drop(columns=['category', 'percent'])

        # Dataset methods return a new dataset instead of mutating in place,
        # so every result has to be re-assigned.
        pypistats_dataset = Dataset.from_pandas(data)
        pypistats_dataset = pypistats_dataset.rename_column('downloads', 'num_downloads')
        pypistats_dataset = pypistats_dataset.rename_column('date', 'day')

        # Drop whatever else came along from the DataFrame conversion.
        extra_columns = [
            name
            for name in pypistats_dataset.column_names
            if name not in ('num_downloads', 'day')
        ]
        if extra_columns:
            pypistats_dataset = pypistats_dataset.remove_columns(extra_columns)

        days = pypistats_dataset['day']
# Module-level call: the update runs whenever this file is executed or imported.
update_pip_installs()