Skip to content

Commit a0adb18

Browse files
committed
Move data loading libs to web-python
1 parent 2efd3a7 commit a0adb18

File tree

1 file changed

+12
-132
lines changed

1 file changed

+12
-132
lines changed

projects.yaml

Lines changed: 12 additions & 132 deletions
Original file line numberDiff line numberDiff line change
@@ -2711,95 +2711,6 @@ projects:
27112711
github_id: rapidsai/cusignal
27122712
description: "GPU accelerated signal processing."
27132713
category: gpu-utilities
2714-
# Data Loading & Extraction
2715-
- name: Tablib
2716-
pypi_id: tablib
2717-
github_id: jazzband/tablib
2718-
conda_id: conda-forge/tablib
2719-
category: data-loading
2720-
- name: python-magic
2721-
pypi_id: python-magic
2722-
github_id: ahupp/python-magic
2723-
conda_id: conda-forge/python-magic
2724-
category: data-loading
2725-
- name: SDV
2726-
pypi_id: sdv
2727-
github_id: sdv-dev/SDV
2728-
category: data-loading
2729-
- name: Intake
2730-
pypi_id: intake
2731-
github_id: intake/intake
2732-
conda_id: conda-forge/intake
2733-
category: data-loading
2734-
- name: csvkit
2735-
pypi_id: csvkit
2736-
github_id: wireservice/csvkit
2737-
conda_id: conda-forge/csvkit
2738-
category: data-loading
2739-
- name: snorkel
2740-
pypi_id: snorkel
2741-
github_id: snorkel-team/snorkel
2742-
conda_id: conda-forge/snorkel
2743-
category: data-loading
2744-
- name: pyexcel-xlsx
2745-
pypi_id: pyexcel-xlsx
2746-
github_id: pyexcel/pyexcel-xlsx
2747-
conda_id: conda-forge/pyexcel-xlsx
2748-
category: data-loading
2749-
- name: Faker
2750-
pypi_id: Faker
2751-
github_id: joke2k/faker
2752-
conda_id: conda-forge/faker
2753-
category: data-loading
2754-
- name: smart-open
2755-
pypi_id: smart-open
2756-
github_id: RaRe-Technologies/smart_open
2757-
category: data-loading
2758-
- name: pandas-datareader
2759-
pypi_id: pandas-datareader
2760-
github_id: pydata/pandas-datareader
2761-
conda_id: conda-forge/pandas-datareader
2762-
labels: ["pandas"]
2763-
category: data-loading
2764-
- name: openpyxl
2765-
pypi_id: openpyxl
2766-
gitlab_id: "https://foss.heptapod.net/api/graphql::openpyxl/openpyxl"
2767-
conda_id: openpyxl
2768-
dockerhub_id: "openpyxl/openpyxl-ci"
2769-
docs_url: https://openpyxl.readthedocs.io/en/stable/
2770-
license: MIT
2771-
category: data-loading
2772-
- name: TensorFlow Datasets
2773-
pypi_id: tensorflow-datasets
2774-
github_id: tensorflow/datasets
2775-
labels: ["tensorflow"]
2776-
category: data-loading
2777-
- name: textract
2778-
pypi_id: textract
2779-
github_id: deanmalmgren/textract
2780-
conda_id: conda-forge/textract
2781-
category: data-loading
2782-
- name: PDFMiner
2783-
pypi_id: pdfminer
2784-
conda_id: conda-forge/pdfminer
2785-
github_id: euske/pdfminer
2786-
category: data-loading
2787-
- name: xmltodict
2788-
pypi_id: xmltodict
2789-
github_id: martinblech/xmltodict
2790-
conda_id: conda-forge/xmltodict
2791-
category: data-loading
2792-
- name: Singer
2793-
pypi_id: singer-python
2794-
github_id: singer-io/getting-started
2795-
description: "Standard for moving data between databases, web APIs, files, queues, and just about anything else you can think of."
2796-
license: AGPL-3.0
2797-
category: data-loading
2798-
- name: xlrd
2799-
pypi_id: xlrd
2800-
github_id: python-excel/xlrd
2801-
conda_id: conda-forge/xlrd
2802-
category: data-loading
28032714
# Data Pipelines & Streaming
28042715
- name: Great Expectations
28052716
pypi_id: great_expectations
@@ -3578,15 +3489,18 @@ projects:
35783489
github_id: erikbern/ann-benchmarks
35793490
resource: True
35803491
category: nn-search
3581-
- name: Datasets
3582-
pypi_id: datasets
3583-
github_id: huggingface/datasets
3584-
category: data-loading
35853492
- name: best-of-web-python - Web Scraping
35863493
github_id: ml-tooling/best-of-web-python
3494+
homepage: https://github.com/ml-tooling/best-of-web-python#web-scraping--crawling
35873495
description: "Collection of web-scraping and crawling libraries."
35883496
resource: True
35893497
category: web-scraping
3498+
- name: best-of-web-python - Data Extraction
3499+
github_id: ml-tooling/best-of-web-python
3500+
homepage: https://github.com/ml-tooling/best-of-web-python#data-loading--extraction
3501+
description: "Collection of data-loading and -extraction libraries."
3502+
resource: True
3503+
category: data-loading
35903504
- name: m2cgen
35913505
github_id: BayesWitnesses/m2cgen
35923506
category: "model-serialisation"
@@ -3623,23 +3537,6 @@ projects:
36233537
category: data-containers
36243538
conda_id: conda-forge/bcolz
36253539
pypi_id: bcolz
3626-
- name: tabulator-py
3627-
github_id: frictionlessdata/tabulator-py
3628-
category: data-loading
3629-
conda_id: conda-forge/tabulator-py
3630-
pypi_id: tabulator
3631-
- name: messytables
3632-
github_id: okfn/messytables
3633-
category: data-loading
3634-
pypi_id: messytables
3635-
- name: datatest
3636-
github_id: shawnbrown/datatest
3637-
category: data-loading
3638-
pypi_id: datatest
3639-
- name: rows
3640-
github_id: turicas/rows
3641-
category: data-loading
3642-
pypi_id: rows
36433540
- name: dpark
36443541
github_id: douban/dpark
36453542
category: data-pipelines
@@ -4220,28 +4117,6 @@ projects:
42204117
github_id: pola-rs/polars
42214118
category: data-containers
42224119
pypi_id: polars
4223-
- name: deepdish
4224-
github_id: uchicago-cs/deepdish
4225-
category: data-loading
4226-
conda_id: conda-forge/deepdish
4227-
pypi_id: deepdish
4228-
- name: camelot
4229-
github_id: camelot-dev/camelot
4230-
category: data-loading
4231-
pypi_id: camelot
4232-
- name: excalibur
4233-
github_id: camelot-dev/excalibur
4234-
category: data-loading
4235-
pypi_id: excalibur-py
4236-
- name: xlwings
4237-
github_id: xlwings/xlwings
4238-
category: data-loading
4239-
conda_id: conda-forge/xlwings
4240-
pypi_id: xlwings
4241-
- name: csvs-to-sqlite
4242-
github_id: simonw/csvs-to-sqlite
4243-
category: data-loading
4244-
pypi_id: csvs-to-sqlite
42454120
- name: huey
42464121
github_id: coleifer/huey
42474122
category: data-pipelines
@@ -4491,3 +4366,8 @@ projects:
44914366
github_id: linkedin/greykite
44924367
category: time-series-data
44934368
pypi_id: greykite
4369+
- name: TensorFlow Datasets
4370+
pypi_id: tensorflow-datasets
4371+
github_id: tensorflow/datasets
4372+
labels: ["tensorflow"]
4373+
category: tensorflow-utils

0 commit comments

Comments
 (0)