@@ -2711,95 +2711,6 @@ projects:
27112711 github_id : rapidsai/cusignal
27122712 description : " GPU accelerated signal processing."
27132713 category : gpu-utilities
2714- # Data Loading & Extraction
2715- - name : Tablib
2716- pypi_id : tablib
2717- github_id : jazzband/tablib
2718- conda_id : conda-forge/tablib
2719- category : data-loading
2720- - name : python-magic
2721- pypi_id : python-magic
2722- github_id : ahupp/python-magic
2723- conda_id : conda-forge/python-magic
2724- category : data-loading
2725- - name : SDV
2726- pypi_id : sdv
2727- github_id : sdv-dev/SDV
2728- category : data-loading
2729- - name : Intake
2730- pypi_id : intake
2731- github_id : intake/intake
2732- conda_id : conda-forge/intake
2733- category : data-loading
2734- - name : csvkit
2735- pypi_id : csvkit
2736- github_id : wireservice/csvkit
2737- conda_id : conda-forge/csvkit
2738- category : data-loading
2739- - name : snorkel
2740- pypi_id : snorkel
2741- github_id : snorkel-team/snorkel
2742- conda_id : conda-forge/snorkel
2743- category : data-loading
2744- - name : pyexcel-xlsx
2745- pypi_id : pyexcel-xlsx
2746- github_id : pyexcel/pyexcel-xlsx
2747- conda_id : conda-forge/pyexcel-xlsx
2748- category : data-loading
2749- - name : Faker
2750- pypi_id : Faker
2751- github_id : joke2k/faker
2752- conda_id : conda-forge/faker
2753- category : data-loading
2754- - name : smart-open
2755- pypi_id : smart-open
2756- github_id : RaRe-Technologies/smart_open
2757- category : data-loading
2758- - name : pandas-datareader
2759- pypi_id : pandas-datareader
2760- github_id : pydata/pandas-datareader
2761- conda_id : conda-forge/pandas-datareader
2762- labels : ["pandas"]
2763- category : data-loading
2764- - name : openpyxl
2765- pypi_id : openpyxl
2766- gitlab_id : " https://foss.heptapod.net/api/graphql::openpyxl/openpyxl"
2767- conda_id : openpyxl
2768- dockerhub_id : " openpyxl/openpyxl-ci"
2769- docs_url : https://openpyxl.readthedocs.io/en/stable/
2770- license : MIT
2771- category : data-loading
2772- - name : TensorFlow Datasets
2773- pypi_id : tensorflow-datasets
2774- github_id : tensorflow/datasets
2775- labels : ["tensorflow"]
2776- category : data-loading
2777- - name : textract
2778- pypi_id : textract
2779- github_id : deanmalmgren/textract
2780- conda_id : conda-forge/textract
2781- category : data-loading
2782- - name : PDFMiner
2783- pypi_id : pdfminer
2784- conda_id : conda-forge/pdfminer
2785- github_id : euske/pdfminer
2786- category : data-loading
2787- - name : xmltodict
2788- pypi_id : xmltodict
2789- github_id : martinblech/xmltodict
2790- conda_id : conda-forge/xmltodict
2791- category : data-loading
2792- - name : Singer
2793- pypi_id : singer-python
2794- github_id : singer-io/getting-started
2795- description : " Standard for moving data between databases, web APIs, files, queues, and just about anything else you can think of."
2796- license : AGPL-3.0
2797- category : data-loading
2798- - name : xlrd
2799- pypi_id : xlrd
2800- github_id : python-excel/xlrd
2801- conda_id : conda-forge/xlrd
2802- category : data-loading
28032714 # Data Pipelines & Streaming
28042715 - name : Great Expectations
28052716 pypi_id : great_expectations
@@ -3578,15 +3489,18 @@ projects:
35783489 github_id : erikbern/ann-benchmarks
35793490 resource : True
35803491 category : nn-search
3581- - name : Datasets
3582- pypi_id : datasets
3583- github_id : huggingface/datasets
3584- category : data-loading
35853492 - name : best-of-web-python - Web Scraping
35863493 github_id : ml-tooling/best-of-web-python
3494+ homepage : https://github.com/ml-tooling/best-of-web-python#web-scraping--crawling
35873495 description : " Collection of web-scraping and crawling libraries."
35883496 resource : True
35893497 category : web-scraping
3498+ - name : best-of-web-python - Data Extraction
3499+ github_id : ml-tooling/best-of-web-python
3500+ homepage : https://github.com/ml-tooling/best-of-web-python#data-loading--extraction
3501+ description : " Collection of data-loading and -extraction libraries."
3502+ resource : True
3503+ category : data-loading
35903504 - name : m2cgen
35913505 github_id : BayesWitnesses/m2cgen
35923506 category : " model-serialisation"
@@ -3623,23 +3537,6 @@ projects:
36233537 category : data-containers
36243538 conda_id : conda-forge/bcolz
36253539 pypi_id : bcolz
3626- - name : tabulator-py
3627- github_id : frictionlessdata/tabulator-py
3628- category : data-loading
3629- conda_id : conda-forge/tabulator-py
3630- pypi_id : tabulator
3631- - name : messytables
3632- github_id : okfn/messytables
3633- category : data-loading
3634- pypi_id : messytables
3635- - name : datatest
3636- github_id : shawnbrown/datatest
3637- category : data-loading
3638- pypi_id : datatest
3639- - name : rows
3640- github_id : turicas/rows
3641- category : data-loading
3642- pypi_id : rows
36433540 - name : dpark
36443541 github_id : douban/dpark
36453542 category : data-pipelines
@@ -4220,28 +4117,6 @@ projects:
42204117 github_id : pola-rs/polars
42214118 category : data-containers
42224119 pypi_id : polars
4223- - name : deepdish
4224- github_id : uchicago-cs/deepdish
4225- category : data-loading
4226- conda_id : conda-forge/deepdish
4227- pypi_id : deepdish
4228- - name : camelot
4229- github_id : camelot-dev/camelot
4230- category : data-loading
4231- pypi_id : camelot
4232- - name : excalibur
4233- github_id : camelot-dev/excalibur
4234- category : data-loading
4235- pypi_id : excalibur-py
4236- - name : xlwings
4237- github_id : xlwings/xlwings
4238- category : data-loading
4239- conda_id : conda-forge/xlwings
4240- pypi_id : xlwings
4241- - name : csvs-to-sqlite
4242- github_id : simonw/csvs-to-sqlite
4243- category : data-loading
4244- pypi_id : csvs-to-sqlite
42454120 - name : huey
42464121 github_id : coleifer/huey
42474122 category : data-pipelines
@@ -4491,3 +4366,8 @@ projects:
44914366 github_id : linkedin/greykite
44924367 category : time-series-data
44934368 pypi_id : greykite
4369+ - name : TensorFlow Datasets
4370+ pypi_id : tensorflow-datasets
4371+ github_id : tensorflow/datasets
4372+ labels : ["tensorflow"]
4373+ category : tensorflow-utils
0 commit comments