|
59 | 59 | "syntheticData": { |
60 | 60 | "demo": { |
61 | 61 | "heading": "Information about demo dataset", |
62 | | - "description": "A subset of the [Law School Admission Bar](https://www.kaggle.com/datasets/danofer/law-school-admissions-bar-passage)* dataset is used as a demo. Synthetic data will be generated for the following columns:\n \n \n- sex: student gender, i.e. 1 (male), 2 (female);\n- race1: race of student, i.e., asian, black, hispanic, white, other;\n- ugpa: undergraduate GPA of student (average course grades), continous variable;\n- bar: Ground truth label indicating whether or not the student passed the bar, i.e., passed 1st time, passed 2nd time, failed, non-graduated.\n \n \n\nThe CART method will be used evaluate the distribution and correlation differences between the real and synthetic data. CART generally produces higher quality synthetic datasets, but might not run on datasets with categorical variables with 20+ categories. Use Gaussian Copula in those cases.\n \n \n\n*The original paper can be found [here](https://files.eric.ed.gov/fulltext/ED469370.pdf)\n \n \n" |
| 62 | + "description": "A subset of the [Law School Admission Bar](https://www.kaggle.com/datasets/danofer/law-school-admissions-bar-passage)* dataset is used as a demo. Synthetic data will be generated for the following columns:\n \n \n- sex: student gender, i.e. 1 (male), 2 (female);\n- race1: race of student, i.e., asian, black, hispanic, white, other;\n- ugpa: undergraduate GPA of student (average course grades), continous variable;\n- bar: Ground truth label indicating whether or not the student passed the bar, i.e., passed 1st time, passed 2nd time, failed, non-graduated.\n \n \n\nThe The CART method is used to generate the synthetic data. CART generally produces higher quality synthetic datasets, but might not run on datasets with categorical variables with 20+ categories. Use Gaussian Copula in those cases.\n \n \n\n*The original paper can be found [here](https://files.eric.ed.gov/fulltext/ED469370.pdf)\n \n \n" |
63 | 63 | }, |
64 | 64 | "exportToPDF": "Download evaluation report as pdf", |
65 | 65 | "exportToJSON": "Download synthetic data as json", |
|
90 | 90 | "title": "Try it out!", |
91 | 91 | "description": "Do you not have a dataset at hand? No worries use our demo dataset." |
92 | 92 | }, |
93 | | - "columnsInDatasetInfo": "If detected data types are incorrect, please change this locally in the dataset before attaching it again.", |
| 93 | + "columnsInDatasetInfo": "If the detected data types are incorrect, please change this locally in the source dataset before attaching it to the app.", |
94 | 94 | "univariateCharts": "Univariate distributions", |
95 | 95 | "bivariateDistributionRealData": "Bivariate distribution", |
96 | 96 | "univariateDistributionSyntheticData": "Univariate distribution", |
97 | 97 | "bivariateDistributionSyntheticData": "Bivariate distribution", |
98 | 98 | "correlationRealdata": "Correlation matrix", |
99 | 99 | "correlationSyntheticData": "Correlation matrix", |
100 | 100 | "dataSetPreview": { |
101 | | - "heading": "0. Preview of data" |
| 101 | + "heading": "0. Preview of real data" |
102 | 102 | }, |
103 | 103 | "columnsInDataset": "1. Data types detection", |
104 | 104 | "_explanatoryDataAnalysisTitle": "2. Explanatory data analysis", |
|
0 commit comments