|
388 | 388 | " <tbody>\n", |
389 | 389 | " <tr>\n", |
390 | 390 | " <th>0</th>\n", |
391 | | - " <td>0</td>\n", |
392 | | - " <td>26.155148</td>\n", |
| 391 | + " <td>1</td>\n", |
| 392 | + " <td>27.000861</td>\n", |
| 393 | + " <td>3</td>\n", |
| 394 | + " <td>5940.743483</td>\n", |
393 | 395 | " <td>4</td>\n", |
394 | | - " <td>-8.000000</td>\n", |
395 | | - " <td>2</td>\n", |
396 | 396 | " <td>0</td>\n", |
397 | 397 | " </tr>\n", |
398 | 398 | " <tr>\n", |
399 | 399 | " <th>1</th>\n", |
400 | 400 | " <td>1</td>\n", |
401 | | - " <td>37.983907</td>\n", |
| 401 | + " <td>33.685012</td>\n", |
402 | 402 | " <td>3</td>\n", |
403 | | - " <td>1584.939480</td>\n", |
| 403 | + " <td>1747.087586</td>\n", |
404 | 404 | " <td>4</td>\n", |
405 | 405 | " <td>1</td>\n", |
406 | 406 | " </tr>\n", |
407 | 407 | " <tr>\n", |
408 | 408 | " <th>2</th>\n", |
409 | 409 | " <td>0</td>\n", |
410 | | - " <td>67.653086</td>\n", |
| 410 | + " <td>76.212963</td>\n", |
411 | 411 | " <td>5</td>\n", |
412 | | - " <td>1067.917131</td>\n", |
| 412 | + " <td>955.997763</td>\n", |
413 | 413 | " <td>2</td>\n", |
414 | 414 | " <td>0</td>\n", |
415 | 415 | " </tr>\n", |
416 | 416 | " <tr>\n", |
417 | 417 | " <th>3</th>\n", |
418 | | - " <td>0</td>\n", |
419 | | - " <td>48.066803</td>\n", |
| 418 | + " <td>1</td>\n", |
| 419 | + " <td>36.493914</td>\n", |
420 | 420 | " <td>3</td>\n", |
421 | | - " <td>1892.519382</td>\n", |
| 421 | + " <td>1783.896317</td>\n", |
422 | 422 | " <td>4</td>\n", |
423 | | - " <td>0</td>\n", |
| 423 | + " <td>1</td>\n", |
424 | 424 | " </tr>\n", |
425 | 425 | " <tr>\n", |
426 | 426 | " <th>4</th>\n", |
427 | 427 | " <td>0</td>\n", |
428 | | - " <td>53.574285</td>\n", |
429 | | - " <td>5</td>\n", |
430 | | - " <td>1114.231039</td>\n", |
| 428 | + " <td>54.019538</td>\n", |
| 429 | + " <td>3</td>\n", |
| 430 | + " <td>791.422965</td>\n", |
431 | 431 | " <td>4</td>\n", |
432 | 432 | " <td>0</td>\n", |
433 | 433 | " </tr>\n", |
|
437 | 437 | ], |
438 | 438 | "text/plain": [ |
439 | 439 | " sex age marital income ls smoke\n", |
440 | | - "0 0 26.155148 4 -8.000000 2 0\n", |
441 | | - "1 1 37.983907 3 1584.939480 4 1\n", |
442 | | - "2 0 67.653086 5 1067.917131 2 0\n", |
443 | | - "3 0 48.066803 3 1892.519382 4 0\n", |
444 | | - "4 0 53.574285 5 1114.231039 4 0" |
| 440 | + "0 1 27.000861 3 5940.743483 4 0\n", |
| 441 | + "1 1 33.685012 3 1747.087586 4 1\n", |
| 442 | + "2 0 76.212963 5 955.997763 2 0\n", |
| 443 | + "3 1 36.493914 3 1783.896317 4 1\n", |
| 444 | + "4 0 54.019538 3 791.422965 4 0" |
445 | 445 | ] |
446 | 446 | }, |
447 | 447 | "metadata": {}, |
|
499 | 499 | " <tbody>\n", |
500 | 500 | " <tr>\n", |
501 | 501 | " <th>0</th>\n", |
502 | | - " <td>FEMALE</td>\n", |
503 | | - " <td>26.155148</td>\n", |
504 | | - " <td>SINGLE</td>\n", |
505 | | - " <td>-8.000000</td>\n", |
506 | | - " <td>MOSTLY DISSATISFIED</td>\n", |
| 502 | + " <td>MALE</td>\n", |
| 503 | + " <td>27.000861</td>\n", |
| 504 | + " <td>MARRIED</td>\n", |
| 505 | + " <td>5940.743483</td>\n", |
| 506 | + " <td>PLEASED</td>\n", |
507 | 507 | " <td>NO</td>\n", |
508 | 508 | " </tr>\n", |
509 | 509 | " <tr>\n", |
510 | 510 | " <th>1</th>\n", |
511 | 511 | " <td>MALE</td>\n", |
512 | | - " <td>37.983907</td>\n", |
| 512 | + " <td>33.685012</td>\n", |
513 | 513 | " <td>MARRIED</td>\n", |
514 | | - " <td>1584.939480</td>\n", |
| 514 | + " <td>1747.087586</td>\n", |
515 | 515 | " <td>PLEASED</td>\n", |
516 | 516 | " <td>YES</td>\n", |
517 | 517 | " </tr>\n", |
518 | 518 | " <tr>\n", |
519 | 519 | " <th>2</th>\n", |
520 | 520 | " <td>FEMALE</td>\n", |
521 | | - " <td>67.653086</td>\n", |
| 521 | + " <td>76.212963</td>\n", |
522 | 522 | " <td>WIDOWED</td>\n", |
523 | | - " <td>1067.917131</td>\n", |
| 523 | + " <td>955.997763</td>\n", |
524 | 524 | " <td>MOSTLY DISSATISFIED</td>\n", |
525 | 525 | " <td>NO</td>\n", |
526 | 526 | " </tr>\n", |
527 | 527 | " <tr>\n", |
528 | 528 | " <th>3</th>\n", |
529 | | - " <td>FEMALE</td>\n", |
530 | | - " <td>48.066803</td>\n", |
| 529 | + " <td>MALE</td>\n", |
| 530 | + " <td>36.493914</td>\n", |
531 | 531 | " <td>MARRIED</td>\n", |
532 | | - " <td>1892.519382</td>\n", |
| 532 | + " <td>1783.896317</td>\n", |
533 | 533 | " <td>PLEASED</td>\n", |
534 | | - " <td>NO</td>\n", |
| 534 | + " <td>YES</td>\n", |
535 | 535 | " </tr>\n", |
536 | 536 | " <tr>\n", |
537 | 537 | " <th>4</th>\n", |
538 | 538 | " <td>FEMALE</td>\n", |
539 | | - " <td>53.574285</td>\n", |
540 | | - " <td>WIDOWED</td>\n", |
541 | | - " <td>1114.231039</td>\n", |
| 539 | + " <td>54.019538</td>\n", |
| 540 | + " <td>MARRIED</td>\n", |
| 541 | + " <td>791.422965</td>\n", |
542 | 542 | " <td>PLEASED</td>\n", |
543 | 543 | " <td>NO</td>\n", |
544 | 544 | " </tr>\n", |
|
548 | 548 | ], |
549 | 549 | "text/plain": [ |
550 | 550 | " sex age marital income ls smoke\n", |
551 | | - "0 FEMALE 26.155148 SINGLE -8.000000 MOSTLY DISSATISFIED NO\n", |
552 | | - "1 MALE 37.983907 MARRIED 1584.939480 PLEASED YES\n", |
553 | | - "2 FEMALE 67.653086 WIDOWED 1067.917131 MOSTLY DISSATISFIED NO\n", |
554 | | - "3 FEMALE 48.066803 MARRIED 1892.519382 PLEASED NO\n", |
555 | | - "4 FEMALE 53.574285 WIDOWED 1114.231039 PLEASED NO" |
| 551 | + "0 MALE 27.000861 MARRIED 5940.743483 PLEASED NO\n", |
| 552 | + "1 MALE 33.685012 MARRIED 1747.087586 PLEASED YES\n", |
| 553 | + "2 FEMALE 76.212963 WIDOWED 955.997763 MOSTLY DISSATISFIED NO\n", |
| 554 | + "3 MALE 36.493914 MARRIED 1783.896317 PLEASED YES\n", |
| 555 | + "4 FEMALE 54.019538 MARRIED 791.422965 PLEASED NO" |
556 | 556 | ] |
557 | 557 | }, |
558 | 558 | "metadata": {}, |
|
633 | 633 | " <td>N/A</td>\n", |
634 | 634 | " <td>N/A</td>\n", |
635 | 635 | " <td>N/A</td>\n", |
636 | | - " <td>0.9364</td>\n", |
| 636 | + " <td>0.9964</td>\n", |
637 | 637 | " <td>N/A</td>\n", |
638 | 638 | " <td>1.0</td>\n", |
639 | 639 | " <td>1.0</td>\n", |
|
643 | 643 | " <td>age</td>\n", |
644 | 644 | " <td>numerical</td>\n", |
645 | 645 | " <td>1.0</td>\n", |
646 | | - " <td>0.934821</td>\n", |
| 646 | + " <td>0.885944</td>\n", |
647 | 647 | " <td>1.0</td>\n", |
648 | | - " <td>0.9368</td>\n", |
| 648 | + " <td>0.9342</td>\n", |
649 | 649 | " <td>N/A</td>\n", |
650 | | - " <td>0.969487</td>\n", |
| 650 | + " <td>0.966491</td>\n", |
651 | 651 | " <td>N/A</td>\n", |
652 | 652 | " <td>N/A</td>\n", |
653 | 653 | " </tr>\n", |
|
659 | 659 | " <td>N/A</td>\n", |
660 | 660 | " <td>N/A</td>\n", |
661 | 661 | " <td>N/A</td>\n", |
662 | | - " <td>0.9574</td>\n", |
| 662 | + " <td>0.975</td>\n", |
663 | 663 | " <td>N/A</td>\n", |
664 | 664 | " <td>0.833333</td>\n", |
665 | 665 | " <td>1.0</td>\n", |
|
669 | 669 | " <td>income</td>\n", |
670 | 670 | " <td>numerical</td>\n", |
671 | 671 | " <td>1.0</td>\n", |
672 | | - " <td>0.936471</td>\n", |
| 672 | + " <td>0.498955</td>\n", |
673 | 673 | " <td>1.0</td>\n", |
674 | | - " <td>0.9036</td>\n", |
| 674 | + " <td>0.8468</td>\n", |
675 | 675 | " <td>N/A</td>\n", |
676 | | - " <td>0.755353</td>\n", |
| 676 | + " <td>0.912639</td>\n", |
677 | 677 | " <td>N/A</td>\n", |
678 | 678 | " <td>N/A</td>\n", |
679 | 679 | " </tr>\n", |
|
685 | 685 | " <td>N/A</td>\n", |
686 | 686 | " <td>N/A</td>\n", |
687 | 687 | " <td>N/A</td>\n", |
688 | | - " <td>0.9278</td>\n", |
| 688 | + " <td>0.9176</td>\n", |
689 | 689 | " <td>N/A</td>\n", |
690 | 690 | " <td>0.857143</td>\n", |
691 | 691 | " <td>1.0</td>\n", |
|
698 | 698 | " <td>N/A</td>\n", |
699 | 699 | " <td>N/A</td>\n", |
700 | 700 | " <td>N/A</td>\n", |
701 | | - " <td>0.9854</td>\n", |
| 701 | + " <td>0.9746</td>\n", |
702 | 702 | " <td>N/A</td>\n", |
703 | 703 | " <td>1.0</td>\n", |
704 | 704 | " <td>1.0</td>\n", |
|
710 | 710 | "text/plain": [ |
711 | 711 | " column type missing_value_similarity range_coverage \\\n", |
712 | 712 | "0 sex categorical 1.0 N/A \n", |
713 | | - "1 age numerical 1.0 0.934821 \n", |
| 713 | + "1 age numerical 1.0 0.885944 \n", |
714 | 714 | "2 marital categorical 1.0 N/A \n", |
715 | | - "3 income numerical 1.0 0.936471 \n", |
| 715 | + "3 income numerical 1.0 0.498955 \n", |
716 | 716 | "4 ls categorical 1.0 N/A \n", |
717 | 717 | "5 smoke categorical 1.0 N/A \n", |
718 | 718 | "\n", |
719 | 719 | " boundary_adherence ks_complement tv_complement statistic_similarity \\\n", |
720 | | - "0 N/A N/A 0.9364 N/A \n", |
721 | | - "1 1.0 0.9368 N/A 0.969487 \n", |
722 | | - "2 N/A N/A 0.9574 N/A \n", |
723 | | - "3 1.0 0.9036 N/A 0.755353 \n", |
724 | | - "4 N/A N/A 0.9278 N/A \n", |
725 | | - "5 N/A N/A 0.9854 N/A \n", |
| 720 | + "0 N/A N/A 0.9964 N/A \n", |
| 721 | + "1 1.0 0.9342 N/A 0.966491 \n", |
| 722 | + "2 N/A N/A 0.975 N/A \n", |
| 723 | + "3 1.0 0.8468 N/A 0.912639 \n", |
| 724 | + "4 N/A N/A 0.9176 N/A \n", |
| 725 | + "5 N/A N/A 0.9746 N/A \n", |
726 | 726 | "\n", |
727 | 727 | " category_coverage category_adherence \n", |
728 | 728 | "0 1.0 1.0 \n", |
|
757 | 757 | "output_type": "stream", |
758 | 758 | "text": [ |
759 | 759 | "=== Regression Efficacy Metrics ===\n", |
760 | | - "{'mse': 1669726.6979087007, 'mae': 904.2202005090558, 'r2': -0.19619130295207743}\n" |
| 760 | + "{'mse': 1455890.3266689673, 'mae': 810.365268015888, 'r2': -0.04299904229518581}\n" |
761 | 761 | ] |
762 | 762 | } |
763 | 763 | ], |
|
782 | 782 | "text": [ |
783 | 783 | "\n", |
784 | 784 | "=== Classification Efficacy Metrics ===\n", |
785 | | - "{'accuracy': 0.6058, 'f1_score': 0.6184739077074358}\n" |
| 785 | + "{'accuracy': 0.64, 'f1_score': 0.6461333333333333}\n" |
786 | 786 | ] |
787 | 787 | } |
788 | 788 | ], |
|
0 commit comments