|
1 | 1 |
|
| 2 | +@article{song_decision_2015, |
| 3 | + title = {Decision tree methods: applications for classification and prediction}, |
| 4 | + volume = {27}, |
| 5 | + issn = {1002-0829}, |
| 6 | + url = {https://www.ncbi.nlm.nih.gov/pmc/articles/PMC4466856/}, |
| 7 | + doi = {10.11919/j.issn.1002-0829.215044}, |
| 8 | + shorttitle = {Decision tree methods}, |
| 9 | + abstract = {Decision tree methodology is a commonly used data mining method for establishing classification systems based on multiple covariates or for developing prediction algorithms for a target variable. This method classifies a population into branch-like segments that construct an inverted tree with a root node, internal nodes, and leaf nodes. The algorithm is non-parametric and can efficiently deal with large, complicated datasets without imposing a complicated parametric structure. When the sample size is large enough, study data can be divided into training and validation datasets. Using the training dataset to build a decision tree model and a validation dataset to decide on the appropriate tree size needed to achieve the optimal final model. This paper introduces frequently used algorithms used to develop decision trees (including {CART}, C4.5, {CHAID}, and {QUEST}) and describes the {SPSS} and {SAS} programs that can be used to visualize tree structure.}, |
| 10 | + pages = {130--135}, |
| 11 | + number = {2}, |
| 12 | + journaltitle = {Shanghai Archives of Psychiatry}, |
| 13 | + shortjournal = {Shanghai Arch Psychiatry}, |
| 14 | + author = {{SONG}, Yan-yan and {LU}, Ying}, |
| 15 | + urldate = {2023-12-17}, |
| 16 | + date = {2015-04-25}, |
| 17 | + pmid = {26120265}, |
| 18 | + pmcid = {PMC4466856}, |
| 19 | +} |
| 20 | + |
| 21 | +@book{rokach_data_2015, |
| 22 | + location = {Hackensack, New Jersey}, |
| 23 | + edition = {Second edition}, |
| 24 | + title = {Data mining with decision trees: theory and applications}, |
| 25 | + isbn = {978-981-4590-07-5}, |
| 26 | + shorttitle = {Data mining with decision trees}, |
| 27 | + pagetotal = {305}, |
| 28 | + publisher = {World Scientific}, |
| 29 | + author = {Rokach, Lior and Maimon, Oded}, |
| 30 | + date = {2015}, |
| 31 | + langid = {english}, |
| 32 | + keywords = {Data mining, Decision support systems, Decision trees, Machine learning}, |
| 33 | +} |
| 34 | + |
| 35 | +@collection{hofmann_rapidminer_2016, |
| 36 | + edition = {0}, |
| 37 | + title = {{RapidMiner}: Data Mining Use Cases and Business Analytics Applications}, |
| 38 | + isbn = {978-0-429-17109-3}, |
| 39 | + url = {https://www.taylorfrancis.com/books/9781482205503}, |
| 40 | + shorttitle = {{RapidMiner}}, |
| 41 | + publisher = {Chapman and Hall/{CRC}}, |
| 42 | + editor = {Hofmann, Markus and Klinkenberg, Ralf}, |
| 43 | + urldate = {2023-12-17}, |
| 44 | + date = {2016-04-19}, |
| 45 | + langid = {english}, |
| 46 | + doi = {10.1201/b16023}, |
| 47 | +} |
| 48 | + |
| 49 | +@online{noauthor_quest-ce_nodate, |
| 50 | + title = {Qu'est-ce que le boosting ? – Le boosting dans le cadre du machine learning expliqué – {AWS}}, |
| 51 | + url = {https://aws.amazon.com/fr/what-is/boosting/}, |
| 52 | + shorttitle = {Qu'est-ce que le boosting ?}, |
| 53 | + abstract = {Découvrez ce qu'est le boosting, comment il fonctionne avec l'{IA}/le {ML} et comment utiliser le boosting dans le cadre du machine learning sur {AWS}.}, |
| 54 | + titleaddon = {Amazon Web Services, Inc.}, |
| 55 | + urldate = {2023-12-17}, |
| 56 | + langid = {french}, |
| 57 | +} |
| 58 | + |
| 59 | +@article{haixiang_learning_2017, |
| 60 | + title = {Learning from class-imbalanced data: Review of methods and applications}, |
| 61 | + volume = {73}, |
| 62 | + issn = {0957-4174}, |
| 63 | + url = {https://www.sciencedirect.com/science/article/pii/S0957417416307175}, |
| 64 | + doi = {10.1016/j.eswa.2016.12.035}, |
| 65 | + shorttitle = {Learning from class-imbalanced data}, |
| 66 | + abstract = {Rare events, especially those that could potentially negatively impact society, often require humans’ decision-making responses. Detecting rare events can be viewed as a prediction task in data mining and machine learning communities. As these events are rarely observed in daily life, the prediction task suffers from a lack of balanced data. In this paper, we provide an in depth review of rare event detection from an imbalanced learning perspective. Five hundred and seventeen related papers that have been published in the past decade were collected for the study. The initial statistics suggested that rare events detection and imbalanced learning are concerned across a wide range of research areas from management science to engineering. We reviewed all collected papers from both a technical and a practical point of view. Modeling methods discussed include techniques such as data preprocessing, classification algorithms and model evaluation. For applications, we first provide a comprehensive taxonomy of the existing application domains of imbalanced learning, and then we detail the applications for each category. Finally, some suggestions from the reviewed papers are incorporated with our experiences and judgments to offer further research directions for the imbalanced learning and rare event detection fields.}, |
| 67 | + pages = {220--239}, |
| 68 | + journaltitle = {Expert Systems with Applications}, |
| 69 | + shortjournal = {Expert Systems with Applications}, |
| 70 | + author = {Haixiang, Guo and Yijing, Li and Shang, Jennifer and Mingyun, Gu and Yuanyue, Huang and Bing, Gong}, |
| 71 | + urldate = {2023-12-17}, |
| 72 | + date = {2017-05-01}, |
| 73 | + keywords = {Data mining, Imbalanced data, Machine learning, Rare events}, |
| 74 | +} |
| 75 | + |
| 76 | +@article{galar_review_2012, |
| 77 | + title = {A Review on Ensembles for the Class Imbalance Problem: Bagging-, Boosting-, and Hybrid-Based Approaches}, |
| 78 | + volume = {42}, |
| 79 | + issn = {1558-2442}, |
| 80 | + url = {https://ieeexplore.ieee.org/document/5978225}, |
| 81 | + doi = {10.1109/TSMCC.2011.2161285}, |
| 82 | + shorttitle = {A Review on Ensembles for the Class Imbalance Problem}, |
| 83 | + abstract = {Classifier learning with data-sets that suffer from imbalanced class distributions is a challenging problem in data mining community. This issue occurs when the number of examples that represent one class is much lower than the ones of the other classes. Its presence in many real-world applications has brought along a growth of attention from researchers. In machine learning, the ensemble of classifiers are known to increase the accuracy of single classifiers by combining several of them, but neither of these learning techniques alone solve the class imbalance problem, to deal with this issue the ensemble learning algorithms have to be designed specifically. In this paper, our aim is to review the state of the art on ensemble techniques in the framework of imbalanced data-sets, with focus on two-class problems. We propose a taxonomy for ensemble-based methods to address the class imbalance where each proposal can be categorized depending on the inner ensemble methodology in which it is based. In addition, we develop a thorough empirical comparison by the consideration of the most significant published approaches, within the families of the taxonomy proposed, to show whether any of them makes a difference. This comparison has shown the good behavior of the simplest approaches which combine random undersampling techniques with bagging or boosting ensembles. In addition, the positive synergy between sampling techniques and bagging has stood out. Furthermore, our results show empirically that ensemble-based algorithms are worthwhile since they outperform the mere use of preprocessing techniques before learning the classifier, therefore justifying the increase of complexity by means of a significant enhancement of the results.}, |
| 84 | + pages = {463--484}, |
| 85 | + number = {4}, |
| 86 | + journaltitle = {{IEEE} Transactions on Systems, Man, and Cybernetics, Part C (Applications and Reviews)}, |
| 87 | + author = {Galar, Mikel and Fernandez, Alberto and Barrenechea, Edurne and Bustince, Humberto and Herrera, Francisco}, |
| 88 | + urldate = {2023-12-17}, |
| 89 | + date = {2012-07}, |
| 90 | + note = {Conference Name: {IEEE} Transactions on Systems, Man, and Cybernetics, Part C (Applications and Reviews)}, |
| 91 | +} |
| 92 | + |
2 | 93 | @book{durkheim_suicide_1951, |
3 | 94 | title = {Suicide, a Study in Sociology}, |
4 | 95 | isbn = {978-0-02-908660-5}, |
|
0 commit comments