@article{3220967, title = "Text mining and word embedding for classification of decision making variables in breast cancer surgery", author = "Catanuto, G. and Rocco, N. and Maglia, A. and Barry, P. and Karakatsanis, A. and Sgroi, G. and Russo, G. and Pappalardo, F. and Nava, M.B. and Heil, J. and Karakatsanis, A. and Weber, W.P. and Gonzalez, E. and Chatterjee, A. and Urban, C. and Sund, M. and Paulinelli, R.R. and Markopoulos, C. and Rubio, I.T. and Masannat, Y.A. and Meani, F. and Koppiker, C.B. and Holcombe, C. and Benson, J.R. and Dietz, J.R. and Walker, M. and Mátrai, Z. and Shaukat, A. and Gulluoglu, B. and Brenelli, F. and Fitzal, F. and Mele, M. and ETHOS Collaborative Group", journal = "European Journal of Surgical Oncology", year = "2022", publisher = "W.B. Saunders Ltd", issn = "0748-7983", doi = "10.1016/j.ejso.2022.03.002", abstract = "Introduction: Decision making in surgical oncology of the breast has increased its complexity over the last twenty years. This Delphi survey investigates the opinion of an expert panel about the decision making process in surgical procedures on the breast for oncological purposes. Methods: Twenty-seven experts were invited to partake into a Delphi Survey. At the first round they have been asked to provide a list of features involved in the decision making process (patient's characteristics; disease characteristics; surgical techniques, outcomes) and comment on it. Using text-mining techniques we extracted a list of mono-bi-trigrams potentially representative of decision drivers. A technique of “natural language processing” called Word2vec was used to validate changes to texts using synonyms and plesionyms. Word2Vec was also used to test the semantic relevance of n-grams within a corpus of knowledge made up of books edited by panel members. The final list of variables extracted was submitted to the judgement of the panel for final validation at the second round of the Delphi using closed ended questions. Results: 52 features out of 59 have been approved by the panel. The overall consensus was 87.1% Conclusions: Text mining and natural language processing allowed the extraction of a number of decision drivers and outcomes as part of the decision making process in surgical oncology on the breast. This result was obtained transforming narrative texts into structured data. The high level of consensus among experts provided validation to this process. © 2022 Elsevier Ltd, BASO ~ The Association for Cancer Surgery, and the European Society of Surgical Oncology" }