@article {1532, title = {Mobility Constraints in Segregation Models}, journal = {Scientific Reports}, volume = {13}, year = {2023}, pages = {12087}, abstract = {Since the development of the original Schelling model of urban segregation, several enhancements have been proposed, but none have considered the impact of mobility constraints on model dynamics. Recent studies have shown that human mobility follows specific patterns, such as a preference for short distances and dense locations. This paper proposes a segregation model incorporating mobility constraints to make agents select their location based on distance and location relevance. Our findings indicate that the mobility-constrained model produces lower segregation levels but takes longer to converge than the original Schelling model. We identified a few persistently unhappy agents from the minority group who cause this prolonged convergence time and lower segregation level as they move around the grid centre. Our study presents a more realistic representation of how agents move in urban areas and provides a novel and insightful approach to analyzing the impact of mobility constraints on segregation models. We highlight the significance of incorporating mobility constraints when policymakers design interventions to address urban segregation.}, doi = {10.1038/s41598-023-38519-6}, author = {Daniele Gambetta and Giovanni Mauro and Luca Pappalardo} } @conference {1493, title = {Connected Vehicle Simulation Framework for Parking Occupancy Prediction (Demo Paper)}, booktitle = {Proceedings of the 30th International Conference on Advances in Geographic Information Systems}, year = {2022}, publisher = {Association for Computing Machinery}, organization = {Association for Computing Machinery}, address = {New York, NY, USA}, abstract = {This paper demonstrates a simulation framework that collects data about connected vehicles{\textquoteright} locations and surroundings in a realistic traffic scenario. Our focus lies on the capability to detect parking spots and their occupancy status. We use this data to train machine learning models that predict parking occupancy levels of specific areas in the city center of San Francisco. By comparing their performance to a given ground truth, our results show that it is possible to use simulated connected vehicle data as a base for prototyping meaningful AI-based applications.}, isbn = {9781450395298}, doi = {10.1145/3557915.3560995}, url = {https://doi.org/10.1145/3557915.3560995}, author = {Resce, Pierpaolo and Vorwerk, Lukas and Han, Zhiwei and Cornacchia, Giuliano and Alamdari, Omid Isfahani and Mirco Nanni and Luca Pappalardo and Weimer, Daniel and Liu, Yuanting} } @article {1531, title = {Generating mobility networks with generative adversarial networks}, journal = {EPJ data science}, volume = {11}, number = {1}, year = {2022}, pages = {58}, abstract = {The increasingly crucial role of human displacements in complex societal phenomena, such as traffic congestion, segregation, and the diffusion of epidemics, is attracting the interest of scientists from several disciplines. In this article, we address mobility network generation, i.e., generating a city{\textquoteright}s entire mobility network, a weighted directed graph in which nodes are geographic locations and weighted edges represent people{\textquoteright}s movements between those locations, thus describing the entire mobility set flows within a city. Our solution is MoGAN, a model based on Generative Adversarial Networks (GANs) to generate realistic mobility networks. We conduct extensive experiments on public datasets of bike and taxi rides to show that MoGAN outperforms the classical Gravity and Radiation models regarding the realism of the generated networks. Our model can be used for data augmentation and performing simulations and what-if analysis.}, doi = {https://doi.org/10.1140/epjds/s13688-022-00372-4}, author = {Giovanni Mauro and Luca, Massimiliano and Longa, Antonio and Lepri, Bruno and Luca Pappalardo} } @conference {1492, title = {How Routing Strategies Impact Urban Emissions}, booktitle = {Proceedings of the 30th International Conference on Advances in Geographic Information Systems}, year = {2022}, publisher = {Association for Computing Machinery}, organization = {Association for Computing Machinery}, address = {New York, NY, USA}, abstract = {Navigation apps use routing algorithms to suggest the best path to reach a user{\textquoteright}s desired destination. Although undoubtedly useful, navigation apps{\textquoteright} impact on the urban environment (e.g., CO2 emissions and pollution) is still largely unclear. In this work, we design a simulation framework to assess the impact of routing algorithms on carbon dioxide emissions within an urban environment. Using APIs from TomTom and OpenStreetMap, we find that settings in which either all vehicles or none of them follow a navigation app{\textquoteright}s suggestion lead to the worst impact in terms of CO2 emissions. In contrast, when just a portion (around half) of vehicles follow these suggestions, and some degree of randomness is added to the remaining vehicles{\textquoteright} paths, we observe a reduction in the overall CO2 emissions over the road network. Our work is a first step towards designing next-generation routing principles that may increase urban well-being while satisfying individual needs.}, isbn = {9781450395298}, doi = {10.1145/3557915.3560977}, url = {https://doi.org/10.1145/3557915.3560977}, author = {Cornacchia, Giuliano and B{\"o}hm, Matteo and Giovanni Mauro and Mirco Nanni and Dino Pedreschi and Luca Pappalardo} } @article {1470, title = {Explaining the difference between men{\textquoteright}s and women{\textquoteright}s football}, journal = {PLOS ONE}, volume = {16}, year = {2021}, month = {Apr-08-2021}, pages = {e0255407}, abstract = {Women{\textquoteright}s football is gaining supporters and practitioners worldwide, raising questions about what the differences are with men{\textquoteright}s football. While the two sports are often compared based on the players{\textquoteright} physical attributes, we analyze the spatio-temporal events during matches in the last World Cups to compare male and female teams based on their technical performance. We train an artificial intelligence model to recognize if a team is male or female based on variables that describe a match{\textquoteright}s playing intensity, accuracy, and performance quality. Our model accurately distinguishes between men{\textquoteright}s and women{\textquoteright}s football, revealing crucial technical differences, which we investigate through the extraction of explanations from the classifier{\textquoteright}s decisions. The differences between men{\textquoteright}s and women{\textquoteright}s football are rooted in play accuracy, the recovery time of ball possession, and the players{\textquoteright} performance quality. Our methodology may help journalists and fans understand what makes women{\textquoteright}s football a distinct sport and coaches design tactics tailored to female teams.}, doi = {https://doi.org/10.1371/journal.pone.0255407}, url = {https://journals.plos.org/plosone/article?id=10.1371/journal.pone.0255407}, author = {Luca Pappalardo and Alessio Rossi and Michela Natilli and Paolo Cintia}, editor = {Constantinou, Anthony C.} } @article {1435, title = {Introduction to the special issue on social mining and big data ecosystem for open, responsible data science}, year = {2021}, month = {2021/03/05}, isbn = {2364-4168}, doi = {https://link.springer.com/article/10.1007/s41060-021-00253-5}, url = {https://doi.org/10.1007/s41060-021-00253-5}, author = {Luca Pappalardo and Grossi, Valerio and Dino Pedreschi} } @article {1463, title = {A Mechanistic Data-Driven Approach to Synthesize Human Mobility Considering the Spatial, Temporal, and Social Dimensions Together}, journal = {ISPRS International Journal of Geo-Information}, volume = {10}, number = {9}, year = {2021}, pages = {599}, abstract = {Modelling human mobility is crucial in several areas, from urban planning to epidemic modelling, traffic forecasting, and what-if analysis. Existing generative models focus mainly on reproducing the spatial and temporal dimensions of human mobility, while the social aspect, though it influences human movements significantly, is often neglected. Those models that capture some social perspectives of human mobility utilize trivial and unrealistic spatial and temporal mechanisms. In this paper, we propose the Spatial, Temporal and Social Exploration and Preferential Return model (STS-EPR), which embeds mechanisms to capture the spatial, temporal, and social aspects together. We compare the trajectories produced by STS-EPR with respect to real-world trajectories and synthetic trajectories generated by two state-of-the-art generative models on a set of standard mobility measures. Our experiments conducted on an open dataset show that STS-EPR, overall, outperforms existing spatial-temporal or social models demonstrating the importance of modelling adequately the sociality to capture precisely all the other dimensions of human mobility. We further investigate the impact of the tile shape of the spatial tessellation on the performance of our model. STS-EPR, which is open-source and tested on open data, represents a step towards the design of a mechanistic data-driven model that captures all the aspects of human mobility comprehensively.}, issn = {2220-9964}, doi = {10.3390/ijgi10090599}, url = {https://www.mdpi.com/2220-9964/10/9/599}, author = {Cornacchia, Giuliano and Luca Pappalardo} } @article {1449, title = {STS-EPR: Modelling individual mobility considering the spatial, temporal, and social dimensions together}, year = {2021}, month = {05}, doi = {10.1016/j.procs.2021.03.035}, author = {Cornacchia, Giuliano and Luca Pappalardo} } @conference {1420, title = {Estimating countries{\textquoteright} peace index through the lens of the world news as monitored by GDELT}, booktitle = {2020 IEEE 7th International Conference on Data Science and Advanced Analytics (DSAA)2020 IEEE 7th International Conference on Data Science and Advanced Analytics (DSAA)}, year = {2020}, month = {2020}, abstract = {Peacefulness is a principal dimension of well-being, and its measurement has lately drawn the attention of researchers and policy-makers. During the last years, novel digital data streams have drastically changed research in this field. In the current study, we exploit information extracted from Global Data on Events, Location, and Tone (GDELT) digital news database, to capture peacefulness through the Global Peace Index (GPI). Applying machine learning techniques, we demonstrate that news media attention, sentiment, and social stability from GDELT can be used as proxies for measuring GPI at a monthly level. Additionally, through the variable importance analysis, we show that each country{\textquoteright}s socio-economic, political, and military profile emerges. This could bring added value to researchers interested in "Data Science for Social Good", to policy-makers, and peacekeeping organizations since they could monitor peacefulness almost real-time, and therefore facilitate timely and more efficient policy-making. }, doi = {https://doi.org/10.1109/DSAA49011.2020.00034}, url = {https://ieeexplore.ieee.org/abstract/document/9260052}, author = {V. Voukelatou and Luca Pappalardo and Lorenzo Gabrielli and Fosca Giannotti} } @article {1404, title = {Human migration: the big data perspective}, journal = {International Journal of Data Science and Analytics}, year = {2020}, month = {2020/03/23}, pages = {1{\textendash}20}, abstract = {How can big data help to understand the migration phenomenon? In this paper, we try to answer this question through an analysis of various phases of migration, comparing traditional and novel data sources and models at each phase. We concentrate on three phases of migration, at each phase describing the state of the art and recent developments and ideas. The first phase includes the journey, and we study migration flows and stocks, providing examples where big data can have an impact. The second phase discusses the stay, i.e. migrant integration in the destination country. We explore various data sets and models that can be used to quantify and understand migrant integration, with the final aim of providing the basis for the construction of a novel multi-level integration index. The last phase is related to the effects of migration on the source countries and the return of migrants.}, isbn = {2364-4168}, doi = {https://doi.org/10.1007/s41060-020-00213-5}, url = {https://link.springer.com/article/10.1007\%2Fs41060-020-00213-5}, author = {Alina Sirbu and Andrienko, Gennady and Andrienko, Natalia and Boldrini, Chiara and Conti, Marco and Fosca Giannotti and Riccardo Guidotti and Bertoli, Simone and Jisu Kim and Muntean, Cristina Ioana and Luca Pappalardo and Passarella, Andrea and Dino Pedreschi and Pollacci, Laura and Francesca Pratesi and Sharma, Rajesh} } @booklet {1425, title = {Mobile phone data analytics against the COVID-19 epidemics in Italy: flow diversity and local job markets during the national lockdown}, year = {2020}, abstract = {Understanding collective mobility patterns is crucial to plan the restart of production and economic activities, which are currently put in stand-by to fight the diffusion of the epidemics. In this report, we use mobile phone data to infer the movements of people between Italian provinces and municipalities, and we analyze the incoming, outcoming and internal mobility flows before and during the national lockdown (March 9th, 2020) and after the closure of non-necessary productive and economic activities (March 23th, 2020). The population flow across provinces and municipalities enable for the modelling of a risk index tailored for the mobility of each municipality or province. Such an index would be a useful indicator to drive counter-measures in reaction to a sudden reactivation of the epidemics. Mobile phone data, even when aggregated to preserve the privacy of individuals, are a useful data source to track the evolution in time of human mobility, hence allowing for monitoring the effectiveness of control measures such as physical distancing. We address the following analytical questions: How does the mobility structure of a territory change? Do incoming and outcoming flows become more predictable during the lockdown, and what are the differences between weekdays and weekends? Can we detect proper local job markets based on human mobility flows, to eventually shape the borders of a local outbreak?}, doi = {https://dx.doi.org/10.32079/ISTI-TR-2020/005}, url = {https://arxiv.org/abs/2004.11278}, author = {Pietro Bonato and Paolo Cintia and Francesco Fabbri and Daniele Fadda and Fosca Giannotti and Pier Luigi Lopalco and Sara Mazzilli and Mirco Nanni and Luca Pappalardo and Dino Pedreschi and Francesco Penone and S Rinzivillo and Giulio Rossetti and Marcello Savarese and Lara Tavoschi} } @article {1410, title = {Modeling Adversarial Behavior Against Mobility Data Privacy}, journal = {IEEE Transactions on Intelligent Transportation SystemsIEEE Transactions on Intelligent Transportation Systems}, year = {2020}, month = {2020}, pages = {1 - 14}, abstract = {Privacy risk assessment is a crucial issue in any privacy-aware analysis process. Traditional frameworks for privacy risk assessment systematically generate the assumed knowledge for a potential adversary, evaluating the risk without realistically modelling the collection of the background knowledge used by the adversary when performing the attack. In this work, we propose Simulated Privacy Annealing (SPA), a new adversarial behavior model for privacy risk assessment in mobility data. We model the behavior of an adversary as a mobility trajectory and introduce an optimization approach to find the most effective adversary trajectory in terms of privacy risk produced for the individuals represented in a mobility data set. We use simulated annealing to optimize the movement of the adversary and simulate a possible attack on mobility data. We finally test the effectiveness of our approach on real human mobility data, showing that it can simulate the knowledge gathering process for an adversary in a more realistic way.}, isbn = {1558-0016}, doi = {https://doi.org/10.1109/TITS.2020.3021911}, url = {https://ieeexplore.ieee.org/abstract/document/9199893}, author = {Roberto Pellungrini and Luca Pappalardo and F. Simini and Anna Monreale} } @article {1368, title = {Modelling Human Mobility considering Spatial, Temporal and Social Dimensions}, journal = {arXiv preprint arXiv:2007.02371}, year = {2020}, author = {Cornacchia, Giuliano and Giulio Rossetti and Luca Pappalardo} } @article {1339, title = {The relationship between human mobility and viral transmissibility during the COVID-19 epidemics in Italy}, journal = {arXiv preprint arXiv:2006.03141}, year = {2020}, abstract = {We describe in this report our studies to understand the relationship between human mobility and the spreading of COVID-19, as an aid to manage the restart of the social and economic activities after the lockdown and monitor the epidemics in the coming weeks and months. We compare the evolution (from January to May 2020) of the daily mobility flows in Italy, measured by means of nation-wide mobile phone data, and the evolution of transmissibility, measured by the net reproduction number, i.e., the mean number of secondary infections generated by one primary infector in the presence of control interventions and human behavioural adaptations. We find a striking relationship between the negative variation of mobility flows and the net reproduction number, in all Italian regions, between March 11th and March 18th, when the country entered the lockdown. This observation allows us to quantify the time needed to "switch off" the country mobility (one week) and the time required to bring the net reproduction number below 1 (one week). A reasonably simple regression model provides evidence that the net reproduction number is correlated with a region{\textquoteright}s incoming, outgoing and internal mobility. We also find a strong relationship between the number of days above the epidemic threshold before the mobility flows reduce significantly as an effect of lockdowns, and the total number of confirmed SARS-CoV-2 infections per 100k inhabitants, thus indirectly showing the effectiveness of the lockdown and the other non-pharmaceutical interventions in the containment of the contagion. Our study demonstrates the value of "big" mobility data to the monitoring of key epidemic indicators to inform choices as the epidemics unfolds in the coming months.}, url = {https://arxiv.org/abs/2006.03141}, author = {Paolo Cintia and Daniele Fadda and Fosca Giannotti and Luca Pappalardo and Giulio Rossetti and Dino Pedreschi and S Rinzivillo and Bonato, Pietro and Fabbri, Francesco and Penone, Francesco and Savarese, Marcello and Checchi, Daniele and Chiaromonte, Francesca and Vineis , Paolo and Guzzetta, Giorgio and Riccardo, Flavia and Marziano, Valentina and Poletti, Piero and Trentini, Filippo and Bella, Antonio and Andrianou, Xanthi and Del Manso, Martina and Fabiani, Massimo and Bellino, Stefania and Boros, Stefano and Mateo Urdiales, Alberto and Vescio, Maria Fenicia and Brusaferro, Silvio and Rezza, Giovanni and Pezzotti, Patrizio and Ajelli, Marco and Merler, Stefano} } @article {1265, title = {Defining Geographic Markets from Probabilistic Clusters: A Machine Learning Algorithm Applied to Supermarket Scanner Data}, journal = {Available at SSRN 3452058}, year = {2019}, author = {Bruestle, Stephen and Luca Pappalardo and Riccardo Guidotti} } @conference {1195, title = {Human Mobility from theory to practice: Data, Models and Applications}, booktitle = {Companion of The 2019 World Wide Web Conference, WWW 2019, San Francisco, CA, USA, May 13-17, 2019.}, year = {2019}, abstract = {The inclusion of tracking technologies in personal devices opened the doors to the analysis of large sets of mobility data like GPS traces and call detail records. This tutorial presents an overview of both modeling principles of human mobility and machine learning models applicable to specific problems. We review the state of the art of five main aspects in human mobility: (1) human mobility data landscape; (2) key measures of individual and collective mobility; (3) generative models at the level of individual, population and mixture of the two; (4) next location prediction algorithms; (5) applications for social good. For each aspect, we show experiments and simulations using the Python library {\textquotedblright}scikit-mobility{\textquotedblright} developed by the presenters of the tutorial.}, doi = {10.1145/3308560.3320099}, url = {https://doi.org/10.1145/3308560.3320099}, author = {Luca Pappalardo and Gianni Barlacchi and Roberto Pellungrini and Filippo Simini} } @article {1294, title = {PlayeRank: data-driven performance evaluation and player ranking in soccer via a machine learning approach}, journal = {ACM Transactions on Intelligent Systems and Technology (TIST)}, volume = {10}, number = {5}, year = {2019}, pages = {1{\textendash}27}, abstract = {The problem of evaluating the performance of soccer players is attracting the interest of many companies and the scientific community, thanks to the availability of massive data capturing all the events generated during a match (e.g., tackles, passes, shots, etc.). Unfortunately, there is no consolidated and widely accepted metric for measuring performance quality in all of its facets. In this article, we design and implement PlayeRank, a data-driven framework that offers a principled multi-dimensional and role-aware evaluation of the performance of soccer players. We build our framework by deploying a massive dataset of soccer-logs and consisting of millions of match events pertaining to four seasons of 18 prominent soccer competitions. By comparing PlayeRank to known algorithms for performance evaluation in soccer, and by exploiting a dataset of players{\textquoteright} evaluations made by professional soccer scouts, we show that PlayeRank significantly outperforms the competitors. We also explore the ratings produced by PlayeRank and discover interesting patterns about the nature of excellent performances and what distinguishes the top players from the others. At the end, we explore some applications of PlayeRank{\textemdash}i.e. searching players and player versatility{\textemdash}showing its flexibility and efficiency, which makes it worth to be used in the design of a scalable platform for soccer analytics.}, doi = {10.1145/3343172}, url = {https://dl.acm.org/doi/abs/10.1145/3343172}, author = {Luca Pappalardo and Paolo Cintia and Ferragina, Paolo and Massucco, Emanuele and Dino Pedreschi and Fosca Giannotti} } @article {1266, title = {A public data set of spatio-temporal match events in soccer competitions}, journal = {Scientific data}, volume = {6}, number = {1}, year = {2019}, pages = {1{\textendash}15}, abstract = {Soccer analytics is attracting increasing interest in academia and industry, thanks to the availability of sensing technologies that provide high-fidelity data streams for every match. Unfortunately, these detailed data are owned by specialized companies and hence are rarely publicly available for scientific research. To fill this gap, this paper describes the largest open collection of soccer-logs ever released, containing all the spatio-temporal events (passes, shots, fouls, etc.) that occured during each match for an entire season of seven prominent soccer competitions. Each match event contains information about its position, time, outcome, player and characteristics. The nature of team sports like soccer, halfway between the abstraction of a game and the reality of complex social systems, combined with the unique size and composition of this dataset, provide an ideal ground for tackling a wide range of data science problems, including the measurement and evaluation of performance, both at individual and at collective level, and the determinants of success and failure.}, doi = {10.1038/s41597-019-0247-7}, url = {https://www.nature.com/articles/s41597-019-0247-7}, author = {Luca Pappalardo and Paolo Cintia and Alessio Rossi and Massucco, Emanuele and Ferragina, Paolo and Dino Pedreschi and Fosca Giannotti} } @article {1295, title = {Relationship between External and Internal Workloads in Elite Soccer Players: Comparison between Rate of Perceived Exertion and Training Load}, journal = {Applied Sciences}, volume = {9}, number = {23}, year = {2019}, pages = {5174}, abstract = {The use of machine learning (ML) in soccer allows for the management of a large amount of data deriving from the monitoring of sessions and matches. Although the rate of perceived exertion (RPE), training load (S-RPE), and global position system (GPS) are standard methodologies used in team sports to assess the internal and external workload; how the external workload affects RPE and S-RPE remains still unclear. This study explores the relationship between both RPE and S-RPE and the training workload through ML. Data were recorded from 22 elite soccer players, in 160 training sessions and 35 matches during the 2015/2016 season, by using GPS tracking technology. A feature selection process was applied to understand which workload features influence RPE and S-RPE the most. Our results show that the training workloads performed in the previous week have a strong effect on perceived exertion and training load. On the other hand, the analysis of our predictions shows higher accuracy for medium RPE and S-RPE values compared with the extremes. These results provide further evidence of the usefulness of ML as a support to athletic trainers and coaches in understanding the relationship between training load and individual-response in team sports.}, doi = {10.3390/app9235174}, url = {https://www.mdpi.com/2076-3417/9/23/5174/htm}, author = {Alessio Rossi and Perri, Enrico and Luca Pappalardo and Paolo Cintia and Iaia, F Marcello} } @conference {1197, title = {Analyzing Privacy Risk in Human Mobility Data}, booktitle = {Software Technologies: Applications and Foundations - STAF 2018 Collocated Workshops, Toulouse, France, June 25-29, 2018, Revised Selected Papers}, year = {2018}, abstract = {Mobility data are of fundamental importance for understanding the patterns of human movements, developing analytical services and modeling human dynamics. Unfortunately, mobility data also contain individual sensitive information, making it necessary an accurate privacy risk assessment for the individuals involved. In this paper, we propose a methodology for assessing privacy risk in human mobility data. Given a set of individual and collective mobility features, we define the minimum data format necessary for the computation of each feature and we define a set of possible attacks on these data formats. We perform experiments computing the empirical risk in a real-world mobility dataset, and show how the distributions of the considered mobility features are affected by the removal of individuals with different levels of privacy risk.}, doi = {10.1007/978-3-030-04771-9_10}, url = {https://doi.org/10.1007/978-3-030-04771-9_10}, author = {Roberto Pellungrini and Luca Pappalardo and Francesca Pratesi and Anna Monreale} } @article {1086, title = {Effective injury forecasting in soccer with GPS training data and machine learning}, journal = {PloS one}, volume = {13}, number = {7}, year = {2018}, pages = {e0201264}, abstract = {Injuries have a great impact on professional soccer, due to their large influence on team performance and the considerable costs of rehabilitation for players. Existing studies in the literature provide just a preliminary understanding of which factors mostly affect injury risk, while an evaluation of the potential of statistical models in forecasting injuries is still missing. In this paper, we propose a multi-dimensional approach to injury forecasting in professional soccer that is based on GPS measurements and machine learning. By using GPS tracking technology, we collect data describing the training workload of players in a professional soccer club during a season. We then construct an injury forecaster and show that it is both accurate and interpretable by providing a set of case studies of interest to soccer practitioners. Our approach opens a novel perspective on injury prevention, providing a set of simple and practical rules for evaluating and interpreting the complex relations between injury risk and training performance in professional soccer.}, doi = {https://doi.org/10.1371/journal.pone.0201264}, url = {https://journals.plos.org/plosone/article?id=10.1371/journal.pone.0201264}, author = {Alessio Rossi and Luca Pappalardo and Paolo Cintia and Iaia, F Marcello and Fern{\`a}ndez, Javier and Medina, Daniel} } @conference {1269, title = {Exploring Students Eating Habits Through Individual Profiling and Clustering Analysis}, booktitle = {ECML PKDD 2018 Workshops}, year = {2018}, publisher = {Springer}, organization = {Springer}, author = {Michela Natilli and Anna Monreale and Riccardo Guidotti and Luca Pappalardo} } @article {1194, title = {Gastroesophageal reflux symptoms among Italian university students: epidemiology and dietary correlates using automatically recorded transactions}, journal = {BMC gastroenterology}, volume = {18}, number = {1}, year = {2018}, pages = {116}, abstract = {Background: Gastroesophageal reflux disease (GERD) is one of the most common gastrointestinal disorders worldwide, with relevant impact on the quality of life and health care costs.The aim of our study is to assess the prevalence of GERD based on self-reported symptoms among university students in central Italy. The secondary aim is to evaluate lifestyle correlates, particularly eating habits, in GERD students using automatically recorded transactions through cashiers at university canteen. Methods: A web-survey was created and launched through an app, ad-hoc developed for an interactive exchange of information with students, including anthropometric data and lifestyle habits. Moreover, the web-survey allowed users a self-diagnosis of GERD through a simple questionnaire. As regard eating habits, detailed collection of meals consumed, including number and type of dishes, were automatically recorded through cashiers at the university canteen equipped with an automatic registration system. Results: We collected 3012 questionnaires. A total of 792 students (26.2\% of the respondents) reported typical GERD symptoms occurring at least weekly. Female sex was more prevalent than male sex. In the set of students with GERD, the percentage of smokers was higher, and our results showed that when BMI tends to higher values the percentage of students with GERD tends to increase. When evaluating correlates with diet, we found, among all users, a lower frequency of legumes choice in GERD students and, among frequent users, a lower frequency of choice of pasta and rice in GERD students. Discussion: The results of our study are in line with the values reported in the literature. Nowadays, GERD is a common problem in our communities, and can potentially lead to serious medical complications; the economic burden involved in the diagnostic and therapeutic management of the disease has a relevant impact on healthcare costs. Conclusions: To our knowledge, this is the first study evaluating the prevalence of typical GERD{\textendash}related symptoms in a young population of University students in Italy. Considering the young age of enrolled subjects, our prevalence rate, relatively high compared to the usual estimates, could represent a further negative factor for the future economic sustainability of the healthcare system. Keywords: Gastroesophageal reflux disease, GERD, Heartburn, Regurgitation, Diet, Prevalence, University students}, doi = {10.1186/s12876-018-0832-9}, url = {https://bmcgastroenterol.biomedcentral.com/articles/10.1186/s12876-018-0832-9}, author = {Martinucci, Irene and Michela Natilli and Lorenzoni, Valentina and Luca Pappalardo and Anna Monreale and Turchetti, Giuseppe and Dino Pedreschi and Marchi, Santino and Barale, Roberto and de Bortoli, Nicola} } @article {1193, title = {Gravity and scaling laws of city to city migration}, journal = {PLOS ONE}, volume = {13}, number = {7}, year = {2018}, month = {07}, pages = {1-19}, abstract = {Models of human migration provide powerful tools to forecast the flow of migrants, measure the impact of a policy, determine the cost of physical and political frictions and more. Here, we analyse the migration of individuals from and to cities in the US, finding that city to city migration follows scaling laws, so that the city size is a significant factor in determining whether, or not, an individual decides to migrate and the city size of both the origin and destination play key roles in the selection of the destination. We observe that individuals from small cities tend to migrate more frequently, tending to move to similar-sized cities, whereas individuals from large cities do not migrate so often, but when they do, they tend to move to other large cities. Building upon these findings we develop a scaling model which describes internal migration as a two-step decision process, demonstrating that it can partially explain migration fluxes based solely on city size. We then consider the impact of distance and construct a gravity-scaling model by combining the observed scaling patterns with the gravity law of migration. Results show that the scaling laws are a significant feature of human migration and that the inclusion of scaling can overcome the limits of the gravity and the radiation models of human migration.}, doi = {10.1371/journal.pone.0199892}, url = {https://doi.org/10.1371/journal.pone.0199892}, author = {Prieto Curiel, Rafael and Luca Pappalardo and Lorenzo Gabrielli and Bishop, Steven Richard} } @inbook {1422, title = {How Data Mining and Machine Learning Evolved from Relational Data Base to Data Science}, booktitle = {A Comprehensive Guide Through the Italian Database Research Over the Last 25 Years}, year = {2018}, pages = {287 - 306}, publisher = {Springer International Publishing}, organization = {Springer International Publishing}, address = {Cham}, abstract = {During the last 35 years, data management principles such as physical and logical independence, declarative querying and cost-based optimization have led to profound pervasiveness of relational databases in any kind of organization. More importantly, these technical advances have enabled the first round of business intelligence applications and laid the foundation for managing and analyzing Big Data today.}, isbn = {978-3-319-61893-7}, doi = {https://doi.org/10.1007/978-3-319-61893-7_17}, url = {https://link.springer.com/chapter/10.1007\%2F978-3-319-61893-7_17}, author = {Amato, G. and Candela, L. and Castelli, D. and Esuli, A. and Falchi, F. and Gennaro, C. and Fosca Giannotti and Anna Monreale and Mirco Nanni and Pagano, P. and Luca Pappalardo and Dino Pedreschi and Francesca Pratesi and Rabitti, F. and S Rinzivillo and Giulio Rossetti and Salvatore Ruggieri and Sebastiani, F. and Tesconi, M.}, editor = {Flesca, Sergio and Greco, Sergio and Masciari, Elio and Sacc{\`a}, Domenico} } @article {1132, title = {Open the Black Box Data-Driven Explanation of Black Box Decision Systems}, year = {2018}, author = {Dino Pedreschi and Fosca Giannotti and Riccardo Guidotti and Anna Monreale and Luca Pappalardo and Salvatore Ruggieri and Franco Turini} } @article {1134, title = {Personalized Market Basket Prediction with Temporal Annotated Recurring Sequences}, journal = {IEEE Transactions on Knowledge and Data Engineering}, year = {2018}, abstract = {Nowadays, a hot challenge for supermarket chains is to offer personalized services to their customers. Market basket prediction, i.e., supplying the customer a shopping list for the next purchase according to her current needs, is one of these services. Current approaches are not capable of capturing at the same time the different factors influencing the customer{\textquoteright}s decision process: co-occurrence, sequentuality, periodicity and recurrency of the purchased items. To this aim, we define a pattern Temporal Annotated Recurring Sequence (TARS) able to capture simultaneously and adaptively all these factors. We define the method to extract TARS and develop a predictor for next basket named TBP (TARS Based Predictor) that, on top of TARS, is able to understand the level of the customer{\textquoteright}s stocks and recommend the set of most necessary items. By adopting the TBP the supermarket chains could crop tailored suggestions for each individual customer which in turn could effectively speed up their shopping sessions. A deep experimentation shows that TARS are able to explain the customer purchase behavior, and that TBP outperforms the state-of-the-art competitors.}, doi = {10.1109/TKDE.2018.2872587}, url = {https://ieeexplore.ieee.org/abstract/document/8477157}, author = {Riccardo Guidotti and Giulio Rossetti and Luca Pappalardo and Fosca Giannotti and Dino Pedreschi} } @conference {1291, title = {Weak nodes detection in urban transport systems: Planning for resilience in Singapore}, booktitle = {2018 IEEE 5th international conference on data science and advanced analytics (DSAA)}, year = {2018}, publisher = {IEEE}, organization = {IEEE}, abstract = {The availability of massive data-sets describing human mobility offers the possibility to design simulation tools to monitor and improve the resilience of transport systems in response to traumatic events such as natural and man-made disasters (e.g., floods, terrorist attacks, etc. . . ). In this perspective, we propose ACHILLES, an application to models people{\textquoteright}s movements in a given transport mode through a multiplex network representation based on mobility data. ACHILLES is a web-based application which provides an easy-to-use interface to explore the mobility fluxes and the connectivity of every urban zone in a city, as well as to visualize changes in the transport system resulting from the addition or removal of transport modes, urban zones, and single stops. Notably, our application allows the user to assess the overall resilience of the transport network by identifying its weakest node, i.e. Urban Achilles Heel, with reference to the ancient Greek mythology. To demonstrate the impact of ACHILLES for humanitarian aid we consider its application to a real-world scenario by exploring human mobility in Singapore in response to flood prevention.}, doi = {10.1109/DSAA.2018.00061}, url = {https://ieeexplore.ieee.org/abstract/document/8631413/authors$\#$authors}, author = {Ferretti, Michele and Barlacchi, Gianni and Luca Pappalardo and Lucchini, Lorenzo and Lepri, Bruno} } @conference {1198, title = {Assessing Privacy Risk in Retail Data}, booktitle = {Personal Analytics and Privacy. An Individual and Collective Perspective - First International Workshop, PAP 2017, Held in Conjunction with ECML PKDD 2017, Skopje, Macedonia, September 18, 2017, Revised Selected Papers}, year = {2017}, abstract = {Retail data are one of the most requested commodities by commercial companies. Unfortunately, from this data it is possible to retrieve highly sensitive information about individuals. Thus, there exists the need for accurate individual privacy risk evaluation. In this paper, we propose a methodology for assessing privacy risk in retail data. We define the data formats for representing retail data, the privacy framework for calculating privacy risk and some possible privacy attacks for this kind of data. We perform experiments in a real-world retail dataset, and show the distribution of privacy risk for the various attacks.}, doi = {10.1007/978-3-319-71970-2_3}, url = {https://doi.org/10.1007/978-3-319-71970-2_3}, author = {Roberto Pellungrini and Francesca Pratesi and Luca Pappalardo} } @article {1013, title = {A Data Mining Approach to Assess Privacy Risk in Human Mobility Data}, journal = {ACM Trans. Intell. Syst. Technol.}, volume = {9}, number = {3}, year = {2017}, pages = {31:1{\textendash}31:27}, abstract = {Human mobility data are an important proxy to understand human mobility dynamics, develop analytical services, and design mathematical models for simulation and what-if analysis. Unfortunately mobility data are very sensitive since they may enable the re-identification of individuals in a database. Existing frameworks for privacy risk assessment provide data providers with tools to control and mitigate privacy risks, but they suffer two main shortcomings: (i) they have a high computational complexity; (ii) the privacy risk must be recomputed every time new data records become available and for every selection of individuals, geographic areas, or time windows. In this article, we propose a fast and flexible approach to estimate privacy risk in human mobility data. The idea is to train classifiers to capture the relation between individual mobility patterns and the level of privacy risk of individuals. We show the effectiveness of our approach by an extensive experiment on real-world GPS data in two urban areas and investigate the relations between human mobility patterns and the privacy risk of individuals.}, issn = {2157-6904}, doi = {10.1145/3106774}, url = {http://doi.acm.org/10.1145/3106774}, author = {Roberto Pellungrini and Luca Pappalardo and Francesca Pratesi and Anna Monreale} } @article {1023, title = {Data-driven generation of spatio-temporal routines in human mobility}, journal = {Data Mining and Knowledge Discovery}, year = {2017}, month = {Dec}, abstract = {The generation of realistic spatio-temporal trajectories of human mobility is of fundamental importance in a wide range of applications, such as the developing of protocols for mobile ad-hoc networks or what-if analysis in urban ecosystems. Current generative algorithms fail in accurately reproducing the individuals{\textquoteright} recurrent schedules and at the same time in accounting for the possibility that individuals may break the routine during periods of variable duration. In this article we present Ditras (DIary-based TRAjectory Simulator), a framework to simulate the spatio-temporal patterns of human mobility. Ditras operates in two steps: the generation of a mobility diary and the translation of the mobility diary into a mobility trajectory. We propose a data-driven algorithm which constructs a diary generator from real data, capturing the tendency of individuals to follow or break their routine. We also propose a trajectory generator based on the concept of preferential exploration and preferential return. We instantiate Ditras with the proposed diary and trajectory generators and compare the resulting algorithm with real data and synthetic data produced by other generative algorithms, built by instantiating Ditras with several combinations of diary and trajectory generators. We show that the proposed algorithm reproduces the statistical properties of real trajectories in the most accurate way, making a step forward the understanding of the origin of the spatio-temporal patterns of human mobility.}, issn = {1573-756X}, doi = {10.1007/s10618-017-0548-4}, url = {https://doi.org/10.1007/s10618-017-0548-4}, author = {Luca Pappalardo and Filippo Simini} } @booklet {993, title = {Fast Estimation of Privacy Risk in Human Mobility Data}, year = {2017}, abstract = {Mobility data are an important proxy to understand the patterns of human movements, develop analytical services and design models for simulation and prediction of human dynamics. Unfortunately mobility data are also very sensitive, since they may contain personal information about the individuals involved. Existing frameworks for privacy risk assessment enable the data providers to quantify and mitigate privacy risks, but they suffer two main limitations: (i) they have a high computational complexity; (ii) the privacy risk must be re-computed for each new set of individuals, geographic areas or time windows. In this paper we explore a fast and flexible solution to estimate privacy risk in human mobility data, using predictive models to capture the relation between an individual{\textquoteright}s mobility patterns and her privacy risk. We show the effectiveness of our approach by experimentation on a real-world GPS dataset and provide a comparison with traditional methods. }, isbn = {978-3-319-66283-1}, doi = {10.1007/978-3-319-66284-8_35 }, author = {Roberto Pellungrini and Luca Pappalardo and Francesca Pratesi and Anna Monreale} } @conference {1024, title = {Market Basket Prediction using User-Centric Temporal Annotated Recurring Sequences}, booktitle = {2017 IEEE International Conference on Data Mining (ICDM)}, year = {2017}, publisher = {IEEE}, organization = {IEEE}, abstract = {Nowadays, a hot challenge for supermarket chains is to offer personalized services to their customers. Market basket prediction, i.e., supplying the customer a shopping list for the next purchase according to her current needs, is one of these services. Current approaches are not capable of capturing at the same time the different factors influencing the customer{\textquoteright}s decision process: co-occurrence, sequentuality, periodicity and recurrency of the purchased items. To this aim, we define a pattern named Temporal Annotated Recurring Sequence (TARS). We define the method to extract TARS and develop a predictor for next basket named TBP (TARS Based Predictor) that, on top of TARS, is able to understand the level of the customer{\textquoteright}s stocks and recommend the set of most necessary items. A deep experimentation shows that TARS can explain the customers{\textquoteright} purchase behavior, and that TBP outperforms the state-of-the-art competitors.}, author = {Riccardo Guidotti and Giulio Rossetti and Luca Pappalardo and Fosca Giannotti and Dino Pedreschi} } @article {957, title = {Next Basket Prediction using Recurring Sequential Patterns}, journal = {arXiv preprint arXiv:1702.07158}, year = {2017}, abstract = {Nowadays, a hot challenge for supermarket chains is to offer personalized services for their customers. Next basket prediction, i.e., supplying the customer a shopping list for the next purchase according to her current needs, is one of these services. Current approaches are not capable to capture at the same time the different factors influencing the customer{\textquoteright}s decision process: co-occurrency, sequentuality, periodicity and recurrency of the purchased items. To this aim, we define a pattern Temporal Annotated Recurring Sequence (TARS) able to capture simultaneously and adaptively all these factors. We define the method to extract TARS and develop a predictor for next basket named TBP (TARS Based Predictor) that, on top of TARS, is able to to understand the level of the customer{\textquoteright}s stocks and recommend the set of most necessary items. By adopting the TBP the supermarket chains could crop tailored suggestions for each individual customer which in turn could effectively speed up their shopping sessions. A deep experimentation shows that TARS are able to explain the customer purchase behavior, and that TBP outperforms the state-of-the-art competitors.}, url = {https://arxiv.org/abs/1702.07158}, author = {Riccardo Guidotti and Giulio Rossetti and Luca Pappalardo and Fosca Giannotti and Dino Pedreschi} } @article {1012, title = {Quantifying the relation between performance and success in soccer}, journal = {Advances in Complex Systems}, year = {2017}, pages = {1750014}, abstract = {The availability of massive data about sports activities offers nowadays the opportunity to quantify the relation between performance and success. In this study, we analyze more than 6000 games and 10 million events in six European leagues and investigate this relation in soccer competitions. We discover that a team{\textquoteright}s position in a competition{\textquoteright}s final ranking is significantly related to its typical performance, as described by a set of technical features extracted from the soccer data. Moreover, we find that, while victory and defeats can be explained by the team{\textquoteright}s performance during a game, it is difficult to detect draws by using a machine learning approach. We then simulate the outcomes of an entire season of each league only relying on technical data and exploiting a machine learning model trained on data from past seasons. The simulation produces a team ranking which is similar to the actual ranking, suggesting that a complex systems{\textquoteright} view on soccer has the potential of revealing hidden patterns regarding the relation between performance and success.}, doi = {10.1142/S021952591750014X}, url = {http://www.worldscientific.com/doi/abs/10.1142/S021952591750014X}, author = {Luca Pappalardo and Paolo Cintia} } @article {954, title = {Tiles: an online algorithm for community discovery in dynamic social networks}, journal = {Machine Learning}, volume = {106}, number = {8}, year = {2017}, pages = {1213{\textendash}1241}, abstract = {Community discovery has emerged during the last decade as one of the most challenging problems in social network analysis. Many algorithms have been proposed to find communities on static networks, i.e. networks which do not change in time. However, social networks are dynamic realities (e.g. call graphs, online social networks): in such scenarios static community discovery fails to identify a partition of the graph that is semantically consistent with the temporal information expressed by the data. In this work we propose Tiles, an algorithm that extracts overlapping communities and tracks their evolution in time following an online iterative procedure. Our algorithm operates following a domino effect strategy, dynamically recomputing nodes community memberships whenever a new interaction takes place. We compare Tiles with state-of-the-art community detection algorithms on both synthetic and real world networks having annotated community structure: our experiments show that the proposed approach is able to guarantee lower execution times and better correspondence with the ground truth communities than its competitors. Moreover, we illustrate the specifics of the proposed approach by discussing the properties of identified communities it is able to identify.}, doi = {10.1007/s10994-016-5582-8}, url = {https://link.springer.com/article/10.1007/s10994-016-5582-8}, author = {Giulio Rossetti and Luca Pappalardo and Dino Pedreschi and Fosca Giannotti} } @article {961, title = {An analytical framework to nowcast well-being using mobile phone data}, journal = {International Journal of Data Science and Analytics}, volume = {2}, number = {1-2}, year = {2016}, pages = {75{\textendash}92}, abstract = {An intriguing open question is whether measurements derived from Big Data recording human activities can yield high-fidelity proxies of socio-economic development and well-being. Can we monitor and predict the socio-economic development of a territory just by observing the behavior of its inhabitants through the lens of Big Data? In this paper, we design a data-driven analytical framework that uses mobility measures and social measures extracted from mobile phone data to estimate indicators for socio-economic development and well-being. We discover that the diversity of mobility, defined in terms of entropy of the individual users{\textquoteright} trajectories, exhibits (i) significant correlation with two different socio-economic indicators and (ii) the highest importance in predictive models built to predict the socio-economic indicators. Our analytical framework opens an interesting perspective to study human behavior through the lens of Big Data by means of new statistical indicators that quantify and possibly {\textquotedblleft}nowcast{\textquotedblright} the well-being and the socio-economic development of a territory.}, doi = {10.1007/s41060-016-0013-2}, author = {Luca Pappalardo and Maarten Vanhoof and Lorenzo Gabrielli and Zbigniew Smoreda and Dino Pedreschi and Fosca Giannotti} } @article {960, title = {Homophilic network decomposition: a community-centric analysis of online social services}, journal = {Social Network Analysis and Mining}, volume = {6}, number = {1}, year = {2016}, pages = {103}, abstract = {In this paper we formulate the homophilic network decomposition problem: Is it possible to identify a network partition whose structure is able to characterize the degree of homophily of its nodes? The aim of our work is to understand the relations between the homophily of individuals and the topological features expressed by specific network substructures. We apply several community detection algorithms on three large-scale online social networks{\textemdash}Skype, LastFM and Google+{\textemdash}and advocate the need of identifying the right algorithm for each specific network in order to extract a homophilic network decomposition. Our results show clear relations between the topological features of communities and the degree of homophily of their nodes in three online social scenarios: product engagement in the Skype network, number of listened songs on LastFM and homogeneous level of education among users of Google+.}, doi = {10.1007/s1327}, author = {Giulio Rossetti and Luca Pappalardo and Riivo Kikas and Dino Pedreschi and Fosca Giannotti and Marlon Dumas} } @conference {822, title = {A novel approach to evaluate community detection algorithms on ground truth}, booktitle = {7th Workshop on Complex Networks}, year = {2016}, publisher = {Springer-Verlag}, organization = {Springer-Verlag}, address = {Dijon, France}, abstract = {Evaluating a community detection algorithm is a complex task due to the lack of a shared and universally accepted definition of community. In literature, one of the most common way to assess the performances of a community detection algorithm is to compare its output with given ground truth communities by using computationally expensive metrics (i.e., Normalized Mutual Information). In this paper we propose a novel approach aimed at evaluating the adherence of a community partition to the ground truth: our methodology provides more information than the state-of-the-art ones and is fast to compute on large-scale networks. We evaluate its correctness by applying it to six popular community detection algorithms on four large-scale network datasets. Experimental results show how our approach allows to easily evaluate the obtained communities on the ground truth and to characterize the quality of community detection algorithms.}, doi = {10.1007/978-3-319-30569-1_10}, url = {http://www.giuliorossetti.net/about/wp-content/uploads/2015/12/Complenet16.pdf}, author = {Giulio Rossetti and Luca Pappalardo and S Rinzivillo} } @conference {819, title = {Community-centric analysis of user engagement in Skype social network}, booktitle = {International conference on Advances in Social Network Analysis and Mining}, year = {2015}, publisher = {IEEE}, organization = {IEEE}, address = {Paris, France}, isbn = {978-1-4503-3854-7}, doi = {10.1145/2808797.2809384}, url = {http://dl.acm.org/citation.cfm?doid=2808797.2809384}, author = {Giulio Rossetti and Luca Pappalardo and Riivo Kikas and Dino Pedreschi and Fosca Giannotti and Marlon Dumas} } @proceedings {770, title = {The harsh rule of the goals: data-driven performance indicators for football teams}, year = {2015}, abstract = {{\textemdash}Sports analytics in general, and football (soccer in USA) analytics in particular, have evolved in recent years in an amazing way, thanks to automated or semi-automated sensing technologies that provide high-fidelity data streams extracted from every game. In this paper we propose a data-driven approach and show that there is a large potential to boost the understanding of football team performance. From observational data of football games we extract a set of pass-based performance indicators and summarize them in the H indicator. We observe a strong correlation among the proposed indicator and the success of a team, and therefore perform a simulation on the four major European championships (78 teams, almost 1500 games). The outcome of each game in the championship was replaced by a synthetic outcome (win, loss or draw) based on the performance indicators computed for each team. We found that the final rankings in the simulated championships are very close to the actual rankings in the real championships, and show that teams with high ranking error show extreme values of a defense/attack efficiency measure, the Pezzali score. Our results are surprising given the simplicity of the proposed indicators, suggesting that a complex systems{\textquoteright} view on football data has the potential of revealing hidden patterns and behavior of superior quality.}, url = {https://www.researchgate.net/profile/Luca_Pappalardo/publication/281318318_The_harsh_rule_of_the_goals_data-driven_performance_indicators_for_football_teams/links/561668e308ae37cfe4090a5d.pdf}, author = {Paolo Cintia and Luca Pappalardo and Dino Pedreschi and Fosca Giannotti and Marco Malvaldi} } @article {723, title = {Returners and explorers dichotomy in human mobility}, journal = {Nat Commun}, volume = {6}, year = {2015}, month = {09}, abstract = {The availability of massive digital traces of human whereabouts has offered a series of novel insights on the quantitative patterns characterizing human mobility. In particular, numerous recent studies have lead to an unexpected consensus: the considerable variability in the characteristic travelled distance of individuals coexists with a high degree of predictability of their future locations. Here we shed light on this surprising coexistence by systematically investigating the impact of recurrent mobility on the characteristic distance travelled by individuals. Using both mobile phone and GPS data, we discover the existence of two distinct classes of individuals: returners and explorers. As existing models of human mobility cannot explain the existence of these two classes, we develop more realistic models able to capture the empirical findings. Finally, we show that returners and explorers play a distinct quantifiable role in spreading phenomena and that a correlation exists between their mobility patterns and social interactions.}, url = {http://dx.doi.org/10.1038/ncomms9166}, author = {Luca Pappalardo and Filippo Simini and S Rinzivillo and Dino Pedreschi and Fosca Giannotti and Barabasi, Albert-Laszlo} } @article {724, title = {Small Area Model-Based Estimators Using Big Data Sources}, journal = {Journal of Official Statistics}, volume = {31}, number = {2}, year = {2015}, pages = {263{\textendash}281}, author = {Stefano Marchetti and Caterina Giusti and Monica Pratesi and Nicola Salvati and Fosca Giannotti and Dino Pedreschi and S Rinzivillo and Luca Pappalardo and Lorenzo Gabrielli} } @conference {727, title = {Mining efficient training patterns of non-professional cyclists}, booktitle = {22nd Italian Symposium on Advanced Database Systems, {SEBD} 2014, Sorrento Coast, Italy, June 16-18, 2014.}, year = {2014}, author = {Paolo Cintia and Luca Pappalardo and Dino Pedreschi} } @conference {623, title = {The patterns of musical influence on the Last.Fm social network}, booktitle = {22nd Italian Symposium on Advanced Database Systems, {SEBD} 2014, Sorrento Coast, Italy, June 16-18, 2014.}, year = {2014}, author = {Diego Pennacchioli and Giulio Rossetti and Luca Pappalardo and Dino Pedreschi and Fosca Giannotti and Michele Coscia} } @conference {725, title = {The purpose of motion: Learning activities from Individual Mobility Networks}, booktitle = {International Conference on Data Science and Advanced Analytics, {DSAA} 2014, Shanghai, China, October 30 - November 1, 2014}, year = {2014}, doi = {10.1109/DSAA.2014.7058090}, url = {http://dx.doi.org/10.1109/DSAA.2014.7058090}, author = {S Rinzivillo and Lorenzo Gabrielli and Mirco Nanni and Luca Pappalardo and Dino Pedreschi and Fosca Giannotti} } @conference {731, title = {Comparing General Mobility and Mobility by Car}, booktitle = {Computational Intelligence and 11th Brazilian Congress on Computational Intelligence (BRICS-CCI CBIC), 2013 BRICS Congress on}, year = {2013}, month = {Sept}, doi = {10.1109/BRICS-CCI-CBIC.2013.116}, author = {Luca Pappalardo and Filippo Simini and S Rinzivillo and Dino Pedreschi and Fosca Giannotti} } @conference {729, title = {"Engine Matters": {A} First Large Scale Data Driven Study on Cyclists{\textquoteright} Performance}, booktitle = {13th {IEEE} International Conference on Data Mining Workshops, {ICDM} Workshops, TX, USA, December 7-10, 2013}, year = {2013}, doi = {10.1109/ICDMW.2013.41}, url = {http://dx.doi.org/10.1109/ICDMW.2013.41}, author = {Paolo Cintia and Luca Pappalardo and Dino Pedreschi} } @conference {504, title = {Measuring tie strength in multidimensional networks}, booktitle = {SEDB 2013}, year = {2013}, month = {2013}, author = {Giulio Rossetti and Luca Pappalardo and Dino Pedreschi} } @conference {624, title = {The Three Dimensions of Social Prominence}, booktitle = {Social Informatics - 5th International Conference, SocInfo 2013, Kyoto, Japan, November 25-27, 2013, Proceedings}, year = {2013}, doi = {10.1007/978-3-319-03260-3_28}, url = {http://dx.doi.org/10.1007/978-3-319-03260-3_28}, author = {Diego Pennacchioli and Giulio Rossetti and Luca Pappalardo and Dino Pedreschi and Fosca Giannotti and Michele Coscia} } @article {732, title = {{Understanding the patterns of car travel}}, journal = {The European Physical Journal Special Topics}, volume = {215}, number = {1}, year = {2013}, pages = {61{\textendash}73}, abstract = {{Are the patterns of car travel different from those of general human mobility? Based on a unique dataset consisting of the GPS trajectories of 10 million travels accomplished by 150,000 cars in Italy, we investigate how known mobility models apply to car travels, and illustrate novel analytical findings. We also assess to what extent the sample in our dataset is representative of the overall car mobility, and discover how to build an extremely accurate model that, given our GPS data, estimates the real traffic values as measured by road sensors.}}, doi = {10.1140/epjst\%252fe2013-01715-5}, url = {http://dx.doi.org/10.1140/epjst\%252fe2013-01715-5}, author = {Luca Pappalardo and S Rinzivillo and Qu, Zehui and Dino Pedreschi and Fosca Giannotti} } @article {488, title = {Analisi di Mobilita{\textquoteright} con dati eterogenei}, year = {2012}, institution = {ISTI - CNR}, address = {Pisa}, author = {Barbara Furletti and Roberto Trasarti and Lorenzo Gabrielli and S Rinzivillo and Luca Pappalardo and Fosca Giannotti} } @conference {626, title = {"How Well Do We Know Each Other?" Detecting Tie Strength in Multidimensional Social Networks}, booktitle = {International Conference on Advances in Social Networks Analysis and Mining, {ASONAM} 2012, Istanbul, Turkey, 26-29 August 2012}, year = {2012}, doi = {10.1109/ASONAM.2012.180}, url = {http://doi.ieeecomputersociety.org/10.1109/ASONAM.2012.180}, author = {Luca Pappalardo and Giulio Rossetti and Dino Pedreschi} }