@article{LamMelMil99-InfSciences99-IJ, author = {Evelina ~Lamma AND Paola ~Mello AND Michela ~Milano AND Fabrizio ~Riguzzi}, title = {Integrating Induction and Abduction in Logic Programming}, journal = {Information Sciences}, pages = {25--54}, volume = {116}, number = {1}, year = 1999, month = may, abstract = {We propose an approach for the integration of abduction and induction in Logic Programming. We define an Abductive Learning Problem as an extended Inductive Logic Programming problem where both the background and target theories are abductive theories and where abductive derivability is used as the coverage relation instead of deductive derivability. The two main benefits of this integration are the possibility of learning in presence of incomplete knowledge and the increased expressive power of the background and target theories. We present the system LAP (Learning Abductive Programs) that is able to solve this extended learning problem and we describe, by means of examples, four different learning tasks that can be performed by the system: learning from incomplete knowledge, learning rules with exceptions, learning from integrity constraints and learning recursive predicates.}, keywords = {Abduction, Negation, Integrity Constraints}, publisher = {Elsevier Science}, address = {Amsterdam, \TheNetherlands}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/LamMelMil-IS99.pdf}, doi = {10.1016/S0020-0255(98)10092-0}, url = {http://www.sciencedirect.com/science/article/pii/S0020025598100920}, copyright = {Elsevier} }

@article{LamPerRig00-ML-IJ, author = {Evelina Lamma and Fabrizio Riguzzi and Lu\'{i}s Moniz Pereira}, title = {Strategies in Combined Learning via Logic Programs}, journal = {Machine Learning}, volume = {38}, number = {1/2}, year = {2000}, month = {January/February}, pages = {63--87}, keywords = {ILP Implementation,ILP Theory,Knowledge Representation,Negation}, abstract = {We discuss the adoption of a three-valued setting for inductive concept learning. Distinguishing between what is true, what is false and what is unknown can be useful in situations where decisions have to be taken on the basis of scarce, ambiguous, or downright contradictory information. In a three-valued setting, we learn a definition for both the target concept and its opposite, considering positive and negative examples as instances of two disjoint classes. To this purpose, we adopt Extended Logic Programs (ELP) under a Well-Founded Semantics with explicit negation WFSX as the representation formalism for learning, and show how ELPs can be used to specify combinations of strategies in a declarative way also coping with contradiction and exceptions. Explicit negation is used to represent the opposite concept, while default negation is used to ensure consistency and to handle exceptions to general rules. Exceptions are represented by examples covered by the definition for a concept that belong to the training set for the opposite concept. Standard Inductive Logic Programming techniques are employed to learn the concept and its opposite. Depending on the adopted technique, we can learn the most general or the least general definition. Thus, four epistemological varieties occur, resulting from the combination of most general and least general solutions for the positive and negative concept. We discuss the factors that should be taken into account when choosing and strategically combining the generality levels for positive and negative concepts. In the paper, we also handle the issue of strategic combination of possibly contradictory learnt definitions of a predicate and its explicit negation. All in all, we show that extended logic programs under well-founded semantics with explicit negation add expressivity to learning tasks, and allow the tackling of a number of representation and strategic issues in a principled way. Our techniques have been implemented and examples run on a state-of-the-art logic programming system with tabling which implements WFSX.}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/LamRigPer-ML00.pdf}, publisher = {Springer Netherlands}, address = {Dordrecht, \TheNetherlands}, doi = {10.1023/A:1007681906490}, http = {http://link.springer.com/article/10.1023%2FA%3A1007681906490}, copyright = {Springer Netherlands}, note = {The original publication is available at \url{http://www.springerlink.com}} }

@article{KakRig00-NGC-IJ, author = {Antonis C. Kakas AND Fabrizio Riguzzi}, title = {Abductive Concept Learning}, journal = {New Generation Computing}, volume = {18}, number = {3}, year = {2000}, pages = {243--294}, keywords = {Abduction, Integrity Constraints, Multiple Predicate Learning}, address = {Tokyo, \Japan}, month = may, publisher = {Ohmsha, Ltd. and Springer}, abstract = {We investigate how abduction and induction can be integrated into a common learning framework. In particular, we consider an extension of Inductive Logic Programming (ILP) for the case in which both the background and the target theories are abductive logic programs and where an abductive notion of entailment is used as the basic coverage relation for learning. This extended learning framework has been called Abductive Concept Learning (ACL). In this framework, it is possible to learn with incomplete background information about the training examples by exploiting the hypothetical reasoning of abduction. We also study how the ACL framework can be used as a basis for multiple predicate learning. An algorithm for ACL is developed by suitably extending the top-down ILP method: the deductive proof procedure of Logic Programming is replaced by an abductive proof procedure for Abductive Logic Programming. This algorithm also incorporates a phase for learning integrity constraints by suitably employing a system that learns from interpretations like ICL. The framework of ACL thus integrates the two ILP settings of explanatory (predictive) learning and confirmatory (descriptive) learning. The above algorithm has been implemented into a system also called ACL\footnote{The learning systems developed in this work together with sample experimental data can be found at the following address: {\tt http://www-lia.deis.unibo.it/Software/ACL/}} Several experiments have been performed that show the effectiveness of the ACL framework in learning from incomplete data and its appropriate use for multiple predicate learning.}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/KakRIg-NGC00.pdf}, http = {http://link.springer.com/article/10.1007%2FBF03037531}, doi = {10.1007/BF03037531}, copyright = {Ohmsha, Ltd. and Springer} }

@article{CucMelPic01-IDA-IJ, author = {Rita Cucchiara and Paola Mello and Massimo Piccardi and Fabrizio Riguzzi}, title = {An Application of Machine Learning and Statistics to Defect Detection}, journal = {Intelligent Data Analysis}, year = {2001}, volume = {5}, number = {2}, pages = {151--164}, publisher = {{IOS} Press}, address = {Amsterdam, \TheNetherlands}, month = {March/April}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/CucMelPic-IDA01.pdf}, doi = {10.3233/IDA-2001-5205}, copyright = {Rita Cucchiara, Paola Mello, Massimo Piccardi, Fabrizio Riguzzi, exclusively licensed to {IOS} Press} }

@article{LamMaeMel01-ENTCS-IJ, author = {Evelina Lamma and Leonardo Maestrami and Paola Mello and Fabrizio Riguzzi and Sergio Storari}, title = {Rule-based Programming for Building Expert Systems: a Comparison in the Microbiological Data Validation and Surveillance Domain}, journal = {Electronic Notes in Theoretical Computer Science}, volume = {59}, issue = {4}, publisher = {Elsevier Science Publishers}, editor = {Mark van den Brand and Rakesh Verma}, year = {2001}, address = {Amsterdam, \TheNetherlands}, doi = {10.1016/S1571-0661(04)00299-3}, url = {http://www.sciencedirect.com/science/article/pii/S1571066104002993}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/LamMaeMel-ENTCS01.pdf}, month = sep, abstract = {In this work, we compare three rule-based programming tools used for building an expert system for microbiological laboratory data validation and bacteria infections monitoring. The first prototype of the system was implemented in KAPPA-PC. We report on the implementation and performance by comparing KAPPA-PC with two other more recent tools, namely JESS and ILOG JRULES. In order to test each tool we realized three simple test applications capable to perform some tasks that are peculiar of our expert system.}, keywords = {Expert Systems, Knowledge-based Systems, Microbiology} }

@article{LamMelRig03-NGC-IJ, author = {Evelina Lamma and Fabrizio Riguzzi and Sergio Storari and Paola Mello and Annamaria Nanetti}, title = {Discovering Validation Rules from Micro-biological Data}, journal = {New Generation Computing}, year = {2003}, volume = {21}, number = {2}, pages = {123--134}, publisher = {Ohmsha, Ltd. and Springer}, address = {Tokyo, \Japan}, month = feb, pdf = {http://ml.unife.it/wp-content/uploads/Papers/LamRigStoMelNan-NGC03.pdf}, http = {http://www.springerlink.com/content/b816tm18j5715810}, doi = {10.1007/BF03037630}, copyright = {Ohmsha, Ltd. and Springer}, abstract = {A huge amount of data is daily collected from clinical mi- crobiology laboratories. These data concern the resistance or susceptibil- ity of bacteria to tested antibiotics. Almost all microbiology laboratories follow standard antibiotic testing guidelines which suggest antibiotic test execution methods and result interpretation and validation (among them, those annually published by NCCLS). Guidelines basically specify, for each species, the antibiotics to be tested, how to interpret the results of tests and a list of exceptions regarding particular antibiotic test results. Even if these standards are quite assessed, they do not consider pecu- liar features of a given hospital laboratory, which possibly influence the antimicrobial test results, and the further validation process. In order to improve and better tailor the validation process, we have applied knowledge discovery techniques, and data mining in particular, to microbiological data with the purpose of discovering new validation rules, not yet included in NCCLS guidelines, but considered plausible and correct by interviewed experts. In particular, we applied the knowledge discovery process in order to find (association) rules relating to each other the susceptibility or resistance of a bacterium to different antibiotics. This approach is not antithetic, but complementary to that based on NCCLS rules: it proved very effective in validating some of them, and also in extending that compendium. In this respect, the new discovered knowledge has lead microbiologists to be aware of new correlations among some antimicrobial test results, which were previously unnoticed. Last but not least, the new discovered rules, taking into account the history of the considered laboratory, are better tailored to the hospital situation, and this is very important since some resistances to antibiotics are specific to particular, local hospital environments.}, keywords = {Knowledge Discovery and Data mining, Microbiology, Knowledge Based Systems, Knowledge Elicitation} }

@article{LamRigPer03-NGC-IJ, author = {Evelina Lamma and Fabrizio Riguzzi and Lu\'\i{}s Moniz Pereira}, title = {Belief Revision via {L}amarckian Evolution}, journal = {New Generation Computing}, abstract = {We present a system for performing belief revision in a multi-agent environment. The system is called GBR (Genetic Belief Revisor) and it is based on a genetic algorithm. In this setting, different individuals are exposed to different experiences. This may happen because the world surrounding an agent changes over time or because we allow agents exploring different parts of the world. The algorithm permits the exchange of chromosomes from different agents and combines two different evolution strategies, one based on Darwin's and the other on Lamarck's evolutionary theory. The algorithm therefore includes also a Lamarckian operator that changes the memes of an agent in order to improve their fitness. The operator is implemented by means of a belief revision procedure that, by tracing logical derivations, identifies the memes leading to contradiction. Moreover, the algorithm comprises a special crossover mechanism for memes in which a meme can be acquired from another agent only if the other agent has ``accessed'' the meme, i.e. if an application of the Lamarckian operator has read or modified the meme. Experiments have been performed on the $n$-queen problem and on a problem of digital circuit diagnosis. In the case of the $n$-queen problem, the addition of the Lamarckian operator in the single agent case improves the fitness of the best solution. In both cases the experiments show that the distribution of constraints, even if it may lead to a reduction of the fitness of the best solution, does not produce a significant reduction.}, publisher = {Ohmsha, Ltd. and Springer}, address = {Tokyo, \Japan}, keywords = {Genetic_Algorithms,Theory_Revision}, year = {2003}, volume = {21}, number = {3}, month = aug, pages = {247--275}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/LamRigPer-NGC03.pdf}, http = {http://www.springerlink.com/content/063764w6n3847825/}, doi = {10.1007/BF03037475}, copyright = {Ohmsha, Ltd. and Springer} }

@article{LamMelRig04-CJ-IJ, author = {Evelina Lamma and Paola Mello and Fabrizio Riguzzi}, title = {A System for Measuring Function Points from an {ER}-{DFD} Specification}, journal = {The Computer Journal}, abstract = {We present a tool for measuring the Function Point software metric from the specification of a software system expressed in the form of an Entity Relationship diagram plus a Data Flow Diagram (ER-DFD). First, the informal and general Function Point counting rules are translated into rigorous rules expressing properties of the ER-DFD. Then, the rigorous rules are translated into Prolog. The measures given by the system on a number of case studies are in accordance with those of human experts.}, publisher = {Oxford University Press}, address = {Oxford, \UK}, keywords = {Software Engineering, Software Metrics, Function Points}, year = {2004}, volume = {47}, number = {3}, pages = {358--372}, month = may, pdf = {http://ml.unife.it/wp-content/uploads/Papers/fun.pdf}, issn = {0010--4620}, doi = {10.1093/comjnl/47.3.358}, copyright = {Evelina Lamma, Paola Mello and Fabrizio Riguzzi, licensed exclusively to The British Computer Society} }

@article{LamMelNan06-TITB-IJ, author = {Evelina Lamma and Paola Mello and Annamaria Nanetti and Fabrizio Riguzzi and Sergio Storari and Gianfranco Valastro}, title = {Artificial Intelligence Techniques for Monitoring Dangerous Infections}, journal = {IEEE Transaction on Information Technology in Biomedicine}, year = {2006}, publisher = {IEEE Computer Society Press}, address = {Washington, DC, \USA}, volume = {10}, number = {1}, pages = {143-155}, month = jan, issn = {1089-7771}, doi = {10.1109/TITB.2005.855537}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/LamMelNanRigStoVal-TITB06.pdf}, abstract = { The monitoring and detection of nosocomial infections is a very important problem arising in hospitals. A hospital-acquired or nosocomial infection is a disease that develops after the admission into the hospital and it is the consequence of a treatment, not necessarily a surgical one, performed by the medical staff. Nosocomial infections are dangerous because they are caused by bacteria which have dangerous (critical) resistance to antibiotics. This problem is very serious all over the world. In Italy, actually almost 5-8\% of the patients admitted into hospitals develop this kind of infection. In order to reduce this figure, policies for controlling infections should be adopted by medical practitioners. In order to support them in this complex task, we have developed a system, called MERCURIO, capable of managing different aspects of the problem. The objectives of this system are the validation of microbiological data and the creation of a real time epidemiological information system. The system is useful for laboratory physicians, because it supports them in the execution of the microbiological analyses; for clinicians, because it supports them in the definition of the prophylaxis, of the most suitable antibiotic therapy and in the monitoring of patients' infections, and for epidemiologists, because it allows them to identify outbreaks and to study infection dynamics. In order to achieve these objectives we have adopted expert system and data mining techniques. We have also integrated a statistical module that monitors the diffusion of nosocomial infections over time in the hospital and that strictly interacts with the knowledge based module. Data mining techniques have been used for improving the system knowledge base. The knowledge discovery process is not antithetic, but complementary to the one based on manual knowledge elicitation. In order to verify the reliability of the tasks performed by MERCURIO and the usefulness of the knowledge discovery approach, we performed a test based on a dataset of real infection events. In the validation task MERCURIO achieved an accuracy of 98.5\%, a sensitivity of 98.5\% and a specificity of 99\%. In the therapy suggestion task MERCURIO achieved very high Accuracy and Specificity as well. The executed test provided many insights to experts too (we discovered some of their mistakes). The knowledge discovery approach was very effective in validating part of MERCURIO knowledge base and also in extending it with new validation rules, confirmed by interviewed microbiologists and peculiar to the hospital laboratory under consideration.}, keywords = {Microbiology, Knowledge Based Systems, Decision Support Systems, Data Mining, Classification}, copyright = {IEEE} }

@article{Rig08-ML-IJ, author = { Fabrizio Riguzzi}, title = {{ALLPAD}: Approximate Learning of Logic Programs with Annotated Disjunctions}, journal = {Machine Learning}, note = {The original publication is available at \url{http://www.springerlink.com}}, year = {2008}, volume = {70}, number = {2-3}, month = mar, pdf = {http://ml.unife.it/wp-content/uploads/Papers/Rig-ML07.pdf}, doi = {10.1007/s10994-007-5032-8 }, abstract = {Logic Programs with Annotated Disjunctions (LPADs) provide a simple and elegant framework for representing probabilistic knowledge in logic programming. In this paper we consider the problem of learning ground LPADs starting from a set of interpretations annotated with their probability. We present the system ALLPAD for solving this problem. ALLPAD modifies the previous system LLPAD in order to tackle real world learning problems more effectively. This is achieved by looking for an approximate solution rather than a perfect one. A number of experiments have been performed on real and artificial data for evaluating ALLPAD, showing the feasibility of the approach}, keywords = {Inductive logic programming, Probabilistic logic programming, Statistical relational learning, Logic programs with annotated disjunctions}, pages = {207--223}, publisher = {Springer}, address = {Heidelberg, \Germany}, copyright = {Springer} }

@article{Rig09-LJIGPL-IJ, author = {Fabrizio Riguzzi}, title = {Extended Semantics and Inference for the {Independent Choice Logic}}, journal = {Logic Journal of the IGPL}, publisher = {Oxford University Press}, volume = {17}, number = {6}, pages = {589--629}, address = {Oxford, \UK}, year = {2009}, abstract = {The Independent Choice Logic (ICL) is a language for expressing probabilistic information in logic programming that adopts a distribution semantics: an ICL theory defines a distribution over a set of possible worlds that are normal logic programs. The probability of a query is then given by the sum of the probabilities of worlds where the query is true. The ICL semantics requires the theories to be acyclic. This is a strong limitation that rules out many interesting programs. In this paper we present an extension of the ICL semantics that allows theories to be modularly acyclic. Inference with ICL can be performed with the Cilog2 system that computes explanations to queries and then makes them mutually incompatible by means of an iterative algorithm. We propose the system PICL (for Probabilistic inference with ICL) that computes the explanations to queries by means of a modification of SLDNF\--resolution and then makes them mutually incompatible by means of Binary Decision Diagrams. PICL and Cilog2 are compared on problems that involve computing the probability of a connection between two nodes in biological graphs and social networks. PICL turned to be more efficient, handling larger networks/more complex queries in a shorter time than Cilog2. This is true both for marginal and for conditional queries. }, doi = {10.1093/jigpal/jzp025}, keywords = {Probabilistic Logic Programming, Independent Choice Logic, Modularly acyclic programs, SLDNF-Resolution}, copyright = {Fabrizio Riguzzi, exclusively licensed to Oxford University Press}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/Rig09-LJIGPL-IJ.pdf} }

@article{CheLamMel09-TOPNOC-IJ, author = {Federico Chesani and Evelina Lamma and Paola Mello and Marco Montali and Fabrizio Riguzzi and Sergio Storari}, title = {Exploiting Inductive Logic Programming Techniques for Declarative Process Mining}, journal = {LNCS Transactions on Petri Nets and Other Models of Concurrency, {ToPNoC} {II}}, year = {2009}, publisher = {Springer}, address = {Heidelberg, \Germany}, note = {The original publication is available at \url{http://www.springerlink.com}}, series = {Lecture Notes on Computer Science}, volume = {5460}, pages = {278--295}, doi = {10.1007/978-3-642-00899-3_16}, issn = {1867-7193}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/CheLamMel-TOPNOC09.pdf}, url = {http://www.springerlink.com/content/c4j2k38675588759/}, abstract = {In the last few years, there has been a growing interest in the adoption of declarative paradigms for modeling and verifying process models. These paradigms provide an abstract and human understandable way of specifying constraints that must hold among activities executions rather than focusing on a specific procedural solution. Mining such declarative descriptions is still an open challenge. In this paper, we present a logic-based approach for tackling this problem. It relies on Inductive Logic Programming techniques and, in particular, on a modified version of the Inductive Constraint Logic algorithm. We investigate how, by properly tuning the learning algorithm, the approach can be adopted to mine models expressed in the ConDec notation, a graphical language for the declarative specification of business processes. Then, we sketch how such a mining framework has been concretely implemented as a ProM plug-in called DecMiner. We finally discuss the effectiveness of the approach by means of an example which shows the ability of the language to model concurrent activities and of DecMiner to learn such a model.}, keywords = {Process Mining, Inductive Logic Programming, Declarative Process Languages}, copyright = {Springer} }

@article{StoRigLam09-IDA-IJ, author = {Sergio Storari and Fabrizio Riguzzi and Evelina Lamma}, title = {Exploiting Association and Correlation Rules Parameters for Learning Bayesian Networks}, journal = {Intelligent Data Analysis}, year = {2009}, pages = { 689--701}, publisher = {{IOS} Press}, volume = {13}, issue = {5}, address = {Amsterdam, \TheNetherlands}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/StoRigLam-IDA09.pdf}, doi = {10.3233/IDA-2009-0388}, abstract = { In data mining, association and correlation rules are inferred from data in order to highlight statistical dependencies among attributes. The metrics defined for evaluating these rules can be exploited to score relationships between attributes in Bayesian network learning. In this paper, we propose two novel methods for learning Bayesian networks from data that are based on the K2 learning algorithm and that improve it by exploiting parameters normally defined for association and correlation rules. In particular, we propose the algorithms K2-Lift and K2-$X^{2}$, that exploit the lift metric and the $X^2$ metric respectively. We compare K2\--Lift, K2-$X^{2}$ with K2 on artificial data and on three test Bayesian networks. The experiments show that both our algorithms improve K2 with respect to the quality of the learned network. Moreover, a comparison of K2\--Lift and K2-$X^{2}$ with a genetic algorithm approach on two benchmark networks show superior results on one network and comparable results on the other.}, keywords = {Bayesian Networks Learning, K2, Association Rules, Correlation Rules}, copyright = {Sergio Storari, Fabrizio Riguzzi and Evelina Lamma, exclusively licensed to {IOS} Press} }

@article{GavRigMilCag10-ICLP10-IJ, author = {Marco Gavanelli and Fabrizio Riguzzi and Michela Milano and Paolo Cagnoli}, title = {{L}ogic-{B}ased {D}ecision {S}upport for {S}trategic {E}nvironmental {A}ssessment}, year = {2010}, editor = {M.~Hermenegildo and T.~Schaub}, month = jul, journal = {Theory and Practice of Logic Programming, 26th Int'l. Conference on Logic Programming (ICLP'10) Special Issue}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/GavRigMilCag-ICLP10.pdf}, volume = {10}, number = {4-6}, publisher = {Cambridge University Press}, copyright = {Cambridge University Press}, abstract = {Strategic Environmental Assessment is a procedure aimed at introducing systematic assessment of the environmental effects of plans and programs. This procedure is based on the so called coaxial matrices that define dependencies between plan activities (infrastructures, plants, resource extractions, buildings, etc.) and positive and negative environmental impacts, and dependencies between these impacts and environmental receptors. Up to now, this procedure is manually implemented by environmental experts for checking the environmental effects of a given plan or program, but it is never applied during the plan/program construction. A decision support system, based on a clear logic semantics, would be an invaluable tool not only in assessing a single, already defined plan, but also during the planning process in order to produce an optimized, environmentally assessed plan and to study possible alternative scenarios. We propose two logic-based approaches to the problem, one based on Constraint Logic Programming and one on Probabilistic Logic Programming that could be, in the future, conveniently merged to exploit the advantages of both. We test the proposed approaches on a real energy plan and we discuss their limitations and advantages.}, keywords = {Strategic Environmental Assessment, Regional Planning, Constraint Logic Programming, Probabilistic Logic Programming, Causality}, doi = {10.1017/S1471068410000335}, pages = {643--658}, arxiv = {1007.3159} }

@article{Rig10-FI-IJ, author = {Fabrizio Riguzzi}, title = {{SLGAD} Resolution for Inference on {Logic Programs with Annotated Disjunctions}}, journal = {Fundamenta Informaticae}, abstract = {Logic Programs with Annotated Disjunctions (LPADs) allow to express probabilistic information in logic programming. The semantics of an LPAD is given in terms of well\--founded models of the normal logic programs obtained by selecting one disjunct from each ground LPAD clause. Inference on LPADs can be performed using either the system Ailog2, that was developed for the Independent Choice Logic, or SLDNFAD, an algorithm based on SLDNF. However, both of these algorithms run the risk of going into infinite loops and of performing redundant computations. In order to avoid these problems, we present SLGAD resolution that computes the (conditional) probability of a ground query from a range\--restricted LPAD and is based on SLG resolution for normal logic programs. As SLG, it uses tabling to avoid some infinite loops and to avoid redundant computations. The performances of SLGAD are evaluated on classical benchmarks for normal logic programs under the well\--founded semantics, namely a 2\--person game and the ancestor relation, and on a game of dice. SLGAD is compared with Ailog2 and SLDNFAD on the problems in which they do not go into infinite loops, namely those that are described by a modularly acyclic program. On the 2\--person game and the ancestor relation, SLGAD is more expensive than SLDNFAD on problems where SLDNFAD succeeds but is faster than Ailog2 when the query is true in an exponential number of instances. If the program requires the repeated computation of similar goals, as for the dice game, then SLGAD outperforms both Ailog2 and SLDNFAD.}, keywords = {Probabilistic Logic Programming, Well-Founded Semantics, Logic Programs with Annotated Disjunctions, SLG Resolution}, month = oct, volume = {102}, number = {3-4}, year = {2010}, pages = {429--466}, doi = {10.3233/FI-2010-392}, publisher = {{IOS} Press}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/Rig10-FI-IJ.pdf}, scopus = {2-s2.0-78650327867}, isi = {WOS:000284311600008} }

@article{RigSwi11-ICLP11-IJ, author = {Fabrizio Riguzzi and Terrance Swift}, title = {The {PITA} System: Tabling and Answer Subsumption for Reasoning under Uncertainty}, year = {2011}, journal = {Theory and Practice of Logic Programming, 27th International Conference on Logic Programming (ICLP'11) Special Issue, Lexington, Kentucky 6-10 July 2011}, editor = {John Gallagher and Michael Gelfond}, volume = {11}, number = {4--5}, publisher = {Cambridge University Press}, copyright = {Cambridge University Press}, abstract = {Many real world domains require the representation of a measure of uncertainty. The most common such representation is probability, and the combination of probability with logic programs has given rise to the field of Probabilistic Logic Programming (PLP), leading to languages such as the Independent Choice Logic, Logic Programs with Annotated Disjunctions (LPADs), Problog, PRISM and others. These languages share a similar distribution semantics, and methods have been devised to translate programs between these languages. The complexity of computing the probability of queries to these general PLP programs is very high due to the need to combine the probabilities of explanations that may not be exclusive. As one alternative, the PRISM system reduces the complexity of query answering by restricting the form of programs it can evaluate. As an entirely different alternative, Possibilistic Logic Programs adopt a simpler metric of uncertainty than probability. Each of these approaches -- general PLP, restricted PLP, and Possibilistic Logic Programming -- can be useful in different domains depending on the form of uncertainty to be represented, on the form of programs needed to model problems, and on the scale of the problems to be solved. In this paper, we show how the PITA system, which originally supported the general PLP language of LPADs, can also efficiently support restricted PLP and Possibilistic Logic Programs. PITA relies on tabling with answer subsumption and consists of a transformation along with an API for library functions that interface with answer subsumption. We show that, by adapting its transformation and library functions, PITA can be parameterized to PITA(IND,EXC) which supports the restricted PLP of PRISM, including optimizations that reduce non-discriminating arguments and the computation of Viterbi paths. Furthermore, we show PITA to be competitive with PRISM for complex queries to Hidden Markov Model examples, and sometimes much faster. We further show how PITA can be parameterized to PITA(COUNT) which computes the number of different explanations for a subgoal, and to PITA(POSS) which scalably implements Possibilistic Logic Programming. PITA is a supported package in version 3.3 of XSB. }, keywords = {Probabilistic Logic Programming, Possibilistic Logic Programming, Tabling, Answer Subsumption, Program Transformation}, pages = {433--449}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/RigSwi-ICLP11.pdf}, doi = {10.1017/S147106841100010X}, url = {http://arxiv.org/pdf/1107.4747v1}, arxiv = {1107.4747} }

@article{AlbGavLam11-IA-IJ, author = {Marco Alberti and Marco Gavanelli and Evelina Lamma and Fabrizio Riguzzi and Sergio Storari}, title = {Learning specifications of interaction protocols and business processes and proving their properties}, journal = {Intelligenza artificiale}, year = 2011, volume = 5, number = 1, pages = {71--75}, month = feb, doi = {10.3233/IA-2011-0006}, issn = {1724-8035}, abstract = {In this paper, we overview our recent research activity concerning the induction of Logic Programming specifications, and the proof of their properties via Abductive Logic Programming. Both the inductive and abductive tools here briefly described have been applied to respectively learn and verify (properties of) interaction protocols in multi-agent systems, Web service choreographies, careflows and business processes.}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/AlbGavLam-IA08.pdf} }

@article{BelRig12-IA-IJ, author = {Elena Bellodi and Fabrizio Riguzzi}, title = { Experimentation of an Expectation Maximization Algorithm for Probabilistic Logic Programs}, year = {2012}, journal = {Intelligenza Artificiale}, publisher = {IOS Press}, copyright = {IOS Press}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/BelRig12-IA-IJ.pdf}, abstract = {Statistical Relational Learning and Probabilistic Inductive Logic Programming are two emerging fields that use representation languages able to combine logic and probability. In the field of Logic Programming, the distribution semantics is one of the prominent approaches for representing uncertainty and underlies many languages such as ICL, PRISM, ProbLog and LPADs. Learning the parameters for such languages requires an Expectation Maximization algorithm since their equivalent Bayesian networks contain hidden variables. EMBLEM (EM over BDDs for probabilistic Logic programs Efficient Mining) is an EM algorithm for languages following the distribution semantics that computes expectations directly on the Binary Decision Diagrams that are built for inference. In this paper we present experiments comparing EMBLEM with LeProbLog, Alchemy, CEM, RIB and LFI-ProbLog on six real world datasets. The results show that EMBLEM is able to solve problems on which the other systems fail and it often achieves significantly higher areas under the Precision Recall and the ROC curves in a similar time.}, keywords = {Statistical Relational Learning, Probabilistic Inductive Logic Programming, Probabilistic Logic Programming, Expectation Maximization, Binary Decision Diagrams, Logic Programs with Annotated Disjunctions }, volume = {8}, number = {1}, pages = {3-18}, doi = {10.3233/IA-2012-0027} }

@article{RigDiM12-ML-IJ, author = {Fabrizio Riguzzi and Di Mauro, Nicola}, title = {Applying the Information Bottleneck to Statistical Relational Learning}, year = {2012}, journal = {Machine Learning}, volume = {86}, number = {1}, pages = {89--114}, note = {The original publication is available at \url{http://www.springerlink.com}}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/RigDiM11-ML-IJ.pdf}, doi = {10.1007/s10994-011-5247-6}, publisher = {Springer}, copyright = {Springer}, address = {Heidelberg, Germany}, abstract = {In this paper we propose to apply the Information Bottleneck (IB) approach to the sub-class of Statistical Relational Learning (SRL) languages that are reducible to Bayesian networks. When the resulting networks involve hidden variables, learning these languages requires the use of techniques for learning from incomplete data such as the Expectation Maximization (EM) algorithm. Recently, the IB approach was shown to be able to avoid some of the local maxima in which EM can get trapped when learning with hidden variables. Here we present the algorithm Relational Information Bottleneck (RIB) that learns the parameters of SRL languages reducible to Bayesian Networks. In particular, we present the specialization of RIB to a language belonging to the family of languages based on the distribution semantics, Logic Programs with Annotated Disjunction (LPADs). This language is prototypical for such a family and its equivalent Bayesian networks contain hidden variables. RIB is evaluated on the IMDB, Cora and artificial datasets and compared with LeProbLog, EM, Alchemy and PRISM. The experimental results show that RIB has good performances especially when some logical atoms are unobserved. Moreover, it is particularly suitable when learning from interpretations that share the same Herbrand base.}, keywords = {Statistical Relational Learning, Probabilistic Inductive Logic Programming, Probabilistic Logic Programming, Information Bottleneck, Logic Programs with Annotated Disjunctions } }

@article{DiMFraEta13-IA-IJ, author = {Nicola Di Mauro and Paolo Frasconi and Fabrizio Angiulli and Davide Bacciu and Marco de Gemmis and Floriana Esposito and Nicola Fanizzi and Stefano Ferilli and Marco Gori and Francesca A. Lisi and Pasquale Lops and Donato Malerba and Alessio Micheli and Marcello Pelillo and Francesco Ricci and Fabrizio Riguzzi and Lorenza Saitta and Giovanni Semeraro}, title = {Italian Machine Learning and Data Mining research: The last years}, journal = {Intelligenza Artificiale}, volume = {7}, number = {2}, year = {2013}, pages = {77-89}, doi = {10.3233/IA-130050}, copyright = {{IOS} Press}, publisher = {{IOS} Press}, abstract = {With the increasing amount of information in electronic form the fields of Machine Learning and Data Mining continue to grow by providing new advances in theory, applications and systems. The aim of this paper is to consider some recent theoretical aspects and approaches to ML and DM with an emphasis on the Italian research.} }

@article{Rig13-FI-IJ, author = {Fabrizio Riguzzi}, title = {{MCINTYRE}: A {Monte Carlo} System for Probabilistic Logic Programming}, journal = {Fundamenta Informaticae}, abstract = {Probabilistic Logic Programming is receiving an increasing attention for its ability to model domains with complex and uncertain relations among entities. In this paper we concentrate on the problem of approximate inference in probabilistic logic programming languages based on the distribution semantics. A successful approximate approach is based on Monte Carlo sampling, that consists in verifying the truth of the query in a normal program sampled from the probabilistic program. The ProbLog system includes such an algorithm and so does the cplint suite. In this paper we propose an approach for Monte Carlo inference that is based on a program transformation that translates a probabilistic program into a normal program to which the query can be posed. The current sample is stored in the internal database of the Yap Prolog engine. The resulting system, called MCINTYRE for Monte Carlo INference wiTh Yap REcord, is evaluated on various problems: biological networks, artificial datasets and a hidden Markov model. MCINTYRE is compared with the Monte Carlo algorithms of ProbLog and and with the exact inference of the PITA system. The results show that MCINTYRE is faster than the other Monte Carlo systems.}, keywords = {Probabilistic Logic Programming, Monte Carlo Methods, Logic Programs with Annotated Disjunctions, ProbLog}, year = {2013}, publisher = {{IOS} Press}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/Rig13-FI-IJ.pdf}, doi = {10.3233/FI-2013-847}, volume = {124}, number = {4}, pages = {521-541}, copyright = {IOS Press} }

@article{BelRig13-IDA-IJ, author = {Elena Bellodi and Fabrizio Riguzzi}, title = { Expectation {Maximization} over Binary Decision Diagrams for Probabilistic Logic Programs}, year = {2013}, volume = {17}, number = {2}, journal = {Intelligent Data Analysis}, publisher = {IOS Press}, copyright = {IOS Press}, pages = {343-363}, doi = {10.3233/IDA-130582}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/BelRig13-IDA-IJ.pdf}, abstract = {Recently much work in Machine Learning has concentrated on using expressive representation languages that combine aspects of logic and probability. A whole field has emerged, called Statistical Relational Learning, rich of successful applications in a variety of domains. In this paper we present a Machine Learning technique targeted to Probabilistic Logic Programs, a family of formalisms where uncertainty is represented using Logic Programming tools. Among various proposals for Probabilistic Logic Programming, the one based on the distribution semantics is gaining popularity and is the basis for languages such as ICL, PRISM, ProbLog and Logic Programs with Annotated Disjunctions. This paper proposes a technique for learning parameters of these languages. Since their equivalent Bayesian networks contain hidden variables, an Expectation Maximization (EM) algorithm is adopted. In order to speed the computation up, expectations are computed directly on the Binary Decision Diagrams that are built for inference. The resulting system, called EMBLEM for ``EM over Bdds for probabilistic Logic programs Efficient Mining'', has been applied to a number of datasets and showed good performances both in terms of speed and memory usage. In particular its speed allows the execution of a high number of restarts, resulting in good quality of the solutions.}, keywords = {Statistical Relational Learning, Probabilistic Inductive Logic Programming, Probabilistic Logic Programs, Logic Programs with Annotated Disjunctions, Expectation Maximization, Binary Decision Diagrams } }

@article{RigSwi13-TPLP-IJ, author = {Fabrizio Riguzzi and Terrance Swift}, title = {Well\--Definedness and Efficient Inference for Probabilistic Logic Programming under the Distribution Semantics }, year = {2013}, month = {March}, journal = {Theory and Practice of Logic Programming}, editor = { Wolfgang Faber and Nicola Leone}, publisher = {Cambridge University Press}, copyright = {Cambridge University Press}, keywords = {Probabilistic Logic Programming, Possibilistic Logic Programming, Tabling, Answer Subsumption, Program Transformation}, abstract = {The distribution semantics is one of the most prominent approaches for the combination of logic programming and probability theory. Many languages follow this semantics, such as Independent Choice Logic, PRISM, pD, Logic Programs with Annotated Disjunctions (LPADs) and ProbLog. When a program contains functions symbols, the distribution semantics is well\--defined only if the set of explanations for a query is finite and so is each explanation. Well\--definedness is usually either explicitly imposed or is achieved by severely limiting the class of allowed programs. In this paper we identify a larger class of programs for which the semantics is well\--defined together with an efficient procedure for computing the probability of queries. Since LPADs offer the most general syntax, we present our results for them, but our results are applicable to all languages under the distribution semantics. We present the algorithm ``Probabilistic Inference with Tabling and Answer subsumption'' (PITA) that computes the probability of queries by transforming a probabilistic program into a normal program and then applying SLG resolution with answer subsumption. PITA has been implemented in XSB and tested on six domains: two with function symbols and four without. The execution times are compared with those of ProbLog, cplint and CVE. PITA was almost always able to solve larger problems in a shorter time, on domains with and without function symbols.}, keywords = {Probabilistic Logic Programming, Tabling, Answer Subsumption, Logic Programs with Annotated Disjunction, Program Transformation}, doi = {10.1017/S1471068411000664}, arxiv = {1110.0631}, pages = {279-302}, volume = {13}, number = {Special Issue 02 - 25th Annual GULP Conference}, scopus = {84874625061}, isi = {000315867300007}, url = {http://arxiv.org/pdf/1110.0631v1} }

@article{RigBelZes14-FAI-IJ, author = {Riguzzi, Fabrizio and Bellodi, Elena and Zese, Riccardo}, title = {A History of Probabilistic Inductive Logic Programming}, journal = {Frontiers in Robotics and AI}, volume = {1}, year = {2014}, number = {6}, url = {http://www.frontiersin.org/computational_intelligence/10.3389/frobt.2014.00006/abstract}, doi = {10.3389/frobt.2014.00006}, issn = {2296-9144}, abstract = {The field of Probabilistic Logic Programming (PLP) has seen significant advances in the last 20?years, with many proposals for languages that combine probability with logic programming. Since the start, the problem of learning probabilistic logic programs has been the focus of much attention. Learning these programs represents a whole subfield of Inductive Logic Programming (ILP). In Probabilistic ILP (PILP), two problems are considered: learning the parameters of a program given the structure (the rules) and learning both the structure and the parameters. Usually, structure learning systems use parameter learning as a subroutine. In this article, we present an overview of PILP and discuss the main results.}, pages = {1-5}, keywords = {logic programming, probabilistic programming, inductive logic programming, probabilistic logic programming, statistical relational learning}, copyright = {by the authors} }

@article{RigSwi14-TOCL-IJ, author = { Fabrizio Riguzzi and Terrance Swift}, title = {Terminating Evaluation of Logic Programs with Finite Three-Valued Models}, journal = {ACM Transactions on Computational Logic}, publisher = {ACM}, copyright = {ACM}, volume = {15}, number = {4}, year = {2014}, doi = {10.1145/2629337}, abstract = { As evaluation methods for logic programs have become more sophisticated, the classes of programs for which termination can be guaranteed have expanded. From the perspective of answer set programs that include function symbols, recent work has identified classes for which grounding routines can terminate either on the entire program [Calimeri et al. 2008] or on suitable queries [Baselice et al. 2009]. From the perspective of tabling, it has long been known that a tabling technique called subgoal abstraction provides good termination properties for definite programs [Tamaki and Sato 1986], and this result was recently extended to stratified programs via the class of bounded term-size programs [Riguzzi and Swift 2013]. In this paper we provide a formal definition of tabling with subgoal abstraction resulting in the SLG SA algorithm. Moreover, we discuss a declarative characterization of the queries and programs for which SLG SA terminates. We call this class strongly bounded term-size programs and show its equivalence to programs with finite wellfounded models. For normal programs strongly bounded term-size programs strictly includes the finitely ground programs of [Calimeri et al. 2008]. SLG SA has an asymptotic complexity on strongly bounded termsize programs equal to the best known and produces a residual program that can be sent to an answer set programming system. Finally, we describe the implementation of subgoal abstraction within the SLG-WAM of XSB and provide performance results.}, keywords = {Logic Programming, Tabled Logic Programming, Termination}, http = {http://dl.acm.org/authorize?N05388}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/RigSwi14-TOCL.pdf}, pages = {32:1--32:38}, month = {September}, issn = {1529-3785}, address = {New York, NY, USA} }

@article{BelLamRig14-ICLP-IJ, author = { Elena Bellodi and Evelina Lamma and Fabrizio Riguzzi and Santos Costa, Vitor and Riccardo Zese}, title = {Lifted Variable Elimination for Probabilistic Logic Programming}, journal = {Theory and Practice of Logic Programming}, publisher = {Cambridge University Press}, copyright = {Cambridge University Press}, number = {Special issue 4-5 - ICLP 2014}, volume = {14}, year = {2014}, pages = {681-695}, doi = {10.1017/S1471068414000283}, pdf = {http://arxiv.org/abs/1405.3218}, keywords = {Probabilistic Logic Programming, Lifted Inference, Variable Elimination, Distribution Semantics, ProbLog, Statistical Relational Artificial Intelligence}, abstract = {Lifted inference has been proposed for various probabilistic logical frameworks in order to compute the probability of queries in a time that depends on the size of the domains of the random variables rather than the number of instances. Even if various authors have underlined its importance for probabilistic logic programming (PLP), lifted inference has been applied up to now only to relational languages outside of logic programming. In this paper we adapt Generalized Counting First Order Variable Elimination (GC-FOVE) to the problem of computing the probability of queries to probabilistic logic programs under the distribution semantics. In particular, we extend the Prolog Factor Language (PFL) to include two new types of factors that are needed for representing ProbLog programs. These factors take into account the existing causal independence relationships among random variables and are managed by the extension to variable elimination proposed by Zhang and Poole for dealing with convergent variables and heterogeneous factors. Two new operators are added to GC-FOVE for treating heterogeneous factors. The resulting algorithm, called LP2 for Lifted Probabilistic Logic Programming, has been implemented by modifying the PFL implementation of GC-FOVE and tested on three benchmarks for lifted inference. A comparison with PITA and ProbLog2 shows the potential of the approach.}, isi = {000343203200019}, scopus = {84904624147} }

@article{Rig14-CJ-IJ, author = {Fabrizio Riguzzi}, title = {Speeding Up Inference for Probabilistic Logic Programs}, journal = { The Computer Journal}, publisher = {Oxford University Press}, copyright = {Oxford University Press}, year = {2014}, volume = {57}, number = {3}, pages = {347-363}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/Rig-CJ13.pdf}, doi = {10.1093/comjnl/bxt096}, abstract = {Probabilistic Logic Programming (PLP) allows to represent domains containing many entities connected by uncertain relations and has many applications in particular in Machine Learning. PITA is a PLP algorithm for computing the probability of queries that exploits tabling, answer subsumption and Binary Decision Diagrams (BDDs). PITA does not impose any restriction on the programs. Other algorithms, such as PRISM, reduce computation time by imposing restrictions on the program, namely that subgoals are independent and that clause bodies are mutually exclusive. Another assumption that simplifies inference is that clause bodies are independent. In this paper we present the algorithms PITA(IND,IND) and PITA(OPT). PITA(IND,IND) assumes that subgoals and clause bodies are independent. PITA(OPT) instead first checks whether these assumptions hold for subprograms and subgoals: if they do, PITA(OPT) uses a simplified calculation, otherwise it resorts to BDDs. Experiments on a number of benchmark datasets show that PITA(IND,IND) is the fastest on datasets respecting the assumptions while PITA(OPT) is a good option when nothing is known about a dataset.}, keywords = {Logic Programming, Probabilistic Logic Programming, Distribution Semantics, Logic Programs with Annotated Disjunctions, PRISM, ProbLog} }

@article{DiMBelRig15-ML-IJ, author = {Di Mauro, Nicola and Elena Bellodi and Fabrizio Riguzzi}, title = {Bandit-Based {Monte-Carlo} Structure Learning of Probabilistic Logic Programs}, journal = {Machine Learning}, publisher = {Springer International Publishing}, copyright = {Springer International Publishing}, year = {2015}, volume = {100}, number = {1}, pages = {127-156}, month = {July}, doi = {10.1007/s10994-015-5510-3}, url = {http://ml.unife.it/wp-content/uploads/Papers/DiMBelRig-ML15.pdf}, keywords = {probabilistic inductive logic programming, statistical relational learning, structure learning, distribution semantics, logic programs with annotated disjunction}, abstract = {Probabilistic Logic Programming can be used to model domains with complex and uncertain relationships among entities. While the problem of learning the parameters of such programs has been considered by various authors, the problem of learning the structure is yet to be explored in depth. In this work we present an approximate search method based on a one-player game approach, called LEMUR. It sees the problem of learning the structure of a probabilistic logic program as a multiarmed bandit problem, relying on the Monte-Carlo tree search UCT algorithm that combines the precision of tree search with the generality of random sampling. LEMUR works by modifying the UCT algorithm in a fashion similar to FUSE, that considers a finite unknown horizon and deals with the problem of having a huge branching factor. The proposed system has been tested on various real-world datasets and has shown good performance with respect to other state of the art statistical relational learning approaches in terms of classification abilities.}, note = {The original publication is available at \url{http://link.springer.com}} }

@article{RigBelLamZes15-SW-IJ, author = {Fabrizio Riguzzi and Elena Bellodi and Evelina Lamma and Riccardo Zese}, title = {Probabilistic Description Logics under the Distribution Semantics}, journal = {Semantic Web - Interoperability, Usability, Applicability}, volume = {6}, number = {5}, pages = {447-501}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/RigBelLamZes-SW14.pdf}, year = {2015}, doi = {10.3233/SW-140154}, abstract = { Representing uncertain information is crucial for modeling real world domains. In this paper we present a technique for the integration of probabilistic information in Description Logics (DLs) that is based on the distribution semantics for probabilistic logic programs. In the resulting approach, that we called DISPONTE, the axioms of a probabilistic knowledge base (KB) can be annotated with a real number between 0 and 1. A probabilistic knowledge base then defines a probability distribution over regular KBs called worlds and the probability of a given query can be obtained from the joint distribution of the worlds and the query by marginalization. We present the algorithm BUNDLE for computing the probability of queries from DISPONTE KBs. The algorithm exploits an underlying DL reasoner, such as Pellet, that is able to return explanations for queries. The explanations are encoded in a Binary Decision Diagram from which the probability of the query is computed. The experimentation of BUNDLE shows that it can handle probabilistic KBs of realistic size. }, keywords = { Probabilistic Ontologies, Probabilistic Description Logics, OWL, Probabilistic Logic Programming, Distribution Semantics} }

@article{BelRig15-TPLP-IJ, author = {Elena Bellodi and Fabrizio Riguzzi}, title = {Structure Learning of Probabilistic Logic Programs by Searching the Clause Space}, journal = {Theory and Practice of Logic Programming}, publisher = {Cambridge University Press}, copyright = {Cambridge University Press}, year = {2015}, volume = {15}, number = {2}, pages = {169-212}, pdf = {http://arxiv.org/abs/1309.2080}, url = {http://journals.cambridge.org/abstract_S1471068413000689}, doi = {10.1017/S1471068413000689}, keywords = {probabilistic inductive logic programming, statistical relational learning, structure learning, distribution semantics, logic programs with annotated disjunction, CP-logic}, abstract = {Learning probabilistic logic programming languages is receiving an increasing attention, and systems are available for learning the parameters (PRISM, LeProbLog, LFI-ProbLog and EMBLEM) or both structure and parameters (SEM-CP-logic and SLIPCASE) of these languages. In this paper we present the algorithm SLIPCOVER for "Structure LearnIng of Probabilistic logic programs by searChing OVER the clause space." It performs a beam search in the space of probabilistic clauses and a greedy search in the space of theories using the log likelihood of the data as the guiding heuristics. To estimate the log likelihood, SLIPCOVER performs Expectation Maximization with EMBLEM. The algorithm has been tested on five real world datasets and compared with SLIPCASE, SEM-CP-logic, Aleph and two algorithms for learning Markov Logic Networks (Learning using Structural Motifs (LSM) and ALEPH++ExactL1). SLIPCOVER achieves higher areas under the precision-recall and receiver operating characteristic curves in most cases.} }

@article{RigBelLam16-SPE-IJ, author = {Fabrizio Riguzzi and Elena Bellodi and Evelina Lamma and Riccardo Zese and Giuseppe Cota}, title = {Probabilistic Logic Programming on the Web}, journal = {Software: Practice and Experience}, publisher = {Wiley}, copyright = {Wiley}, year = {2016}, issn = {1097-024X}, url = {http://ml.unife.it/wp-content/uploads/Papers/RigBelLam-SPE16.pdf}, abstract = { We present the web application "cplint on SWISH", that allows the user to write probabilistic logic programs and compute the probability of queries with just a web browser. The application is based on SWISH, a recently proposed web framework for logic programming. SWISH is based on various features and packages of SWI-Prolog, in particular its web server and its Pengine library, that allow to create remote Prolog engines and to pose queries to them. In order to develop the web application, we started from the PITA system which is included in cplint, a suite of programs for reasoning on Logic Programs with Annotated Disjunctions, by porting PITA to SWI-Prolog. Moreover, we modified the PITA library so that it can be executed in a multi-threading environment. Developing "cplint on SWISH" also required modification of the JavaScript SWISH code that creates and queries Pengines. "cplint on SWISH" includes a number of examples that cover a wide range of domains and provide interesting applications of Probabilistic Logic Programming (PLP). By providing a web interface to cplint we allow users to experiment with PLP without the need to install a system, a procedure which is often complex, error prone and limited mainly to the Linux platform. In this way, we aim to reach out to a wider audience and popularize PLP.}, keywords = { Logic Programming, Probabilistic Logic Programming, Distribution Semantics, Logic Programs with Annotated Disjunctions, Web Applications }, doi = {10.1002/spe.2386}, volume = {46}, number = {10}, pages = {1381-1396}, month = {October}, wos = {WOS:000383624900005}, scopus = {2-s2.0-84951829971} }

@article{Rig16-IJAR-IJ, author = {Fabrizio Riguzzi}, title = {The Distribution Semantics for Normal Programs with Function Symbols}, journal = {International Journal of Approximate Reasoning}, year = {2016}, publisher = {Elsevier}, address = {Amsterdam}, doi = {10.1016/j.ijar.2016.05.005}, volume = {77}, number = {Supplement C}, pages = {1 - 19}, issn = {0888-613X}, month = {October}, url = {http://ml.unife.it/wp-content/uploads/Papers/Rig-IJAR16.pdf}, copyright = {Elsevier}, abstract = {The distribution semantics integrates logic programming and probability theory using a possible worlds approach. Its intuitiveness and simplicity has made it the most widely used semantics for probabilistic logic programming, with successful applications in many domains. When the program has function symbols, the semantics was defined for special cases: either the program has to be definite or the queries must have a finite number of finite explanations. In this paper we show that it is possible to define the semantics for all programs. We also show that this definition coincides with that of Sato and Kameya on positive programs. Moreover, we highlight possible approaches for inference, both exact and approximate. }, keywords = {Distribution Semantics, Function Symbols, ProbLog, Probabilistic Logic Programming }, wos = {WOS:000381164500001}, scopus = {2-s2.0-84973659532} }

@article{BelRigLam16-IDA-IJ, author = {Elena Bellodi and Fabrizio Riguzzi and Evelina Lamma}, title = {Statistical Relational Learning for Workflow Mining}, journal = {Intelligent Data Analysis}, publisher = {IOS Press}, copyright = {IOS Press}, year = {2016}, doi = {10.3233/IDA-160818}, month = {April}, volume = {20}, number = {3}, pages = {515-541}, url = {http://ml.unife.it/wp-content/uploads/Papers/BelRigLam-IDA15.pdf}, keywords = {Workflow Mining, Process Mining, Knowledge-based Process Models, Inductive Logic Programming, Statistical Relational Learning, Business Process Management }, abstract = { The management of business processes can support efficiency improvements in organizations. One of the most interesting problems is the mining and representation of process models in a declarative language. Various recently proposed knowledge-based languages showed advantages over graph-based procedural notations. Moreover, rapid changes of the environment require organizations to check how compliant are new process instances with the deployed models. We present a Statistical Relational Learning approach to Workflow Mining that takes into account both flexibility and uncertainty in real environments. It performs automatic discovery of process models expressed in a probabilistic logic. It uses the existing DPML algorithm for extracting first-order logic constraints from process logs. The constraints are then translated into Markov Logic to learn their weights. Inference on the resulting Markov Logic model allows a probabilistic classification of test traces, by assigning them the probability of being compliant to the model. We applied this approach to three datasets and compared it with DPML alone, five Petri net- and EPC-based process mining algorithms and Tilde. The technique is able to better classify new execution traces, showing higher accuracy and areas under the PR/ROC curves in most cases. }, scopus = {2-s2.0-84969808336}, wos = {WOS:000375005000004} }

@article{RigCotBel17-IJAR-IJ, author = {Fabrizio Riguzzi and Giuseppe Cota and Elena Bellodi and Riccardo Zese }, title = {Causal Inference in {cplint}}, journal = {International Journal of Approximate Reasoning}, year = {2017}, publisher = {Elsevier}, address = {Amsterdam}, copyright = {Elsevier}, doi = {10.1016/j.ijar.2017.09.007}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/RigCotBel-IJAR17.pdf}, abstract = { cplint is a suite of programs for reasoning and learning with Probabilistic Logic Programming languages that follow the distribution semantics. In this paper we describe how we have extended cplint to perform causal reasoning. In particular, we consider Pearl's do calculus for models where all the variables are measured. The two cplint modules for inference, PITA and MCINTYRE, have been extended for computing the effect of actions/interventions on these models. We also executed experiments comparing exact and approximate inference with conditional and causal queries, showing that causal inference is often cheaper than conditional inference. }, keywords = { Probabilistic Logic Programming, Distribution Semantics, Logic Programs with Annotated Disjunctions, ProbLog, Causal Inference, Statistical Relational Artificial Intelligence }, volume = {91}, pages = {216-232}, month = {December}, number = {Supplement C}, issn = {0888-613X}, scopus = {2-s2.0-84992199737}, wos = {WOS:000391080100020} }

@article{AlbBelCot17-IA-IJ, author = {Marco Alberti and Elena Bellodi and Giuseppe Cota and Fabrizio Riguzzi and Riccardo Zese}, title = {\texttt{cplint} on {SWISH}: Probabilistic Logical Inference with a Web Browser}, journal = {Intelligenza Artificiale}, publisher = {IOS Press}, copyright = {IOS Press}, year = {2017}, issn-print = {1724-8035}, issn-online = {2211-0097}, url = {http://ml.unife.it/wp-content/uploads/Papers/AlbBelCot-IA17.pdf}, abstract = { \texttt{cplint} on SWISH is a web application that allows users to perform reasoning tasks on probabilistic logic programs. Both inference and learning systems can be performed: conditional probabilities with exact, rejection sampling and Metropolis-Hasting methods. Moreover, the system now allows hybrid programs, i.e., programs where some of the random variables are continuous. To perform inference on such programs likelihood weighting and particle filtering are used. \texttt{cplint} on SWISH is also able to sample goals' arguments and to graph the results. This paper reports on advances and new features of \texttt{cplint} on SWISH, including the capability of drawing the binary decision diagrams created during the inference processes. }, keywords = { Logic Programming, Probabilistic Logic Programming, Distribution Semantics, Logic Programs with Annotated Disjunctions, Web Applications }, volume = {11}, number = {1}, doi = {10.3233/IA-170106}, pages = {47--64}, wos = {WOS:000399736500004} }

@article{BelLamRig17-SPE-IJ, author = {Elena Bellodi and Evelina Lamma and Fabrizio Riguzzi and Riccardo Zese and Giuseppe Cota}, title = {A web system for reasoning with probabilistic {OWL}}, journal = {Software: Practice and Experience}, publisher = {Wiley}, copyright = {Wiley}, year = {2017}, doi = {10.1002/spe.2410}, issn = {1097-024X}, month = {January}, pages = {125--142}, volume = {47}, number = {1}, scopus = {2-s2.0-84992412060}, url = {http://ml.unife.it/wp-content/uploads/Papers/BelLamRig-SPE16.pdf}, abstract = { We present the web application TRILL on SWISH, which allows the user to write probabilistic Description Logic (DL) theories and compute the probability of queries with just a web browser. Various probabilistic extensions of DLs have been proposed in the recent past, since uncertainty is a fundamental component of the Semantic Web. We consider probabilistic DL theories following our DISPONTE semantics. Axioms of a DISPONTE Knowledge Base (KB) can be annotated with a probability and the probability of queries can be computed with inference algorithms. TRILL is a probabilistic reasoner for DISPONTE KBs that is implemented in Prolog and exploits its backtracking facilities for handling the non-determinism of the tableau algorithm. TRILL on SWISH is based on SWISH, a recently proposed web framework for logic programming, based on various features and packages of SWI-Prolog (e.g., a web server and a library for creating remote Prolog engines and posing queries to them). TRILL on SWISH also allows users to cooperate in writing a probabilistic DL theory. It is free, open, and accessible on the Web at the url: \trillurl; it includes a number of examples that cover a wide range of domains and provide interesting Probabilistic Semantic Web applications. By building a web-based system, we allow users to experiment with Probabilistic DLs without the need to install a complex software stack. In this way we aim to reach out to a wider audience and popularize the Probabilistic Semantic Web. }, keywords = { Semantic Web, Web Applications, Description Logics, Probabilistic Description Logics, SWI-Prolog, Logic Programming } }

@article{RigBelZes17-IJAR-IJ, author = {Fabrizio Riguzzi and Elena Bellodi and Riccardo Zese and Giuseppe Cota and Evelina Lamma }, title = {A Survey of Lifted Inference Approaches for Probabilistic Logic Programming under the Distribution Semantics}, journal = {International Journal of Approximate Reasoning}, year = {2017}, publisher = {Elsevier}, address = {Amsterdam}, copyright = {Elsevier}, doi = {10.1016/j.ijar.2016.10.002}, url = {http://ml.unife.it/wp-content/uploads/Papers/RigBelZes-IJAR17.pdf}, volume = {80}, number = {Supplement C}, issn = {0888-613X}, pages = {313--333}, month = {January}, abstract = { Lifted inference aims at answering queries from statistical relational models by reasoning on populations of individuals as a whole instead of considering each individual singularly. Since the initial proposal by David Poole in 2003, many lifted inference techniques have appeared, by lifting different algorithms or using approximation involving different kinds of models, including parfactor graphs and Markov Logic Networks. Very recently lifted inference was applied to Probabilistic Logic Programming (PLP) under the distribution semantics, with proposals such as LP2 and Weighted First-Order Model Counting (WFOMC). Moreover, techniques for dealing with aggregation parfactors can be directly applied to PLP. In this paper we survey these approaches and present an experimental comparison on five models. The results show that WFOMC outperforms the other approaches, being able to exploit more symmetries. }, keywords = {Probabilistic Logic Programming, Lifted Inference, Variable Elimination, Distribution Semantics, ProbLog, Statistical Relational Artificial Intelligence }, scopus = {2-s2.0-84992199737}, wos = {WOS:000391080100020} }

@article{ZesBelRig18-AMAI-IJ, author = {Riccardo Zese and Elena Bellodi and Fabrizio Riguzzi and Giuseppe Cota and Evelina Lamma }, title = {Tableau Reasoning for Description Logics and its Extension to Probabilities}, journal = {Annals of Mathematics and Artificial Intelligence}, publisher = {Springer}, copyright = {Springer}, year = {2018}, issn-print = {1012-2443}, issn-online = {1573-7470}, url = {http://ml.unife.it/wp-content/uploads/Papers/ZesBelRig-AMAI16.pdf}, pdf = {http://rdcu.be/kONG}, month = {March}, day = {01}, volume = {82}, number = {1}, pages = {101--130}, doi = {10.1007/s10472-016-9529-3}, abstract = { The increasing popularity of the Semantic Web drove to a wide- spread adoption of Description Logics (DLs) for modeling real world domains. To help the diffusion of DLs, a large number of reasoning algorithms have been developed. Usually these algorithms are implemented in procedural languages such as Java or C++. Most of the reasoners exploit the tableau algorithm which features non-determinism, that is not easily handled by those languages. Prolog directly manages non-determinism, thus is a good candidate for dealing with the tableau's non-deterministic expansion rules. We present TRILL, for "Tableau Reasoner for descrIption Logics in pro- Log", that implements a tableau algorithm and is able to return explanations for queries and their corresponding probability, and TRILLP , for "TRILL powered by Pinpointing formulas", which is able to compute a Boolean for- mula representing the set of explanations for a query. Reasoning on real world domains also requires the capability of managing probabilistic and uncertain information. We show how TRILL and TRILLP can be used to compute the probability of queries to knowledge bases following DISPONTE semantics. Experiments comparing these with other systems show the feasibility of the approach.}, keywords = { Description Logics, Tableau, Prolog, Semantic Web}, scopus = {2-s2.0-84990986085} }

@article{GavLam18-FI-IJ, author = {Gavanelli, Marco and Lamma, Evelina and Riguzzi, Fabrizio and Bellodi, Elena and Zese, Riccardo and Cota, Giuseppe}, title = {Reasoning on Datalog+- Ontologies with Abductive Logic Programming}, year = {2018}, journal = {Fundamenta Informaticae}, copyright = {IOS Press}, volume = {159}, doi = {10.3233/FI-2018-1658}, pages = {65--93}, pdf = {http://ml.unife.it/wp-content/uploads/Papers/GavLam-FI18.pdf}, scopus = {2-s2.0-85043572529} }

@article{AzzRigLam19-Info-IJ, author = {Damiano Azzolini and Fabrizio Riguzzi and Evelina Lamma}, title = {Studying Transaction Fees in the Bitcoin Blockchain with Probabilistic Logic Programming}, journal = {Information}, publisher = {MDPI}, copyright = {CCBY}, year = {2019}, pdf = {https://www.mdpi.com/2078-2489/10/11/335/pdf}, doi = {10.3390/info10110335}, abstract = { In Bitcoin, if a miner is able to solve a computationally hard problem called proof of work, it will receive an amount of bitcoin as a reward which is the sum of the fees for the transactions included in a block plus an amount inversely proportional to the number of blocks discovered so far. At the moment of writing, the block reward is several orders of magnitude greater than the sum of transaction fees. Usually, miners try to collect the largest reward by including transactions associated with high fees. The main purpose of transaction fees is to prevent network spamming. However, they are also used to prioritize transactions. In order to use the minimum amount of fees, users usually have to find a compromise between fees and urgency of a transaction. In this paper, we develop a probabilistic logic model to experimentally analyze how fees affect confirmation time and miner's revenue and to predict if an increase of average fees will generate a situation when the miner gets more reward by not following the protocol.}, keywords = { bitcoin, blockchain, probabilistic logic programming }, address = {Basel, Switzerland}, volume = {10}, number = {11}, pages = {335} }

@article{NguRig19-ML-IJ, author = {Nguembang Fadja, Arnaud and Fabrizio Riguzzi}, title = {Lifted Discriminative Learning of Probabilistic Logic Programs}, journal = {Machine Learning}, publisher = {Springer}, copyright = {Springer}, year = {2019}, doi = {10.1007/s10994-018-5750-0}, abstract = { Probabilistic logic programming (PLP) provides a powerful tool for reason- ing with uncertain relational models. However, learning probabilistic logic programs is expensive due to the high cost of inference. Among the proposals to overcome this problem, one of the most promising is lifted inference. In this paper we consider PLP models that are amenable to lifted inference and present an algorithm for performing parameter and structure learning of these models from positive and negative exam- ples. We discuss parameter learning with EM and LBFGS and structure learning with LIFTCOVER, an algorithm similar to SLIPCOVER. The results of the comparison of LIFTCOVER with SLIPCOVER on 12 datasets show that it can achieve solutions of similar or better quality in a fraction of the time. }, keywords = { Statistical Relational Learning, Probabilistic Inductive Logic Program- ming, Probabilistic Logic Programming, Lifted Inference, Expectation Maximization }, scopus = {2-s2.0-85052570852}, volume = {108}, number = {7}, pages = {1111--1135} }

@article{ZesBelCot19-TPLP-IJ, title = {Probabilistic {DL} Reasoning with Pinpointing Formulas: A Prolog-based Approach}, doi = {10.1017/S1471068418000480}, journal = {Theory and Practice of Logic Programming}, publisher = {Cambridge University Press}, copyright = {Cambridge University Press}, author = {Zese, Riccardo and Cota, Giuseppe and Lamma, Evelina and Bellodi, Elena and Riguzzi, Fabrizio}, pages = {449--476}, year = {2019}, volume = {19}, number = {3}, pdf = {https://arxiv.org/pdf/1809.06180.pdf}, scopus = {2-s2.0-85060024345}, doi = {10.1017/S1471068418000480} }

@article{WieRigKow19-TPLP-IJ, author = { Jan Wielemaker and Fabrizio Riguzzi and Bob Kowalski and Torbj\"orn Lager and Fariba Sadri and Miguel Calejo }, title = {Using {SWISH} to realise interactive web based tutorials for logic based languages }, journal = {Theory and Practice of Logic Programming}, year = {2019}, volume = {19}, doi = {10.1017/S1471068418000522}, number = {2}, publisher = {Cambridge University Press}, copyright = {Cambridge University Press}, pages = {229-261}, pdf = {https://arxiv.org/pdf/1808.08042.pdf}, abstrac = {Programming environments have evolved from purely text based to using graphical user interfaces, and now we see a move toward web-based interfaces, such as Jupyter. Web-based interfaces allow for the creation of interactive documents that consist of text and programs, as well as their output. The output can be rendered using web technology as, for example, text, tables, charts, or graphs. This approach is particularly suitable for capturing data analysis workflows and creating interactive educational material. This article describes SWISH, a web front-end for Prolog that consists of a web server implemented in SWI-Prolog and a client web application written in JavaScript. SWISH provides a web server where multiple users can manipulate and run the same material, and it can be adapted to support Prolog extensions. In this article we describe the architecture of SWISH, and describe two case studies of extensions of Prolog, namely Probabilistic Logic Programming and Logic Production System, which have used SWISH to provide tutorial sites.}, keywords = {Prolog, logic programming system, notebook interface, web}, scopus = {2-s2.0-85061599946} }

@article{AlbGavLam20-FI-IJ, author = {Marco Alberti and Marco Gavanelli and Evelina Lamma and Fabrizio Riguzzi and Ken Satoh and Riccardo Zese}, title = {Dischargeable Obligations in the {SCIFF} Framework}, journal = {Fundamenta Informaticae}, volume = {176}, number = {3-4}, pages = {321--348}, year = {2020}, doi = {10.3233/FI-2020-1976}, publisher = {IOS Press} }

@article{CheCotGavLamMelRig20-EAAI-IJ, author = {Federico Chesani and Giuseppe Cota and Marco Gavanelli and Evelina Lamma and Paola Mello and Fabrizio Riguzzi}, title = {Declarative and Mathematical Programming approaches to Decision Support Systems for food recycling}, journal = {Engineering Applications of Artificial Intelligence}, volume = {95}, pages = {103861}, year = {2020}, doi = {10.1016/j.engappai.2020.103861}, scopus = {2-s2.0-85089188550} }

@article{BelAlbRig20-TPLP-IJ, author = {Elena Bellodi and Marco Alberti and Fabrizio Riguzzi and Riccardo Zese}, title = {{MAP} Inference for Probabilistic Logic Programming}, journal = {Theory and Practice of Logic Programming}, publisher = {Cambridge University Press}, copyright = {Cambridge University Press}, year = {2020}, url = {https://arxiv.org/abs/2008.01394}, volume = {20}, doi = {10.1017/S1471068420000174}, pdf = {https://arxiv.org/pdf/2008.01394.pdf}, number = {5}, pages = {641--655} }

@article{NguRigBerTru2021-BioDM-IJ, abstract = {With the increase in the size of genomic datasets describing variability in populations, extracting relevant information becomes increasingly useful as well as complex. Recently, computational methodologies such as Supervised Machine Learning and specifically Convolutional Neural Networks have been proposed to make inferences on demographic and adaptive processes using genomic data. Even though it was already shown to be powerful and efficient in different fields of investigation, Supervised Machine Learning has still to be explored as to unfold its enormous potential in evolutionary genomics.}, author = {Nguembang Fadja, Arnaud and Riguzzi, Fabrizio and Bertorelle, Giorgio and Trucchi, Emiliano}, doi = {10.1186/s13040-021-00280-9}, isbn = {1756-0381}, journal = {BioData Mining}, number = {1}, pages = {51}, title = {Identification of natural selection in genomic data with deep convolutional neural network}, volume = {14}, year = {2021} }

@article{FraLamRig21-ML-IJ, title = {Symbolic {DNN-Tuner}}, author = {Michele Fraccaroli and Evelina Lamma and Fabrizio Riguzzi}, journal = {Machine Learning}, publisher = {Springer}, copyright = {Springer}, year = {2021}, abstract = {Hyper-Parameter Optimization (HPO) occupies a fundamental role in Deep Learning systems due to the number of hyper-parameters (HPs) to be set. The state-of-the-art of HPO methods are Grid Search, Random Search and Bayesian Optimization. The rst two methods try all possible combinations and random combination of the HPs values, respectively. This is performed in a blind manner, without any information for choosing the new set of HPs val- ues. Bayesian Optimization (BO), instead, keeps track of past results and uses them to build a probabilistic model mapping HPs into a probability density of the objective function. Bayesian Optimization builds a surrogate probabilistic model of the objective function, nds the HPs values that perform best on the surrogate model and updates it with new results. In this paper, we improve BO applied to Deep Neural Network (DNN) by adding an analysis of the results of the network on training and validation sets. This analysis is performed by exploiting rule-based programming, and in particular by using Probabilistic Logic Programming. The resulting system, called Symbolic DNN-Tuner, logi- cally evaluates the results obtained from the training and the validation phase and, by applying symbolic tuning rules, xes the network architecture, and its HPs, therefore improving performance. We also show the e ectiveness of the proposed approach, by an experimental evaluation on literature and real-life datasets.}, keywords = {Deep Learning Hyper-Parameter Optimization Probabilistic Logic Programming}, doi = {10.1007/s10994-021-06097-1}, isbn = {1573-0565} }

@article{NguRigLam21-ML-IJ, author = {Nguembang Fadja, Arnaud and Fabrizio Riguzzi and Evelina Lamma}, title = {Learning Hierarchical Probabilistic Logic Programs}, journal = {Machine Learning}, publisher = {Springer}, copyright = {Springer}, year = {2021}, doi = {10.1007/s10994-021-06016-4}, url = {https://link.springer.com/content/pdf/10.1007/s10994-021-06016-4.pdf}, abstract = { Probabilistic logic programming (PLP) combines logic programs and probabilities. Due to its expressiveness and simplicity, it has been considered as a powerful tool for learning and reasoning in relational domains characterized by uncertainty. Still, learning the parameter and the structure of general PLP is computationally expensive due to the inference cost. We have recently proposed a restriction of the general PLP language called hierarchical PLP (HPLP) in which clauses and predicates are hierarchically organized. HPLPs can be converted into arithmetic circuits or deep neural networks and inference is much cheaper than for general PLP. In this paper we present algorithms for learning both the parameters and the structure of HPLPs from data. We first present an algorithm, called parameter learning for hierarchical probabilistic logic programs (PHIL) which performs parameter estimation of HPLPs using gradient descent and expectation maximization. We also propose structure learning of hierarchical probabilistic logic programming (SLEAHP), that learns both the structure and the parameters of HPLPs from data. Experiments were performed comparing PHIL and SLEAHP with PLP and Markov Logic Networks state-of-the art systems for parameter and structure learning respectively. PHIL was compared with EMBLEM, ProbLog2 and Tuffy and SLEAHP with SLIPCOVER, PROBFOIL+, MLB-BC, MLN-BT and RDN-B. The experiments on five well known datasets show that our algorithms achieve similar and often better accuracies but in a shorter time. }, keywords = {Probabilistic Logic Programming, Distribution Semantics, Arithmetic Circuits, Gradient Descent, Back-propagation}, address = {Berlin, Germany}, scopus = {2-s2.0-85107994928}, volume = {110}, number = {7}, pages = {1637--1693}, isbn = {1573-0565} }

@article{AzzRig21-ICLP-IJ, title = {Optimizing Probabilities in Probabilistic Logic Programs}, doi = {10.1017/S1471068421000260}, journal = {Theory and Practice of Logic Programming}, publisher = {Cambridge University Press}, copyright = {Cambridge University Press}, author = {Azzolini, Damiano and Riguzzi, Fabrizio}, year = {2021}, volume = {21}, number = {5}, pages = {543--556}, url = {https://arxiv.org/pdf/2108.03095}, pdf = {https://arxiv.org/pdf/2108.03095.pdf} }

@article{AzzRigLam21-AIJ-IJ, title = {A Semantics for Hybrid Probabilistic Logic Programs with Function Symbols}, author = {Azzolini, Damiano and Riguzzi, Fabrizio and Lamma, Evelina}, journal = {Artificial Intelligence}, year = {2021}, copyright = {Elsevier}, issn = {0004-3702}, url = {http://ml.unife.it/wp-content/uploads/Papers/AzzRigLam21-AIJ-IJ.pdf}, doi = {10.1016/j.artint.2021.103452}, note = {The final publication is available at Elsevier via \url{https://doi.org/10.1016/j.artint.2021.103452} }, volume = {294}, pages = {103452} }

@article{LosVen21-JEGTP-IJ, author = {Losi, Enzo and Venturini, Mauro and Manservigi, Lucrezia and Ceschini, Giuseppe Fabio and Bechini, Giovanni and Cota, Giuseppe and Riguzzi, Fabrizio}, title = {Structured Methodology for Clustering Gas Turbine Transients by means of Multi-variate Time Series}, year = {2021}, publisher = {ASME}, journal = {Journal of Engineering for Gas Turbines and Power}, volume = {143}, number = {3}, pages = {031014-1 (13 pages)}, doi = {10.1115/1.4049503} }

@article{RigBelZesAlbLam21-ML-IJ, author = {Riguzzi, Fabrizio and Bellodi, Elena and Zese, Riccardo and Alberti, Marco and Lamma, Evelina}, title = {Probabilistic inductive constraint logic}, journal = {Machine Learning}, year = {2021}, volume = {110}, issue = {4}, pages = {723-754}, doi = {10.1007/s10994-020-05911-6}, pdf = {https://link.springer.com/content/pdf/10.1007/s10994-020-05911-6.pdf}, publisher = {Springer}, issn = {08856125}, abstract = {Probabilistic logical models deal effectively with uncertain relations and entities typical of many real world domains. In the field of probabilistic logic programming usually the aim is to learn these kinds of models to predict specific atoms or predicates of the domain, called target atoms/predicates. However, it might also be useful to learn classifiers for interpretations as a whole: to this end, we consider the models produced by the inductive constraint logic system, represented by sets of integrity constraints, and we propose a probabilistic version of them. Each integrity constraint is annotated with a probability, and the resulting probabilistic logical constraint model assigns a probability of being positive to interpretations. To learn both the structure and the parameters of such probabilistic models we propose the system PASCAL for “probabilistic inductive constraint logic”. Parameter learning can be performed using gradient descent or L-BFGS. PASCAL has been tested on 11 datasets and compared with a few statistical relational systems and a system that builds relational decision trees (TILDE): we demonstrate that this system achieves better or comparable results in terms of area under the precision–recall and receiver operating characteristic curves, in a comparable execution time.} }

@article{BelAlbRig21-TPLP-IJ, author = {Elena Bellodi and Marco Gavanelli and Riccardo Zese and Evelina Lamma and Fabrizio Riguzzi}, title = {Nonground Abductive Logic Programming with Probabilistic Integrity Constraints}, journal = {Theory and Practice of Logic Programming}, publisher = {Cambridge University Press}, copyright = {Cambridge University Press}, year = {2021}, url = {https://arxiv.org/abs/2108.03033}, volume = {21}, doi = {10.1017/S1471068421000417}, pdf = {https://arxiv.org/pdf/2108.03033.pdf}, number = {5}, pages = {557--574} }

@unpublished{RigMyk22-SSRN-IJ, author = {Riguzzi, Fabrizio and Mykhailova, Mariia}, title = {Quantum Algorithms for {WMC}, {MPE} and {MAP}}, note = {Available at SSRN}, url = {https://ssrn.com/abstract=4169880} }

@article{RocChiNal2022-APPSCI-IJ, author = {Rocchi, Alessandro and Chiozzi, Andrea and Nale, Marco and Nikolic, Zeljana and Riguzzi, Fabrizio and Mantovan, Luana and Gilli, Alessandro and Benvenuti, Elena}, title = {A Machine Learning Framework for Multi-Hazard Risk Assessment at the Regional Scale in Earthquake and Flood-Prone Areas}, journal = {Applied Sciences}, volume = {12}, year = {2022}, number = {2}, article-number = {583}, url = {https://www.mdpi.com/2076-3417/12/2/583}, issn = {2076-3417}, abstract = {Communities are confronted with the rapidly growing impact of disasters, due to many factors that cause an increase in the vulnerability of society combined with an increase in hazardous events such as earthquakes and floods. The possible impacts of such events are large, also in developed countries, and governments and stakeholders must adopt risk reduction strategies at different levels of management stages of the communities. This study is aimed at proposing a sound qualitative multi-hazard risk analysis methodology for the assessment of combined seismic and hydraulic risk at the regional scale, which can assist governments and stakeholders in decision making and prioritization of interventions. The method is based on the use of machine learning techniques to aggregate large datasets made of many variables different in nature each of which carries information related to specific risk components and clusterize observations. The framework is applied to the case study of the Emilia Romagna region, for which the different municipalities are grouped into four homogeneous clusters ranked in terms of relative levels of combined risk. The proposed approach proves to be robust and delivers a very useful tool for hazard management and disaster mitigation, particularly for multi-hazard modeling at the regional scale.}, doi = {10.3390/app12020583} }

@article{AzzBellFer2022-IJAR-IJ, title = {Abduction with probabilistic logic programming under the distribution semantics}, journal = {International Journal of Approximate Reasoning}, volume = {142}, pages = {41-63}, year = {2022}, issn = {0888-613X}, doi = {10.1016/j.ijar.2021.11.003}, url = {https://www.sciencedirect.com/science/article/pii/S0888613X2100181X}, author = {Damiano Azzolini and Elena Bellodi and Stefano Ferilli and Fabrizio Riguzzi and Riccardo Zese}, keywords = {Abduction, Distribution semantics, Probabilistic logic programming, Statistical relational artificial intelligence}, abstract = {In Probabilistic Abductive Logic Programming we are given a probabilistic logic program, a set of abducible facts, and a set of constraints. Inference in probabilistic abductive logic programs aims to find a subset of the abducible facts that is compatible with the constraints and that maximizes the joint probability of the query and the constraints. In this paper, we extend the PITA reasoner with an algorithm to perform abduction on probabilistic abductive logic programs exploiting Binary Decision Diagrams. Tests on several synthetic datasets show the effectiveness of our approach.}, scopus = {2-s2.0-85119493622} }

@article{FraLamRig2022-SwX-IJ, title = {Symbolic {DNN-Tuner}: A {Python} and {ProbLog}-based system for optimizing Deep Neural Networks hyperparameters}, journal = {SoftwareX}, volume = {17}, pages = {100957}, year = {2022}, issn = {2352-7110}, doi = {10.1016/j.softx.2021.100957}, url = {https://www.sciencedirect.com/science/article/pii/S2352711021001825}, author = {Michele Fraccaroli and Evelina Lamma and Fabrizio Riguzzi}, keywords = {Deep learning, Probabilistic Logic Programming, Hyper-parameters tuning, Neural-symbolic integration}, abstract = {The application of deep learning models to increasingly complex contexts has led to a rise in the complexity of the models themselves. Due to this, there is an increase in the number of hyper-parameters (HPs) to be set and Hyper-Parameter Optimization (HPO) algorithms occupy a fundamental role in deep learning. Bayesian Optimization (BO) is the state-of-the-art of HPO for deep learning models. BO keeps track of past results and uses them to build a probabilistic model, building a probability density of HPs. This work aims to improve BO applied to Deep Neural Networks (DNNs) by an analysis of the results of the network on training and validation sets. This analysis is obtained by applying symbolic tuning rules, implemented in Probabilistic Logic Programming (PLP). The resulting system, called Symbolic DNN-Tuner, logically evaluates the results obtained from the training and the validation phase and, by applying symbolic tuning rules, fixes the network architecture, and its HPs, leading to improved performance. In this paper, we present the general system and its implementation. We also show its graphical interface and a simple example of execution.} }

@article{LosVen22-JEGTP-IJ, author = {Losi, Enzo and Venturini, Mauro and Manservigi, Lucrezia and Ceschini, Giuseppe Fabio and Bechini, Giovanni and Cota, Giuseppe and Riguzzi, Fabrizio}, title = {Prediction of Gas Turbine Trip: A Novel Methodology Based on Random Forest Models}, journal = {Journal of Engineering for Gas Turbines and Power}, volume = {144}, number = {3}, year = {2022}, issn = {0742-4795}, doi = {10.1115/1.4053194}, publisher = asme_p, note = {{GTP-21-1324}} }

@article{AzzRig2022-CRYPT-IJ, author = {Azzolini, Damiano and Riguzzi, Fabrizio}, title = {Probabilistic Logic Models for the Lightning Network}, journal = {Cryptography}, volume = {6}, year = {2022}, number = {2}, article-number = {29}, url = {https://www.mdpi.com/2410-387X/6/2/29}, pdf = {https://www.mdpi.com/2410-387X/6/2/29/pdf?version=1655360685}, issn = {2410-387X}, doi = {10.3390/cryptography6020029} }

@article{AzzRig23-IJAR-IJ, title = {Lifted Inference for Statistical Statements in Probabilistic Answer Set Programming}, author = {Damiano Azzolini and Fabrizio Riguzzi}, journal = {International Journal of Approximate Reasoning}, year = {2023}, doi = {10.1016/j.ijar.2023.109040}, pages = {109040}, volume = {163}, issn = {0888-613X}, url = {https://www.sciencedirect.com/science/article/pii/S0888613X23001718}, keywords = {Statistical statements, Probabilistic answer set programming, Lifted inference}, abstract = {In 1990, Halpern proposed the distinction between Type 1 and Type 2 statements: the former express statistical information about a domain of interest while the latter define a degree of belief. An example of Type 1 statement is “30% of the elements of a domain share the same property” while an example of Type 2 statement is “the element x has the property y with probability p”. Recently, Type 1 statements were given an interpretation in terms of probabilistic answer set programs under the credal semantics in the PASTA framework. The algorithm proposed for inference requires the enumeration of all the answer sets of a given program, and so it is impractical for domains of not trivial size. The field of lifted inference aims to identify programs where inference can be computed without grounding the program. In this paper, we identify some classes of PASTA programs for which we apply lifted inference and develop compact formulas to compute the probability bounds of a query without the need to generate all the possible answer sets.}, scopus = {2-s2.0-85174067981} }

@article{SchVDBRig23-TPLP-IJ, title = {Automatic Differentiation in Prolog}, doi = {10.1017/S1471068423000145}, journal = {Theory and Practice of Logic Programming}, publisher = {Cambridge University Press}, author = {Schrijvers, Tom and Van Den Berg, Birthe and Riguzzi, Fabrizio}, year = {2023}, pages = {900–917}, volume = {23}, number = {4}, pdf = {https://arxiv.org/pdf/2305.07878.pdf} }

@article{GreSalFab23-Biomed-IJ, author = {Greco, Salvatore and Salatiello, Alessandro and Fabbri, Nicolò and Riguzzi, Fabrizio and Locorotondo, Emanuele and Spaggiari, Riccardo and De Giorgi, Alfredo and Passaro, Angelina}, title = {Rapid Assessment of {COVID-19} Mortality Risk with {GASS} Classifiers}, journal = {Biomedicines}, volume = {11}, year = {2023}, number = {3}, article-number = {831}, url = {https://www.mdpi.com/2227-9059/11/3/831}, issn = {2227-9059}, abstract = {Risk prediction models are fundamental to effectively triage incoming COVID-19 patients. However, current triaging methods often have poor predictive performance, are based on variables that are expensive to measure, and often lead to hard-to-interpret decisions. We introduce two new classification methods that can predict COVID-19 mortality risk from the automatic analysis of routine clinical variables with high accuracy and interpretability. SVM22-GASS and Clinical-GASS classifiers leverage machine learning methods and clinical expertise, respectively. Both were developed using a derivation cohort of 499 patients from the first wave of the pandemic and were validated with an independent validation cohort of 250 patients from the second pandemic phase. The Clinical-GASS classifier is a threshold-based classifier that leverages the General Assessment of SARS-CoV-2 Severity (GASS) score, a COVID-19-specific clinical score that recently showed its effectiveness in predicting the COVID-19 mortality risk. The SVM22-GASS model is a binary classifier that non-linearly processes clinical data using a Support Vector Machine (SVM). In this study, we show that SMV22-GASS was able to predict the mortality risk of the validation cohort with an AUC of 0.87 and an accuracy of 0.88, better than most scores previously developed. Similarly, the Clinical-GASS classifier predicted the mortality risk of the validation cohort with an AUC of 0.77 and an accuracy of 0.78, on par with other established and emerging machine-learning-based methods. Our results demonstrate the feasibility of accurate COVID-19 mortality risk prediction using only routine clinical variables, readily collected in the early stages of hospital admission.}, doi = {10.3390/biomedicines11030831} }

@article{Rig23-JCS-IJ, article_type = {journal}, title = {Machine Learning Approaches for the Prediction of Gas Turbine Transients}, author = {Fadja, Arnaud Nguembang and Cota, Giuseppe and Bertasi, Francesco and Riguzzi, Fabrizio and Losi, Enzo and Manservigi, Lucrezia and Venturini, Mauro and Bechini, Giovanni}, volume = {20}, number = {5}, year = {2024}, month = {Feb}, pages = {495-510}, doi = {10.3844/jcssp.2024.495.510}, url = {https://thescipub.com/abstract/jcssp.2024.495.510}, abstract = {Gas Turbine (GT) emergency shutdowns can lead to energy production interruption and may also reduce the lifespan of a turbine. In order to remain competitive in the market, it is necessary to improve the reliability and availability of GTs by developing predictive maintenance systems that are able to predict future conditions of GTs within a certain time. Predicting such situations not only helps to take corrective measures to avoid service unavailability but also eases the process of maintenance and considerably reduces maintenance costs. Huge amounts of sensor data are collected from (GTs) making monitoring impossible for human operators even with the help of computers. Machine learning techniques could provide support for handling large amounts of sensor data and building decision models for predicting GT future conditions. The paper presents an application of machine learning based on decision trees and k-nearest neighbors for predicting the rotational speed of gas turbines. The aim is to distinguish steady states (e.g., GT operation at normal conditions) from transients (e.g., GT trip or shutdown). The different steps of a machine learning pipeline, starting from data extraction to model testing are implemented and analyzed. Experiments are performed by applying decision trees, extremely randomized trees, and k-nearest neighbors to sensor data collected from GTs located in different countries. The trained models were able to predict steady state and transient with more than 93% accuracy. This research advances predictive maintenance methods and suggests exploring advanced machine learning algorithms, real-time data integration, and explainable AI techniques to enhance gas turbine behavior understanding and develop more adaptable maintenance systems for industrial applications.}, journal = {Journal of Computer Science}, publisher = {Science Publications} }

*This file was generated by
bibtex2html 1.98.*