Snippet of code
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 | /* * Copyright or © or Copr. Ecole des Mines d'Alès (2012-2014) * * This software is a computer program whose purpose is to provide * several functionalities for the processing of semantic data * sources such as ontologies or text corpora. * * This software is governed by the CeCILL license under French law and * abiding by the rules of distribution of free software. You can use, * modify and/ or redistribute the software under the terms of the CeCILL * license as circulated by CEA, CNRS and INRIA at the following URL * * As a counterpart to the access to the source code and rights to copy, * modify and redistribute granted by the license, users are provided only * with a limited warranty and the software's author, the holder of the * economic rights, and the successive licensors have only limited * liability. * In this respect, the user's attention is drawn to the risks associated * with loading, using, modifying and/or developing or reproducing the * software by the user in light of its specific status of free software, * that may mean that it is complicated to manipulate, and that also * therefore means that it is reserved for developers and experienced * professionals having in-depth computer knowledge. Users are therefore * encouraged to load and test the software's suitability as regards their * requirements in conditions enabling the security of their systems and/or * data to be ensured and, more generally, to use and operate it in the * same conditions as regards security. * * The fact that you are presently reading this means that you have had * knowledge of the CeCILL license and that you accept its terms. */ package slib.examples.sml.go; import org.openrdf.model.URI; import slib.graph.algo.utils.GraphActionExecutor; import slib.graph.algo.utils.GAction; import slib.graph.algo.utils.GActionType; import slib.graph.io.conf.GDataConf; import slib.graph.io.loader.GraphLoaderGeneric; import slib.graph.io.util.GFormat; import slib.graph.model.graph.G; import slib.graph.model.impl.graph.memory.GraphMemory; import slib.graph.model.impl.repo.URIFactoryMemory; import slib.graph.model.repo.URIFactory; import slib.sml.sm.core.metrics.ic.utils.IC_Conf_Topo; import slib.sml.sm.core.metrics.ic.utils.ICconf; import slib.sml.sm.core.utils.SMConstants; import slib.sml.sm.core.engine.SM_Engine; import slib.sml.sm.core.utils.SMconf; import slib.utils.ex.SLIB_Exception; /** * * Example of a Semantic measure computation using the Semantic Measures * Library. In this snippet we estimate the similarity of two concepts expressed * in the Gene Ontology. The Gene Ontology is expressed in OBO format. The * similarity is estimated using Lin's measure. * * More information at http://www.semantic-measures-library.org/ * * Note that you can set the LOG level in specified in log4j.xml, e.g. in root * element, change value="INFO" to value="DEBUG" * * @author Sébastien Harispe <sebastien.harispe@gmail.com> */ public class SMComputationGO_pairwise { public static void main(String[] params) throws SLIB_Exception { // Configuration files, set the file path according to your configuration. // The Gene Ontology (OBO format) String goOBO = "/data/go/gene_ontology_ext.obo" ; URIFactory factory = URIFactoryMemory.getSingleton(); // We define a prefix in order to build valid uris from ids such as GO:XXXXX, // considering the configuration specified below the URI associated to GO:XXXXX will be http://go/XXXXX factory.loadNamespacePrefix( "GO" , graph_uri.toString()); G graph = new GraphMemory(graph_uri); GDataConf graphconf = new GDataConf(GFormat.OBO, goOBO); GraphLoaderGeneric.populate(graphconf, graph); // General information about the graph System.out.println(graph.toString()); // The Gene Ontology is not rooted, i.e. Molecular Function, Biological Process, Cellular Component, the three sub-ontologies of // the GO are not rooted. We create such a virtual root in order to be able to compare // the concepts expressed in different sub-ontologies. // We create a vertex corresponding to the virtual root // and we add it to the graph graph.addV(virtualRoot); // We root the graphs using the virtual root as root GAction rooting = new GAction(GActionType.REROOTING); rooting.addParameter( "root_uri" , virtualRoot.stringValue()); GraphActionExecutor.applyAction(factory, rooting, graph); System.out.println(graph.toString()); int nbVertices = graph.getV().size(); System.out.println( "Nb vertices : " + nbVertices); // We compute the similarity between http://go/0071869 and the collection of vertices ICconf icConf = new IC_Conf_Topo( "Sanchez" , SMConstants.FLAG_ICI_SANCHEZ_2011); // Then we define the Semantic measure configuration SMconf smConf = new SMconf( "Lin" , SMConstants.FLAG_SIM_PAIRWISE_DAG_NODE_LIN_1998); smConf.setICconf(icConf); SM_Engine engine = new SM_Engine(graph); double sim; for (URI v : graph.getV()) { sim = engine.compare(smConf, concept, v); System.out.println(concept+ "\t" +v+ "\t" +sim); } } } |