/**
 * {@link ResultSet} implementation that ranks the documents of a {@link DocStream} with a
 * {@link TopDocCollector} and serves results from the collected {@link TopDocs}.
 *
 * <p>Only the best {@code topcount} documents are collected up front; asking for an index at or
 * beyond that limit re-runs the collection over the whole stream with a larger limit.
 */
public class ResultSetImpl_TopDocs implements ResultSet {

  /** When {@code true}, {@link #getScore(int)} divides each score by the score at rank 0. */
  protected boolean normalize = true;

  /** Keyword used to highlight snippets; {@code null} means snippets are returned unhighlighted. */
  protected String keyword = null;

  protected SchemaFactory schemaFactory = SchemaFactoryImpl.getInstance();

  /** Number of documents the collector is asked to keep. */
  protected int topcount;

  /** Source of (document, score) pairs that is ranked by {@link #generateTopDocs()}. */
  protected DocStream resultStream;

  /** Index used to load the stored fields of a result document. */
  protected IndexReader indexReader = null;

  /** Ranking produced by the most recent {@link #generateTopDocs()} run. */
  protected TopDocs topDocs;

  private TopDocCollector collector;

  /**
   * Creates a result set that initially collects the best 50 documents and normalizes scores.
   *
   * @param resultStream stream of matching documents and their scores
   * @param indexReader reader used to load document fields
   * @throws Exception if the initial collection fails
   */
  protected ResultSetImpl_TopDocs(DocStream resultStream, IndexReader indexReader)
      throws Exception {
    this(resultStream, indexReader, 50, true);
  }

  /**
   * Creates a result set and immediately collects the best {@code topCount} documents.
   *
   * @param resultStream stream of matching documents and their scores
   * @param indexReader reader used to load document fields
   * @param topCount number of top documents to collect initially
   * @param normalize whether {@link #getScore(int)} reports scores relative to the rank-0 score
   * @throws Exception if the initial collection fails
   */
  protected ResultSetImpl_TopDocs(
      DocStream resultStream, IndexReader indexReader, int topCount, boolean normalize)
      throws Exception {
    this.normalize = normalize;
    this.resultStream = resultStream;
    this.indexReader = indexReader;
    topcount = topCount;
    generateTopDocs();
  }

  /**
   * Re-initializes the stream, feeds every document and score to a fresh collector sized
   * {@code topcount}, and stores the resulting ranking in {@link #topDocs}.
   */
  private void generateTopDocs() throws Exception {
    collector = new TopDocCollector(topcount);
    resultStream.init();
    for (int i = 0; i < resultStream.getLen(); i++) {
      collector.collect(resultStream.doc(), (float) (resultStream.score()));
      resultStream.next();
    }
    topDocs = collector.topDocs();
  }

  /**
   * Returns the document id at the given rank, enlarging the collected ranking if needed.
   *
   * @param index zero-based rank
   * @return document id stored at that rank
   * @throws Exception if re-collecting the ranking fails
   */
  public int getDocID(int index) throws Exception {
    if (index >= topcount) {
      // The new limit must be strictly greater than index. Plain "index * 2" is not when index
      // is 0 and overflows for very large indexes, so compute in long and clamp.
      long grown = Math.max((long) index + 1, (long) index * 2);
      topcount = (int) Math.min((long) Integer.MAX_VALUE, grown);
      generateTopDocs();
    }
    return topDocs.scoreDocs[index].doc;
  }

  /** Returns the length reported by the underlying stream. */
  public int getEstimatedNumberOfCompleteResults() {
    return resultStream.getLen();
  }

  /** Returns the length reported by the underlying stream. */
  public int getLength() {
    return resultStream.getLen();
  }

  /**
   * Loads the ID, URI, LABEL, SUMMARY and TEXT fields of a document and wraps them in a
   * {@link SchemaObjectInfo}.
   *
   * @param indexReader reader to load the field values from
   * @param docID document whose fields are read
   * @return info object built from the five field values
   * @throws IOException if the reader reports one while loading the fields
   */
  protected SchemaObjectInfo getInfo(IndexReader indexReader, int docID) throws IOException {
    FieldType[] fields =
        new FieldType[] {
          FieldType.ID, FieldType.URI, FieldType.LABEL, FieldType.SUMMARY, FieldType.TEXT
        };
    String[] values = indexReader.getFieldValues(docID, fields);
    return schemaFactory.createSchemaObjectInfo(
        Long.valueOf(values[0]), values[1], values[2], values[3], values[4]);
  }

  /**
   * Returns the schema object stored for the document at the given rank.
   *
   * @param index zero-based rank
   * @throws Exception if the rank cannot be resolved or the fields cannot be read
   */
  public SchemaObjectInfo getResult(int index) throws Exception {
    int id = getDocID(index);
    return getInfo(indexReader, id);
  }

  /**
   * Returns the score at the given rank, divided by the rank-0 score when normalization is on.
   *
   * @param index zero-based rank
   * @return raw or normalized score
   * @throws Exception if re-collecting the ranking fails
   */
  public double getScore(int index) throws Exception {
    // Called for its side effect only: it enlarges topDocs when index is past the current limit.
    getDocID(index);
    float score = topDocs.scoreDocs[index].score;
    if (!normalize) {
      return score;
    }
    float best = topDocs.scoreDocs[0].score;
    // A zero rank-0 score would turn the division into NaN/Infinity; report the raw score then.
    return best == 0f ? score : score / best;
  }

  /**
   * Returns a display snippet for the result at the given rank.
   *
   * <p>Leading copies of the lower-cased label are removed from the text description. If a
   * snippet keyword is set, the best highlighted fragment for that keyword is returned; when
   * highlighting yields nothing or fails, the stripped text is returned instead.
   *
   * @param index zero-based rank
   * @return highlighted fragment, or the stripped text description
   * @throws Exception if the result itself cannot be loaded
   */
  public String getSnippet(int index) throws Exception {
    SchemaObjectInfo info = getResult(index);
    String text = info.getTextDescription();
    String label = info.getLabel().toLowerCase();
    // Strip redundant leading copies of the label.
    // NOTE(review): the label is lower-cased but the text is not, so only a lower-case
    // occurrence at the start of the text is removed - confirm whether a case-insensitive
    // match was intended.
    if (!label.equals("")) {
      while (text.startsWith(label)) {
        text = text.substring(label.length()).trim();
      }
    }

    if (keyword == null) {
      return text;
    }

    try {
      // The analyzer and parser are only needed for highlighting, so build them lazily.
      String field = FieldType.TEXT.toString();
      StandardAnalyzer analyzer = new StandardAnalyzer();
      QueryParser qp = new QueryParser(field, analyzer);
      Highlighter hl = new Highlighter(new QueryScorer(qp.parse(keyword)));
      // The first argument of tokenStream is a field name, not the content to analyze.
      TokenStream ts = analyzer.tokenStream(field, new StringReader(text));
      String snippet = hl.getBestFragment(ts, text);
      if (snippet != null) {
        return snippet;
      }
    } catch (Exception ignored) {
      // Highlighting is best-effort: any failure falls back to the plain text below.
    }
    return text;
  }

  /**
   * Sets the keyword used by {@link #getSnippet(int)} for highlighting.
   *
   * @param keyword query text to highlight, or {@code null} to disable highlighting
   * @return this result set
   */
  public ResultSet setSnippetKeyword(String keyword) {
    this.keyword = keyword;
    return this;
  }

  /** Returns the stream this result set was built from. */
  public DocStream getResultStream() throws IOException {
    return resultStream;
  }
}
// Example #2
// 0
/**
 * Translates XML-encoded faceted-search requests into {@link XFacetedQuery} objects, runs them
 * against an {@link XFacetedSearchable}, and renders the results back to an XML string.
 *
 * <p>Result sets are cached per caller id so that follow-up requests (any action type other than
 * {@code "all"}) can page through an earlier search without re-running it.
 *
 * <p>NOTE(review): {@code parser} and {@code resultCache} are shared instance state, the cache is
 * never evicted, and the parser runs with its default feature set. If requests arrive
 * concurrently or from untrusted clients, confirm that access is serialized and consider
 * disabling DOCTYPE declarations on the parser.
 */
public class ForServlet {
  DOMParser parser = new DOMParser();

  XFacetedSearchable searcher = null;

  SchemaFactory schemaFactory = SchemaFactoryImpl.getInstance();

  SearchFactory searchFactory = SearchFactoryImpl.getInstance();

  /** Last result set per caller id. */
  Hashtable<String, XFacetedResultSet> resultCache = new Hashtable<String, XFacetedResultSet>();

  /** Returns the value of the named attribute, or {@code null} when it is absent or empty. */
  private static String nonEmptyAttribute(NamedNodeMap attributes, String name) {
    Node attribute = attributes.getNamedItem(name);
    if (attribute == null) {
      return null;
    }
    String value = attribute.getNodeValue();
    return (value == null || value.length() == 0) ? null : value;
  }

  /** Parses the named attribute as a decimal {@code int}. */
  private static int intAttribute(NamedNodeMap attributes, String name) {
    return Integer.parseInt(attributes.getNamedItem(name).getNodeValue());
  }

  /** Reads the {@code start} attribute, clamped to zero so it can never index below a list. */
  private static int pageStart(NamedNodeMap action) {
    return Math.max(0, intAttribute(action, "start"));
  }

  /**
   * Computes the exclusive end index of the requested page: {@code start + count}, capped at
   * {@code total}. The sum is done in {@code long} so a huge {@code count} cannot overflow.
   */
  private static int pageEnd(NamedNodeMap action, int start, int total) {
    int count = intAttribute(action, "count");
    return (int) Math.min((long) start + count, (long) total);
  }

  /**
   * URL-decodes {@code raw} as UTF-8, returning {@code raw} unchanged when it is {@code null} or
   * cannot be decoded (for example because it contains a malformed percent escape).
   */
  private static String urlDecodeOrRaw(String raw) {
    if (raw == null) {
      return null;
    }
    try {
      return java.net.URLDecoder.decode(raw, "UTF-8");
    } catch (java.io.UnsupportedEncodingException e) {
      return raw;
    } catch (IllegalArgumentException e) {
      return raw;
    }
  }

  /**
   * Builds the AND-compound category described by a {@code queryNode} element.
   *
   * <p>A non-empty {@code instanceConstraint} takes precedence: the category then contains only
   * that instance. Otherwise non-empty {@code conceptConstraint} and {@code keyword} attributes
   * are each added as a component.
   *
   * @param node element carrying the constraint attributes
   * @return the compound category for this node
   */
  private GeneralCategory createGeneralCategory(Node node)
      throws NoSuchAlgorithmException, DOMException {
    NamedNodeMap attributes = node.getAttributes();
    CompoundCategory category = schemaFactory.createCompoundCategory(CompoundCategory.TYPE_AND);

    String instance = nonEmptyAttribute(attributes, "instanceConstraint");
    if (instance != null) {
      category.addComponentCategory(
          schemaFactory
              .createEnumerationCategory()
              .addInstanceElement(schemaFactory.createInstance(instance)));
      return category;
    }

    String concept = nonEmptyAttribute(attributes, "conceptConstraint");
    if (concept != null) {
      category.addComponentCategory(schemaFactory.createCategory(concept));
    }

    String keyword = nonEmptyAttribute(attributes, "keyword");
    if (keyword != null) {
      category.addComponentCategory(schemaFactory.createKeywordCategory(keyword));
    }
    return category;
  }

  /**
   * Recursively adds every child element of a query node to the graph, linking it to its parent
   * with the relation named by the child's {@code relation} attribute.
   *
   * <p>An {@code inverse} attribute of {@code "0"} makes the edge run parent to child; any other
   * value makes it run child to parent.
   *
   * @param graph graph being populated
   * @param fromNodeIndex graph index of the parent node
   * @param nodes child nodes of the parent element; may be {@code null}
   */
  private void addRelations(CatRelGraph graph, int fromNodeIndex, NodeList nodes)
      throws NoSuchAlgorithmException, DOMException {
    if (nodes == null) {
      return;
    }
    for (int i = 0; i < nodes.getLength(); i++) {
      Node node = nodes.item(i);
      // Only elements carry attributes; text, comment and CDATA children must be skipped or
      // getAttributes() would return null below.
      if (node.getNodeType() != Node.ELEMENT_NODE) {
        continue;
      }
      graph.add(createGeneralCategory(node));
      int toNodeIndex = graph.numOfNodes() - 1;

      NamedNodeMap attributes = node.getAttributes();
      boolean forward = attributes.getNamedItem("inverse").getNodeValue().equals("0");
      int source = forward ? fromNodeIndex : toNodeIndex;
      int destination = forward ? toNodeIndex : fromNodeIndex;
      graph.add(
          schemaFactory.createRelation(attributes.getNamedItem("relation").getNodeValue()),
          source,
          destination);

      addRelations(graph, toNodeIndex, node.getChildNodes());
    }
  }

  /**
   * Builds a query from the first {@code targetNode} and first {@code queryNode} elements of the
   * request document.
   *
   * @param doc parsed request
   * @return the query, or {@code null} if the document could not be translated (the exception
   *     is printed)
   */
  private XFacetedQuery XML2Query(Document doc) {
    try {
      Node targetNode = doc.getElementsByTagName("targetNode").item(0);
      int target = intAttribute(targetNode.getAttributes(), "index");

      CatRelGraph graph = schemaFactory.createCatRelGraph();
      Node rootQueryNode = doc.getElementsByTagName("queryNode").item(0);
      graph.add(createGeneralCategory(rootQueryNode));
      addRelations(graph, 0, rootQueryNode.getChildNodes());
      System.out.println(graph);
      System.out.println("target=" + target);

      XFacetedQuery query = searchFactory.createXFacetedQuery();
      query.setSearchTarget(target);
      query.setQueryConstraint(graph);
      query.setResultSpec(searchFactory.createXFacetedResultSpec());
      return query;
    } catch (Exception ex) {
      ex.printStackTrace();
    }
    return null;
  }

  /** Removes every digit and the first {@code "Category:"} occurrence from a label. */
  private String nomalizeLabel(String label) {
    return label.replaceAll("[0-9]+", "").replaceFirst("Category:", "");
  }

  /** Builds the {@code instanceList} element holding the requested page of result instances. */
  private Element buildInstanceList(
      Document doc, XFacetedResultSet resultSet, NamedNodeMap action, long queryTime)
      throws Exception {
    Element list = doc.createElement("instanceList");
    int total = resultSet.getLength();
    list.setAttribute("count", Integer.toString(total));
    list.setAttribute("time", Long.toString(queryTime));

    int start = pageStart(action);
    int end = pageEnd(action, start, total);
    for (int i = start; i < end; i++) {
      SchemaObjectInfo result = resultSet.getResult(i);
      Element instance = doc.createElement("instance");
      instance.setAttribute("name", urlDecodeOrRaw(result.getLabel()));
      instance.setAttribute("uri", result.getURI());
      // The snippet is computed once; the undecoded text is the fallback.
      instance.setAttribute("snippet", urlDecodeOrRaw(resultSet.getSnippet(i)));
      list.appendChild(instance);
    }
    return list;
  }

  /** Builds the {@code conceptList} element holding the requested page of category facets. */
  private Element buildConceptList(
      Document doc, XFacetedResultSet resultSet, NamedNodeMap action) throws Exception {
    Element list = doc.createElement("conceptList");
    int start = pageStart(action);
    Facet[] facets = resultSet.getCategoryFacets();
    int end = pageEnd(action, start, facets.length);
    list.setAttribute("count", Integer.toString(facets.length));
    for (int i = start; i < end; i++) {
      Facet facet = facets[i];
      Element concept = doc.createElement("concept");
      concept.setAttribute("name", nomalizeLabel(facet.getInfo().getLabel()));
      concept.setAttribute("uri", facet.getInfo().getURI());
      concept.setAttribute("count", String.valueOf(facet.getCount()));
      list.appendChild(concept);
    }
    return list;
  }

  /** Builds the {@code relationList} element holding the requested page of relation facets. */
  private Element buildRelationList(
      Document doc, XFacetedResultSet resultSet, NamedNodeMap action) throws Exception {
    Element list = doc.createElement("relationList");
    int start = pageStart(action);
    Facet[] facets = resultSet.getRelationFacets();
    int end = pageEnd(action, start, facets.length);
    list.setAttribute("count", Integer.toString(facets.length));
    for (int i = start; i < end; i++) {
      Facet facet = facets[i];
      Element relation = doc.createElement("relation");
      relation.setAttribute("name", facet.getInfo().getLabel());
      relation.setAttribute("uri", facet.getInfo().getURI());
      relation.setAttribute("count", String.valueOf(facet.getCount()));
      relation.setAttribute("inverse", facet.isInverseRelation() ? "1" : "0");
      list.appendChild(relation);
    }
    return list;
  }

  /**
   * Serializes the parts of a result set selected by the request's {@code action} element.
   *
   * <p>The action {@code type} chooses which lists are emitted ({@code "instanceList"},
   * {@code "conceptList"}, {@code "relationList"}, or {@code "all"} for all three); its
   * {@code start} and {@code count} attributes select the page of each emitted list.
   *
   * @param resultSet results to render
   * @param doc2 the parsed request document
   * @param queryTime elapsed search time in milliseconds, reported on the instance list
   * @return the XML text, or {@code null} if rendering failed (the exception is printed)
   */
  private String result2XML(XFacetedResultSet resultSet, Document doc2, long queryTime) {
    try {
      NamedNodeMap action = doc2.getElementsByTagName("action").item(0).getAttributes();
      String type = action.getNamedItem("type").getNodeValue();
      boolean everything = type.equals("all");

      DocumentBuilderFactory dbf = DocumentBuilderFactory.newInstance();
      DocumentBuilder db = dbf.newDocumentBuilder();
      Document doc = db.newDocument();
      Element root = doc.createElement("result");

      if (everything || type.equals("instanceList")) {
        root.appendChild(buildInstanceList(doc, resultSet, action, queryTime));
      }
      if (everything || type.equals("conceptList")) {
        root.appendChild(buildConceptList(doc, resultSet, action));
      }
      if (everything || type.equals("relationList")) {
        root.appendChild(buildRelationList(doc, resultSet, action));
      }

      doc.appendChild(root);
      OutputFormat format = new OutputFormat(doc);
      StringWriter stringOut = new StringWriter();
      XMLSerializer serial = new XMLSerializer(stringOut, format);
      serial.asDOMSerializer();
      serial.serialize(doc.getDocumentElement());
      return stringOut.toString();
    } catch (Exception ex) {
      ex.printStackTrace();
    }

    return null;
  }

  /**
   * Runs the request given as XML text.
   *
   * @param queryXML request document
   * @param uid caller id used as the result-cache key
   * @return result XML, or {@code null} on failure
   */
  public String query(String queryXML, String uid) {
    return query(new InputSource(new StringReader(queryXML)), uid);
  }

  /**
   * Runs the request stored in a file. The file reader is always closed before returning.
   *
   * @param queryXMLFile file containing the request document
   * @param uid caller id used as the result-cache key
   * @return result XML, or {@code null} on failure (the exception is printed)
   */
  public String query(File queryXMLFile, String uid) {
    FileReader reader = null;
    try {
      reader = new FileReader(queryXMLFile);
      return query(new InputSource(reader), uid);
    } catch (Exception e) {
      e.printStackTrace();
    } finally {
      if (reader != null) {
        try {
          reader.close();
        } catch (java.io.IOException ignored) {
          // Nothing useful can be done if closing a read-only stream fails.
        }
      }
    }
    return null;
  }

  /**
   * Parses the request, obtains a result set and renders it.
   *
   * <p>An action type of {@code "all"} always runs a new search. Any other type reuses the
   * result set cached for {@code uid} and only searches again when nothing is cached. Every
   * result set obtained from a search is stored in the cache under {@code uid}.
   *
   * @param input request document source
   * @param uid caller id used as the result-cache key
   * @return result XML, or {@code null} on failure (the exception is printed)
   */
  public String query(InputSource input, String uid) {
    try {
      parser.parse(input);
      Document doc = parser.getDocument();

      long searchStarted = System.currentTimeMillis();
      NamedNodeMap action = doc.getElementsByTagName("action").item(0).getAttributes();
      boolean newQuery = action.getNamedItem("type").getNodeValue().equals("all");

      XFacetedResultSet resultSet = newQuery ? null : resultCache.get(uid);
      if (resultSet == null) {
        XFacetedQuery query = XML2Query(doc);
        if (query == null) {
          // XML2Query already reported the problem; there is nothing to search for.
          return null;
        }
        searchStarted = System.currentTimeMillis();
        resultSet = searcher.search(query);
        if (resultSet != null) {
          // Cache after a miss as well, so later paging requests do not repeat the search.
          resultCache.put(uid, resultSet);
        }
      }

      long queryTime = System.currentTimeMillis() - searchStarted;
      return result2XML(resultSet, doc, queryTime);
    } catch (Exception ex) {
      ex.printStackTrace();
    }
    return null;
  }

  /**
   * Reads the configuration file and obtains the searcher used by the {@code query} methods.
   *
   * @param configFile path of the configuration file
   * @throws Exception if the configuration cannot be read or the search service is unavailable
   */
  public void init(String configFile) throws Exception {
    Properties config = Config.readConfigFile(configFile);
    XFacetedSearchService searchService = searchFactory.getXFacetedSearchService(config);
    searcher = searchService.getXFacetedSearchable();
  }

  /**
   * Command-line smoke test: initializes from the config file named by the first argument, runs
   * a fixed sample query and prints the request and the response.
   */
  public static void main(String[] args) {
    if (args.length < 1) {
      System.err.println("usage: ForServlet <configFile>");
      return;
    }
    try {
      ForServlet forServ = new ForServlet();
      String configFile = args[0];
      forServ.init(configFile);
      String queryXML =
          "<?xml version=\"1.0\" encoding=\"UTF-8\"?><query>"
              + "  <action type=\"all\" start=\"0\" count=\"10\"/>"
              + "  <graph>"
              + "    <queryNode insName=\"\" instanceConstraint=\"\" relName=\"\" relation=\"\" inverse=\"0\" conName=\"\" conceptConstraint=\"\" keyword=\"academy award\">"
              + "      <queryNode relation=\"&lt;http://dbpedia.org/property/starring>\" inverse=\"0\" relName=\"starring\" insName=\"\" conceptConstraint=\"\" instanceConstraint=\"\" keyword=\"star wars\"/>"
              + "      <queryNode relation=\"&lt;http://dbpedia.org/property/director>\" inverse=\"0\" relName=\"director\" insName=\"\" conceptConstraint=\"&lt;http://dbpedia.org/resource/Category:Jewish_American_film_directors>\" instanceConstraint=\"\" keyword=\"\" conName=\"TOP Category\"/>"
              + "    </queryNode>"
              + "  </graph>"
              + "  <targetNode index=\"2\"/>"
              + "</query>";
      String uid = "127.0.0.1";
      String resultXML = forServ.query(queryXML, uid);
      System.out.println("uid:" + uid);
      System.out.println("queryXML:" + queryXML);
      System.out.println("resultXML:" + resultXML);
    } catch (Exception e) {
      e.printStackTrace();
    }
  }
}