Package edu.harvard.wcfia.yoshikoder.document

Examples of edu.harvard.wcfia.yoshikoder.document.TokenStructuredDocument


   
    YKDocument doc1 = YKDocumentFactory.createYKDocument(new File("/Users/will/Desktop/bundestagdebate/14235.txt"),
        "doc1", "UTF-8", Locale.GERMAN);
    YKDocument doc2 = YKDocumentFactory.createYKDocument(new File("/Users/will/Desktop/bundestagdebate/14235.txt"),
        "doc2", "UTF-8", Locale.GERMAN);
    TokenStructuredDocument tsdoc1 = new TokenStructuredDocument(doc1);
    TokenStructuredDocument tsdoc2 = new TokenStructuredDocument(doc2);
    String[][] conc1 = tsdoc1.getPatternConcordance(Pattern.compile("vier"), 5);
    String[][] conc2 = tsdoc2.getPatternConcordance(Pattern.compile("vier"), 5);

    for (int ii = 0; ii < conc1.length; ii++) {
      for (int jj = 0; jj < conc1[ii].length; jj++) {
       
        System.out.print("[" + conc1[ii][jj] + "]");
View Full Code Here


    if (rowIndex == -1)
      return;
   
    DocumentConcordanceTableModel dctm = (DocumentConcordanceTableModel)getModel();
    int[] span = dctm.getCharacterOffsetsForConcordanceRow(rowIndex);
    TokenStructuredDocument doc = dctm.getDocumentForConcordanceRow(rowIndex);
   
    System.err.println("Make character span [" + span[0] + ", " + span[1] + "] in document '" + doc.getTitle() + "' visible");
  }
View Full Code Here

    YKDocument doc1 = YKDocumentFactory.createYKDocument(new File("/Users/will/Documents/german-manifestos-econ/ORIG_ECON_CDU1990.txt"),
        "CDU91990", "ISO-8859-1", Locale.GERMAN);
    YKDocument doc2 = YKDocumentFactory.createYKDocument(new File("/Users/will/Documents/german-manifestos-econ/ORIG_ECON_CDU1994.txt"),
        "CDU91994", "ISO-8859-1", Locale.GERMAN);

    TokenStructuredDocument tsd1 = new TokenStructuredDocument(doc1);
    TokenStructuredDocument tsd2 = new TokenStructuredDocument(doc2);

    List<TokenStructuredDocument> lst = new ArrayList<TokenStructuredDocument>();
    lst.add(tsd1);
    lst.add(tsd2);
View Full Code Here

  }

  public static void main(String[] args) throws IOException {
    YKDocument d1 = YKDocumentFactory.createDummyDocument("dummy1", "1 2 3 4 5 6 7 8 9", "UTF-8");
    YKDocument d2 = YKDocumentFactory.createDummyDocument("dummy2", "5 6 7 8 9 10 11 12", "UTF-8");
    TokenStructuredDocument tsd1 = new TokenStructuredDocument(d1);
    TokenStructuredDocument tsd2 = new TokenStructuredDocument(d2);
    Pattern[] p5 = new Pattern[]{Pattern.compile("9")};
    Pattern[] p34 = new Pattern[]{Pattern.compile("2"), Pattern.compile("3"), Pattern.compile("4")};
    List<TokenStructuredDocument> dlist = new ArrayList<TokenStructuredDocument>();
    dlist.add(tsd1);
    dlist.add(tsd2);
View Full Code Here

TOP

Related Classes of edu.harvard.wcfia.yoshikoder.document.TokenStructuredDocument

Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and owned by ORACLE Inc. Contact coftware#gmail.com.