de.tudarmstadt.ukp.dkpro.core.api.segmentation.type.Token.getText()方法的使用及代码示例

x33g5p2x  于2022-01-29 转载在 其他  
字(7.9k)|赞(0)|评价(0)|浏览(117)

本文整理了Java中de.tudarmstadt.ukp.dkpro.core.api.segmentation.type.Token.getText()方法的一些代码示例,展示了Token.getText()的具体用法。这些代码示例主要来源于GitHub/Stack Overflow/Maven等平台,是从一些精选项目中提取出来的代码,具有较强的参考意义,能在一定程度上帮助到你。Token.getText()方法的具体详情如下:
包路径:de.tudarmstadt.ukp.dkpro.core.api.segmentation.type.Token
类名称:Token
方法名:getText

Token.getText介绍

暂无

代码示例

代码示例来源:origin: de.tudarmstadt.ukp.dkpro.core/de.tudarmstadt.ukp.dkpro.core.stanfordnlp-gpl

/**
 * Appends every token of every sentence in the CAS to the temporary training file, one
 * {@code text<TAB>posValue} line per token followed by an empty line after each sentence.
 * <p>
 * The temporary file and its UTF-8 writer are created lazily on the first call.
 *
 * @param aJCas
 *            the CAS whose sentences and tokens are written out.
 * @throws AnalysisEngineProcessException
 *             if the temporary file cannot be created, or if a token carries no POS
 *             annotation.
 */
@Override
public void process(JCas aJCas)
  throws AnalysisEngineProcessException
{
  if (tempData == null) {
    try {
      tempData = File.createTempFile("dkpro-stanford-pos-trainer", ".tsv");
      out = new PrintWriter(new OutputStreamWriter(new FileOutputStream(tempData),
          StandardCharsets.UTF_8));
    }
    catch (IOException e) {
      throw new AnalysisEngineProcessException(e);
    }
  }
  
  Map<Sentence, Collection<Token>> index = indexCovered(aJCas, Sentence.class, Token.class);
  for (Sentence sentence : select(aJCas, Sentence.class)) {
    for (Token token : index.get(sentence)) {
      // A token without POS cannot be used for training; report which token is affected
      // instead of failing with a bare NullPointerException.
      if (token.getPos() == null) {
        throw new AnalysisEngineProcessException(
            new IllegalStateException("Token [" + token.getText() + "] has no POS"));
      }
      out.printf("%s\t%s%n", token.getText(), token.getPos().getPosValue());
    }
    // Empty line separates sentences in the output.
    out.println();
  }
}

代码示例来源:origin: de.tudarmstadt.ukp.dkpro.core/de.tudarmstadt.ukp.dkpro.core.arktools-gpl

/**
 * Appends every token of every sentence in the CAS to the temporary training file, one
 * {@code text<TAB>posValue} line per token followed by an empty line after each sentence.
 * <p>
 * The temporary file and its UTF-8 writer are created lazily on the first call.
 *
 * @param jCas
 *            the CAS whose sentences and tokens are written out.
 * @throws AnalysisEngineProcessException
 *             if the temporary file cannot be created, or if a token carries no POS
 *             annotation.
 */
@Override
public void process(JCas jCas) throws AnalysisEngineProcessException {
  if (tempData == null) {
    try {
      tempData = File.createTempFile("dkpro-arktweet-pos-trainer", ".tsv");
      out = new PrintWriter(new OutputStreamWriter(new FileOutputStream(tempData),
          StandardCharsets.UTF_8));
    }
    catch (IOException e) {
      throw new AnalysisEngineProcessException(e);
    }
  }
  Map<Sentence, Collection<Token>> index = indexCovered(jCas, Sentence.class, Token.class);
  for (Sentence sentence : select(jCas, Sentence.class)) {
    for (Token token : index.get(sentence)) {
      // A token without POS cannot be used for training; report which token is affected
      // instead of failing with a bare NullPointerException.
      if (token.getPos() == null) {
        throw new AnalysisEngineProcessException(
            new IllegalStateException("Token [" + token.getText() + "] has no POS"));
      }
      out.printf("%s\t%s%n", token.getText(), token.getPos().getPosValue());
    }
    // Empty line separates sentences in the output.
    out.println();
  }
}

代码示例来源:origin: de.tudarmstadt.ukp.dkpro.core/de.tudarmstadt.ukp.dkpro.core.treetagger-asl

/**
 * Renders a token as {@code text-pos}. The POS value is translated through
 * {@code mapping}; when the mapping has no entry for it, the raw POS value is used.
 * The token is read while holding the monitor of the CAS it belongs to.
 *
 * @param aToken
 *            the token to render.
 * @return the token text, a hyphen, and the (possibly mapped) POS value.
 */
@Override
  public String getText(Token aToken)
  {
    synchronized (aToken.getCAS()) {
      final String rawPos = aToken.getPosValue();
      final String mappedPos = mapping.get(rawPos);
      final String effectivePos = (mappedPos != null) ? mappedPos : rawPos;
      return aToken.getText() + "-" + effectivePos;
    }
  }
}

代码示例来源:origin: de.tudarmstadt.ukp.dkpro.core/de.tudarmstadt.ukp.dkpro.core.opennlp-asl

/**
 * Builds a {@code POSSample} from the next pending sentence: the texts of the tokens it
 * covers together with their POS values.
 *
 * @param aJCas
 *            the current CAS (not read directly by this method).
 * @return the sample for the sentence.
 * @throws IllegalStateException
 *             if a covered token has no POS annotation.
 */
@Override
  public POSSample produce(JCas aJCas)
  {
    // Take the next sentence that is waiting to be processed
    final Sentence current = sentences.next();

    // Nothing left after this one: signal that the document is complete
    // (original note: "Block on next call to read")
    if (!sentences.hasNext()) {
      documentComplete();
    }

    final List<String> tokenTexts = new ArrayList<>();
    final List<String> posTags = new ArrayList<>();

    for (Token token : selectCovered(Token.class, current)) {
      final String text = token.getText();
      tokenTexts.add(text);
      if (token.getPos() == null) {
        throw new IllegalStateException("Token [" + text + "] has no POS");
      }
      posTags.add(token.getPos().getPosValue());
    }

    return new POSSample(tokenTexts, posTags);
  }
}

代码示例来源:origin: de.tudarmstadt.ukp.dkpro.core/de.tudarmstadt.ukp.dkpro.core.opennlp-asl

/**
 * Builds a {@code ChunkSample} from the next pending sentence: token texts, POS values
 * and the chunk labels produced by {@code chunkEncoder} for each covered token.
 *
 * @param aJCas
 *            the current CAS (not read directly by this method).
 * @return the sample for the sentence.
 * @throws IllegalStateException
 *             if a covered token has no POS annotation.
 */
@Override
  public ChunkSample produce(JCas aJCas)
  {
    // Take the next sentence that is waiting to be processed
    final Sentence current = sentences.next();

    // Nothing left after this one: signal that the document is complete
    // (original note: "Block on next call to read")
    if (!sentences.hasNext()) {
      documentComplete();
    }

    final List<String> tokenTexts = new ArrayList<>();
    final List<String> posTags = new ArrayList<>();
    final List<String> chunkLabels = new ArrayList<>();

    for (Token token : selectCovered(Token.class, current)) {
      final String text = token.getText();
      tokenTexts.add(text);
      if (token.getPos() == null) {
        throw new IllegalStateException("Token [" + text + "] has no POS");
      }
      posTags.add(token.getPos().getPosValue());
      chunkLabels.add(chunkEncoder.encode(token));
    }

    return new ChunkSample(tokenTexts, posTags, chunkLabels);
  }
}

代码示例来源:origin: de.tudarmstadt.ukp.dkpro.core/de.tudarmstadt.ukp.dkpro.core.opennlp-asl

words.add(t.getText());
  throw new IllegalStateException("Token [" + t.getText() + "] has no POS");
  throw new IllegalStateException("Token [" + t.getText() + "] has no lemma");

代码示例来源:origin: de.tudarmstadt.ukp.dkpro.core/de.tudarmstadt.ukp.dkpro.core.io.conll-asl

String form = row.token.getCoveredText();
if (!writeCovered) {
  form = row.token.getText();

代码示例来源:origin: de.tudarmstadt.ukp.dkpro.core/de.tudarmstadt.ukp.dkpro.core.dictionaryannotator-asl

sentenceToEnd[j] = tokensToSentenceEnd.get(j).getText();

代码示例来源:origin: de.tudarmstadt.ukp.dkpro.core/de.tudarmstadt.ukp.dkpro.core.arktools-gpl

/**
   * Tags the given tokens with the supplied tweet tagger model.
   * <p>
   * Each token text is normalized with {@code Twokenize.normalizeTextForTagger} before
   * being handed to the model; the resulting labels are paired with the original tokens
   * by position.
   *
   * @param annotatedTokens
   *            the tokens to tag, in sentence order.
   * @param tweetTagModel
   *            the tagger providing the feature extractor and the decoding model.
   * @return one {@code TaggedToken} per input token, in the same order.
   */
private List<TaggedToken> tagTweetTokens(List<Token> annotatedTokens,
      TweetTagger tweetTagModel)
  {
    // ArrayList instead of LinkedList: the list is handed to the tagger's sentence and
    // later consumed by position, where a linked list would make each lookup linear.
    List<String> tokens = new ArrayList<String>(annotatedTokens.size());
    for (Token a : annotatedTokens) {
      tokens.add(Twokenize.normalizeTextForTagger(a.getText()));
    }

    Sentence sentence = new Sentence();
    sentence.tokens = tokens;
    ModelSentence ms = new ModelSentence(sentence.T());
    tweetTagModel.featureExtractor.computeFeatures(sentence, ms);
    tweetTagModel.model.greedyDecode(ms, false);

    List<TaggedToken> taggedTokens = new ArrayList<TaggedToken>(tokens.size());

    // Labels are aligned with the input tokens by index.
    for (int t = 0; t < sentence.T(); t++) {
      TaggedToken tt = new TaggedToken();
      tt.token = annotatedTokens.get(t);
      tt.tag = tweetTagModel.model.labelVocab.name(ms.labels[t]);
      taggedTokens.add(tt);
    }
    return taggedTokens;
  }
}

代码示例来源:origin: de.tudarmstadt.ukp.dkpro.core/de.tudarmstadt.ukp.dkpro.core.io.conll-asl

String form = row.token.getCoveredText();
if (!writeCovered) {
  form = row.token.getText();

代码示例来源:origin: de.tudarmstadt.ukp.dkpro.core/de.tudarmstadt.ukp.dkpro.core.tokit-asl

if (token.getPos().getPosValue().matches("PTKVZ.*")) {
  String particle = token.getText();
  String verblemma = "";

代码示例来源:origin: de.tudarmstadt.ukp.dkpro.core/de.tudarmstadt.ukp.dkpro.core.matetools-gpl

Token token = tokens.get(i);
if (lemmas[i] == null) {
  lemmas[i] = token.getText();

代码示例来源:origin: de.tudarmstadt.ukp.dkpro.core/de.tudarmstadt.ukp.dkpro.core.opennlp-asl

int i = 0;
for (Token t : tokens) {
  tokenTexts[i] = t.getText();
  if (t.getPos() == null || t.getPos().getPosValue() == null) {
    throw new IllegalStateException("Every token must have a POS tag.");

代码示例来源:origin: de.tudarmstadt.ukp.dkpro.core/de.tudarmstadt.ukp.dkpro.core.opennlp-asl

toks[i] = t.getText();
tags[i] = t.getPosValue();
i++;

代码示例来源:origin: de.tudarmstadt.ukp.dkpro.core/de.tudarmstadt.ukp.dkpro.core.clearnlp-asl

DEPNode node = new DEPNode(i + 1, tokens.get(i).getText());
node.pos = t.getPos().getPosValue();
tree.add(node);
String lemmaString = node.lemma;
if (lemmaString == null) {
  lemmaString = t.getText();

代码示例来源:origin: dkpro/dkpro-core

/**
 * Splits every token of the CAS with {@code splitter}, picks the highest-ranked split via
 * {@code ranker}, and for tokens recognised as compounds adds a {@code Compound}
 * annotation spanning the token together with its indexed splits.
 *
 * @param aJCas
 *            the CAS whose tokens are examined.
 * @throws AnalysisEngineProcessException
 *             declared by the overridden method; not thrown directly here.
 */
@Override
public void process(final JCas aJCas)
  throws AnalysisEngineProcessException
{
  for (Token token : select(aJCas, Token.class)) {
    final DecompoundedWord best = ranker.highestRank(splitter.split(token.getText()));
    if (best.isCompound()) {
      final int begin = token.getBegin();
      final int end = token.getEnd();
      final Compound compound = new Compound(aJCas, begin, end);
      indexSplits(aJCas, best.getSplits(), begin, end, null, compound);
      compound.addToIndexes();
    }
  }
}

代码示例来源:origin: de.tudarmstadt.ukp.dkpro.core/de.tudarmstadt.ukp.dkpro.core.stanfordnlp-gpl

words.add(new TaggedWord(t.getText()));

代码示例来源:origin: de.tudarmstadt.ukp.dkpro.core/de.tudarmstadt.ukp.dkpro.core.stanfordnlp-gpl

/**
 * Converts a token into a {@code CoreLabel}.
 * <p>
 * The covered text becomes the original text, the token text becomes the word, and the
 * token offsets become begin/end positions. The lemma is taken from the token's lemma
 * annotation when present and falls back to the token text otherwise. The tag is set only
 * when the token has a POS annotation.
 *
 * @param aToken
 *            the token to convert.
 * @return the populated label.
 */
public static CoreLabel tokenToWord(Token aToken)
{
  final CoreLabel label = new CoreLabel();

  label.setOriginalText(aToken.getCoveredText());
  label.setWord(aToken.getText());
  label.setBeginPosition(aToken.getBegin());
  label.setEndPosition(aToken.getEnd());

  // No lemma annotation: use the token text as lemma
  final boolean hasLemma = aToken.getLemma() != null;
  label.setLemma(hasLemma ? aToken.getLemma().getValue() : aToken.getText());

  final boolean hasPos = aToken.getPos() != null;
  if (hasPos) {
    label.setTag(aToken.getPos().getPosValue());
  }

  return label;
}

代码示例来源:origin: de.tudarmstadt.ukp.dkpro.core/de.tudarmstadt.ukp.dkpro.core.tokit-asl

/**
   * Creates tokens for one sentence by walking the word boundaries reported by a
   * locale-specific {@link BreakIterator}.
   * <p>
   * When {@code splitAtApostrophe} is set and a created token contains an apostrophe at
   * any position other than its first character, the part starting at the apostrophe
   * becomes a separate token and the original token is shortened to end there.
   *
   * @param aJCas
   *            the CAS in which tokens are created.
   * @param text
   *            the sentence text to tokenize.
   * @param zoneBegin
   *            offset added to the boundaries found in {@code text} to obtain the offsets
   *            passed to {@code createToken}.
   */
  private void processSentence(JCas aJCas, String text, int zoneBegin)
  {
    final BreakIterator boundaries = BreakIterator.getWordInstance(getLocale(aJCas));
    boundaries.setText(text);

    int tokenBegin = boundaries.first() + zoneBegin;
    for (int boundary = boundaries.next(); boundary != BreakIterator.DONE;
        boundary = boundaries.next()) {
      final int tokenEnd = boundary + zoneBegin;

      // createToken may yield null; such spans are simply skipped
      final Token token = createToken(aJCas, tokenBegin, tokenEnd);
      if (token != null && splitAtApostrophe) {
        final int apostrophe = token.getText().indexOf("'");
        if (apostrophe > 0) {
          final int splitAt = token.getBegin() + apostrophe;
          // Create the trailing part first, while the token still has its full end
          createToken(aJCas, splitAt, token.getEnd());
          token.setEnd(splitAt);
        }
      }

      tokenBegin = tokenEnd;
    }
  }
}

代码示例来源:origin: de.tudarmstadt.ukp.dkpro.core/de.tudarmstadt.ukp.dkpro.core.clearnlp-asl

DEPNode node = new DEPNode(i + 1, tokens.get(i).getText());
node.pos = t.getPos().getPosValue();
if (t.getLemma() != null) {

相关文章