tools.conf 924 B

123456789101112131415161718192021222324252627282930313233343536
  1. [options]
  2. # Possible values for validate:
  3. # - all: perform full validation
  4. # - none: don't perform any validation
  5. Validation validate:none
  6. # Possible values for tokenizer:
  7. # - ptblike: emulate Penn Treebank tokenization
  8. # - mecab: perform Japanese tokenization using MeCab
  9. # - whitespace: split only on whitespace characters in the source text
  10. Tokens tokenizer:whitespace
  11. # Possible values for splitter:
  12. # - regex: regular expression-based sentence splitting
  13. # - newline: split only on newline characters in the source text
  14. Sentences splitter:newline
  15. # Possible values for logfile:
  16. # - <NONE>: no annotation logging
  17. # - NAME: log annotations to the file NAME (e.g. "/home/brat/annotation.log")
  18. Annotation-log logfile:<NONE>
  19. [search]
  20. Google <URL>:http://www.google.com/search?q=%s
  21. Wikipedia <URL>:http://en.wikipedia.org/wiki/Special:Search?search=%s
  22. [annotators]
  23. # none
  24. [disambiguators]
  25. # none
  26. [normalization]
  27. # none