├── .gitignore ├── .travis.yml ├── LICENSE ├── MANIFEST.in ├── README.rst ├── corenlp_protobuf ├── CoreNLP_pb2.py └── __init__.py ├── doc └── CoreNLP.proto ├── setup.cfg ├── setup.py ├── tests ├── __init__.py ├── data │ └── test.dat └── test_read.py └── tox.ini /.gitignore: -------------------------------------------------------------------------------- 1 | # Byte-compiled / optimized / DLL files 2 | __pycache__/ 3 | *.py[cod] 4 | *$py.class 5 | 6 | # C extensions 7 | *.so 8 | 9 | # Distribution / packaging 10 | .Python 11 | env/ 12 | build/ 13 | develop-eggs/ 14 | dist/ 15 | downloads/ 16 | eggs/ 17 | .eggs/ 18 | lib/ 19 | lib64/ 20 | parts/ 21 | sdist/ 22 | var/ 23 | *.egg-info/ 24 | .installed.cfg 25 | *.egg 26 | 27 | # PyInstaller 28 | # Usually these files are written by a python script from a template 29 | # before PyInstaller builds the exe, so as to inject date/other infos into it. 30 | *.manifest 31 | *.spec 32 | 33 | # Installer logs 34 | pip-log.txt 35 | pip-delete-this-directory.txt 36 | 37 | # Unit test / coverage reports 38 | htmlcov/ 39 | .tox/ 40 | .coverage 41 | .coverage.* 42 | .cache 43 | nosetests.xml 44 | coverage.xml 45 | *,cover 46 | .hypothesis/ 47 | 48 | # Translations 49 | *.mo 50 | *.pot 51 | 52 | # Django stuff: 53 | *.log 54 | local_settings.py 55 | 56 | # Flask stuff: 57 | instance/ 58 | .webassets-cache 59 | 60 | # Scrapy stuff: 61 | .scrapy 62 | 63 | # Sphinx documentation 64 | docs/_build/ 65 | 66 | # PyBuilder 67 | target/ 68 | 69 | # IPython Notebook 70 | .ipynb_checkpoints 71 | 72 | # pyenv 73 | .python-version 74 | 75 | # celery beat schedule file 76 | celerybeat-schedule 77 | 78 | # dotenv 79 | .env 80 | 81 | # virtualenv 82 | venv/ 83 | ENV/ 84 | 85 | # Spyder project settings 86 | .spyderproject 87 | 88 | # Rope project settings 89 | .ropeproject 90 | -------------------------------------------------------------------------------- /.travis.yml: -------------------------------------------------------------------------------- 1 | language: python 2 | python: 3 | - 2.7 4 | - 3.5 5 | notifications: 6 | email: false 7 | before_install: 8 | - sudo apt-get update 9 | install: 10 | - pip install tox-travis 11 | # Run test 12 | script: 13 | - tox 14 | # only integrate the master branch 15 | branches: 16 | only: 17 | - master 18 | -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | MIT License 2 | 3 | Copyright (c) 2017 Stanford NLP 4 | 5 | Permission is hereby granted, free of charge, to any person obtaining a copy 6 | of this software and associated documentation files (the "Software"), to deal 7 | in the Software without restriction, including without limitation the rights 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 9 | copies of the Software, and to permit persons to whom the Software is 10 | furnished to do so, subject to the following conditions: 11 | 12 | The above copyright notice and this permission notice shall be included in all 13 | copies or substantial portions of the Software. 14 | 15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21 | SOFTWARE. 22 | -------------------------------------------------------------------------------- /MANIFEST.in: -------------------------------------------------------------------------------- 1 | # Include the license file 2 | include *.md 3 | include LICENSE 4 | 5 | # Include the data files 6 | recursive-include corenlp_protobuf *.py 7 | recursive-include doc *.proto 8 | -------------------------------------------------------------------------------- /README.rst: -------------------------------------------------------------------------------- 1 | Stanford CoreNLP Python Bindings 2 | ================================ 3 | 4 | .. image:: https://travis-ci.org/stanfordnlp/python-corenlp-protobuf.svg?branch=master 5 | :target: https://travis-ci.org/stanfordnlp/python-corenlp-protobuf 6 | 7 | This package contains python bindings for `Stanford 8 | CoreNLP `_'s protobuf 9 | specifications, as generated by `protoc`. These bindings can used to 10 | parse binary data produced by, e.g., the `Stanford CoreNLP 11 | server `_. 12 | 13 | ---- 14 | 15 | Usage: 16 | 17 | .. code-block:: python 18 | 19 | from corenlp_protobuf import Document, parseFromDelimitedString 20 | 21 | # document.dat contains a serialized Document. 22 | with open('document.dat', 'r') as f: 23 | buf = f.read() 24 | doc = Document() 25 | parseFromDelimitedString(doc, buf) 26 | 27 | # You can access the sentences from doc.sentence. 28 | sentence = doc.sentence[0] 29 | 30 | # You can access any property within a sentence. 31 | print(sentence.text) 32 | 33 | # Likewise for tokens 34 | token = sentence.token[0] 35 | print(token.lemma) 36 | 37 | See `test_read.py` for more examples. 38 | -------------------------------------------------------------------------------- /corenlp_protobuf/CoreNLP_pb2.py: -------------------------------------------------------------------------------- 1 | # Generated by the protocol buffer compiler. DO NOT EDIT! 2 | # source: CoreNLP.proto 3 | 4 | import sys 5 | _b=sys.version_info[0]<3 and (lambda x:x) or (lambda x:x.encode('latin1')) 6 | from google.protobuf.internal import enum_type_wrapper 7 | from google.protobuf import descriptor as _descriptor 8 | from google.protobuf import message as _message 9 | from google.protobuf import reflection as _reflection 10 | from google.protobuf import symbol_database as _symbol_database 11 | from google.protobuf import descriptor_pb2 12 | # @@protoc_insertion_point(imports) 13 | 14 | _sym_db = _symbol_database.Default() 15 | 16 | 17 | 18 | 19 | DESCRIPTOR = _descriptor.FileDescriptor( 20 | name='CoreNLP.proto', 21 | package='edu.stanford.nlp.pipeline', 22 | syntax='proto2', 23 | serialized_pb=_b('\n\rCoreNLP.proto\x12\x19\x65\x64u.stanford.nlp.pipeline\"\xe1\x05\n\x08\x44ocument\x12\x0c\n\x04text\x18\x01 \x02(\t\x12\x35\n\x08sentence\x18\x02 \x03(\x0b\x32#.edu.stanford.nlp.pipeline.Sentence\x12\x39\n\ncorefChain\x18\x03 \x03(\x0b\x32%.edu.stanford.nlp.pipeline.CorefChain\x12\r\n\x05\x64ocID\x18\x04 \x01(\t\x12\x0f\n\x07\x64ocDate\x18\x07 \x01(\t\x12\x10\n\x08\x63\x61lendar\x18\x08 \x01(\x04\x12;\n\x11sentencelessToken\x18\x05 \x03(\x0b\x32 .edu.stanford.nlp.pipeline.Token\x12\x33\n\tcharacter\x18\n \x03(\x0b\x32 .edu.stanford.nlp.pipeline.Token\x12/\n\x05quote\x18\x06 \x03(\x0b\x32 .edu.stanford.nlp.pipeline.Quote\x12\x37\n\x08mentions\x18\t \x03(\x0b\x32%.edu.stanford.nlp.pipeline.NERMention\x12#\n\x1bhasEntityMentionsAnnotation\x18\r \x01(\x08\x12\x0e\n\x06xmlDoc\x18\x0b \x01(\x08\x12\x34\n\x08sections\x18\x0c \x03(\x0b\x32\".edu.stanford.nlp.pipeline.Section\x12<\n\x10mentionsForCoref\x18\x0e \x03(\x0b\x32\".edu.stanford.nlp.pipeline.Mention\x12!\n\x19hasCorefMentionAnnotation\x18\x0f \x01(\x08\x12\x1a\n\x12hasCorefAnnotation\x18\x10 \x01(\x08\x12+\n#corefMentionToEntityMentionMappings\x18\x11 \x03(\r\x12+\n#entityMentionToCorefMentionMappings\x18\x12 \x03(\r*\x05\x08\x64\x10\x80\x02\"\x8e\x0f\n\x08Sentence\x12/\n\x05token\x18\x01 \x03(\x0b\x32 .edu.stanford.nlp.pipeline.Token\x12\x18\n\x10tokenOffsetBegin\x18\x02 \x02(\r\x12\x16\n\x0etokenOffsetEnd\x18\x03 \x02(\r\x12\x15\n\rsentenceIndex\x18\x04 \x01(\r\x12\x1c\n\x14\x63haracterOffsetBegin\x18\x05 \x01(\r\x12\x1a\n\x12\x63haracterOffsetEnd\x18\x06 \x01(\r\x12\x37\n\tparseTree\x18\x07 \x01(\x0b\x32$.edu.stanford.nlp.pipeline.ParseTree\x12@\n\x12\x62inarizedParseTree\x18\x1f \x01(\x0b\x32$.edu.stanford.nlp.pipeline.ParseTree\x12@\n\x12\x61nnotatedParseTree\x18 \x01(\x0b\x32$.edu.stanford.nlp.pipeline.ParseTree\x12\x11\n\tsentiment\x18! \x01(\t\x12=\n\x0fkBestParseTrees\x18\" \x03(\x0b\x32$.edu.stanford.nlp.pipeline.ParseTree\x12\x45\n\x11\x62\x61sicDependencies\x18\x08 \x01(\x0b\x32*.edu.stanford.nlp.pipeline.DependencyGraph\x12I\n\x15\x63ollapsedDependencies\x18\t \x01(\x0b\x32*.edu.stanford.nlp.pipeline.DependencyGraph\x12T\n collapsedCCProcessedDependencies\x18\n \x01(\x0b\x32*.edu.stanford.nlp.pipeline.DependencyGraph\x12K\n\x17\x61lternativeDependencies\x18\r \x01(\x0b\x32*.edu.stanford.nlp.pipeline.DependencyGraph\x12?\n\x0copenieTriple\x18\x0e \x03(\x0b\x32).edu.stanford.nlp.pipeline.RelationTriple\x12<\n\tkbpTriple\x18\x10 \x03(\x0b\x32).edu.stanford.nlp.pipeline.RelationTriple\x12\x45\n\x10\x65ntailedSentence\x18\x0f \x03(\x0b\x32+.edu.stanford.nlp.pipeline.SentenceFragment\x12\x43\n\x0e\x65ntailedClause\x18# \x03(\x0b\x32+.edu.stanford.nlp.pipeline.SentenceFragment\x12H\n\x14\x65nhancedDependencies\x18\x11 \x01(\x0b\x32*.edu.stanford.nlp.pipeline.DependencyGraph\x12P\n\x1c\x65nhancedPlusPlusDependencies\x18\x12 \x01(\x0b\x32*.edu.stanford.nlp.pipeline.DependencyGraph\x12\x33\n\tcharacter\x18\x13 \x03(\x0b\x32 .edu.stanford.nlp.pipeline.Token\x12\x11\n\tparagraph\x18\x0b \x01(\r\x12\x0c\n\x04text\x18\x0c \x01(\t\x12\x12\n\nlineNumber\x18\x14 \x01(\r\x12\x1e\n\x16hasRelationAnnotations\x18\x33 \x01(\x08\x12\x31\n\x06\x65ntity\x18\x34 \x03(\x0b\x32!.edu.stanford.nlp.pipeline.Entity\x12\x35\n\x08relation\x18\x35 \x03(\x0b\x32#.edu.stanford.nlp.pipeline.Relation\x12$\n\x1chasNumerizedTokensAnnotation\x18\x36 \x01(\x08\x12\x37\n\x08mentions\x18\x37 \x03(\x0b\x32%.edu.stanford.nlp.pipeline.NERMention\x12<\n\x10mentionsForCoref\x18\x38 \x03(\x0b\x32\".edu.stanford.nlp.pipeline.Mention\x12\"\n\x1ahasCorefMentionsAnnotation\x18\x39 \x01(\x08\x12\x12\n\nsentenceID\x18: \x01(\t\x12\x13\n\x0bsectionDate\x18; \x01(\t\x12\x14\n\x0csectionIndex\x18< \x01(\r\x12\x13\n\x0bsectionName\x18= \x01(\t\x12\x15\n\rsectionAuthor\x18> \x01(\t\x12\r\n\x05\x64ocID\x18? \x01(\t\x12\x15\n\rsectionQuoted\x18@ \x01(\x08\x12#\n\x1bhasEntityMentionsAnnotation\x18\x41 \x01(\x08\x12\x1f\n\x17hasKBPTriplesAnnotation\x18\x44 \x01(\x08\x12\"\n\x1ahasOpenieTriplesAnnotation\x18\x45 \x01(\x08\x12\x14\n\x0c\x63hapterIndex\x18\x42 \x01(\r\x12\x16\n\x0eparagraphIndex\x18\x43 \x01(\r*\x05\x08\x64\x10\x80\x02\"\xad\n\n\x05Token\x12\x0c\n\x04word\x18\x01 \x01(\t\x12\x0b\n\x03pos\x18\x02 \x01(\t\x12\r\n\x05value\x18\x03 \x01(\t\x12\x10\n\x08\x63\x61tegory\x18\x04 \x01(\t\x12\x0e\n\x06\x62\x65\x66ore\x18\x05 \x01(\t\x12\r\n\x05\x61\x66ter\x18\x06 \x01(\t\x12\x14\n\x0coriginalText\x18\x07 \x01(\t\x12\x0b\n\x03ner\x18\x08 \x01(\t\x12\x11\n\tcoarseNER\x18> \x01(\t\x12\x16\n\x0e\x66ineGrainedNER\x18? \x01(\t\x12\x15\n\rnormalizedNER\x18\t \x01(\t\x12\r\n\x05lemma\x18\n \x01(\t\x12\x11\n\tbeginChar\x18\x0b \x01(\r\x12\x0f\n\x07\x65ndChar\x18\x0c \x01(\r\x12\x11\n\tutterance\x18\r \x01(\r\x12\x0f\n\x07speaker\x18\x0e \x01(\t\x12\x12\n\nbeginIndex\x18\x0f \x01(\r\x12\x10\n\x08\x65ndIndex\x18\x10 \x01(\r\x12\x17\n\x0ftokenBeginIndex\x18\x11 \x01(\r\x12\x15\n\rtokenEndIndex\x18\x12 \x01(\r\x12\x34\n\ntimexValue\x18\x13 \x01(\x0b\x32 .edu.stanford.nlp.pipeline.Timex\x12\x15\n\rhasXmlContext\x18\x15 \x01(\x08\x12\x12\n\nxmlContext\x18\x16 \x03(\t\x12\x16\n\x0e\x63orefClusterID\x18\x17 \x01(\r\x12\x0e\n\x06\x61nswer\x18\x18 \x01(\t\x12\x15\n\rheadWordIndex\x18\x1a \x01(\r\x12\x35\n\x08operator\x18\x1b \x01(\x0b\x32#.edu.stanford.nlp.pipeline.Operator\x12\x35\n\x08polarity\x18\x1c \x01(\x0b\x32#.edu.stanford.nlp.pipeline.Polarity\x12\x14\n\x0cpolarity_dir\x18\' \x01(\t\x12-\n\x04span\x18\x1d \x01(\x0b\x32\x1f.edu.stanford.nlp.pipeline.Span\x12\x11\n\tsentiment\x18\x1e \x01(\t\x12\x16\n\x0equotationIndex\x18\x1f \x01(\x05\x12\x42\n\x0e\x63onllUFeatures\x18 \x01(\x0b\x32*.edu.stanford.nlp.pipeline.MapStringString\x12\x11\n\tcoarseTag\x18! \x01(\t\x12\x38\n\x0f\x63onllUTokenSpan\x18\" \x01(\x0b\x32\x1f.edu.stanford.nlp.pipeline.Span\x12\x12\n\nconllUMisc\x18# \x01(\t\x12G\n\x13\x63onllUSecondaryDeps\x18$ \x01(\x0b\x32*.edu.stanford.nlp.pipeline.MapStringString\x12\x17\n\x0fwikipediaEntity\x18% \x01(\t\x12\x11\n\tisNewline\x18& \x01(\x08\x12\x0e\n\x06gender\x18\x33 \x01(\t\x12\x10\n\x08trueCase\x18\x34 \x01(\t\x12\x14\n\x0ctrueCaseText\x18\x35 \x01(\t\x12\x13\n\x0b\x63hineseChar\x18\x36 \x01(\t\x12\x12\n\nchineseSeg\x18\x37 \x01(\t\x12\x16\n\x0e\x63hineseXMLChar\x18< \x01(\t\x12\x13\n\x0bsectionName\x18\x38 \x01(\t\x12\x15\n\rsectionAuthor\x18\x39 \x01(\t\x12\x13\n\x0bsectionDate\x18: \x01(\t\x12\x17\n\x0fsectionEndLabel\x18; \x01(\t\x12\x0e\n\x06parent\x18= \x01(\t\x12\x19\n\x11\x63orefMentionIndex\x18@ \x03(\r\x12\x1a\n\x12\x65ntityMentionIndex\x18\x41 \x01(\r*\x05\x08\x64\x10\x80\x02\"\xe4\x03\n\x05Quote\x12\x0c\n\x04text\x18\x01 \x01(\t\x12\r\n\x05\x62\x65gin\x18\x02 \x01(\r\x12\x0b\n\x03\x65nd\x18\x03 \x01(\r\x12\x15\n\rsentenceBegin\x18\x05 \x01(\r\x12\x13\n\x0bsentenceEnd\x18\x06 \x01(\r\x12\x12\n\ntokenBegin\x18\x07 \x01(\r\x12\x10\n\x08tokenEnd\x18\x08 \x01(\r\x12\r\n\x05\x64ocid\x18\t \x01(\t\x12\r\n\x05index\x18\n \x01(\r\x12\x0e\n\x06\x61uthor\x18\x0b \x01(\t\x12\x0f\n\x07mention\x18\x0c \x01(\t\x12\x14\n\x0cmentionBegin\x18\r \x01(\r\x12\x12\n\nmentionEnd\x18\x0e \x01(\r\x12\x13\n\x0bmentionType\x18\x0f \x01(\t\x12\x14\n\x0cmentionSieve\x18\x10 \x01(\t\x12\x0f\n\x07speaker\x18\x11 \x01(\t\x12\x14\n\x0cspeakerSieve\x18\x12 \x01(\t\x12\x18\n\x10\x63\x61nonicalMention\x18\x13 \x01(\t\x12\x1d\n\x15\x63\x61nonicalMentionBegin\x18\x14 \x01(\r\x12\x1b\n\x13\x63\x61nonicalMentionEnd\x18\x15 \x01(\r\x12N\n\x1a\x61ttributionDependencyGraph\x18\x16 \x01(\x0b\x32*.edu.stanford.nlp.pipeline.DependencyGraph\"\xc7\x01\n\tParseTree\x12\x33\n\x05\x63hild\x18\x01 \x03(\x0b\x32$.edu.stanford.nlp.pipeline.ParseTree\x12\r\n\x05value\x18\x02 \x01(\t\x12\x17\n\x0fyieldBeginIndex\x18\x03 \x01(\r\x12\x15\n\ryieldEndIndex\x18\x04 \x01(\r\x12\r\n\x05score\x18\x05 \x01(\x01\x12\x37\n\tsentiment\x18\x06 \x01(\x0e\x32$.edu.stanford.nlp.pipeline.Sentiment\"\x96\x03\n\x0f\x44\x65pendencyGraph\x12=\n\x04node\x18\x01 \x03(\x0b\x32/.edu.stanford.nlp.pipeline.DependencyGraph.Node\x12=\n\x04\x65\x64ge\x18\x02 \x03(\x0b\x32/.edu.stanford.nlp.pipeline.DependencyGraph.Edge\x12\x10\n\x04root\x18\x03 \x03(\rB\x02\x10\x01\x1a\x44\n\x04Node\x12\x15\n\rsentenceIndex\x18\x01 \x02(\r\x12\r\n\x05index\x18\x02 \x02(\r\x12\x16\n\x0e\x63opyAnnotation\x18\x03 \x01(\r\x1a\xac\x01\n\x04\x45\x64ge\x12\x0e\n\x06source\x18\x01 \x02(\r\x12\x0e\n\x06target\x18\x02 \x02(\r\x12\x0b\n\x03\x64\x65p\x18\x03 \x01(\t\x12\x0f\n\x07isExtra\x18\x04 \x01(\x08\x12\x12\n\nsourceCopy\x18\x05 \x01(\r\x12\x12\n\ntargetCopy\x18\x06 \x01(\r\x12>\n\x08language\x18\x07 \x01(\x0e\x32#.edu.stanford.nlp.pipeline.Language:\x07Unknown\"\xc6\x02\n\nCorefChain\x12\x0f\n\x07\x63hainID\x18\x01 \x02(\x05\x12\x43\n\x07mention\x18\x02 \x03(\x0b\x32\x32.edu.stanford.nlp.pipeline.CorefChain.CorefMention\x12\x16\n\x0erepresentative\x18\x03 \x02(\r\x1a\xc9\x01\n\x0c\x43orefMention\x12\x11\n\tmentionID\x18\x01 \x01(\x05\x12\x13\n\x0bmentionType\x18\x02 \x01(\t\x12\x0e\n\x06number\x18\x03 \x01(\t\x12\x0e\n\x06gender\x18\x04 \x01(\t\x12\x0f\n\x07\x61nimacy\x18\x05 \x01(\t\x12\x12\n\nbeginIndex\x18\x06 \x01(\r\x12\x10\n\x08\x65ndIndex\x18\x07 \x01(\r\x12\x11\n\theadIndex\x18\t \x01(\r\x12\x15\n\rsentenceIndex\x18\n \x01(\r\x12\x10\n\x08position\x18\x0b \x01(\r\"\xef\x08\n\x07Mention\x12\x11\n\tmentionID\x18\x01 \x01(\x05\x12\x13\n\x0bmentionType\x18\x02 \x01(\t\x12\x0e\n\x06number\x18\x03 \x01(\t\x12\x0e\n\x06gender\x18\x04 \x01(\t\x12\x0f\n\x07\x61nimacy\x18\x05 \x01(\t\x12\x0e\n\x06person\x18\x06 \x01(\t\x12\x12\n\nstartIndex\x18\x07 \x01(\r\x12\x10\n\x08\x65ndIndex\x18\t \x01(\r\x12\x11\n\theadIndex\x18\n \x01(\r\x12\x12\n\nheadString\x18\x0b \x01(\t\x12\x11\n\tnerString\x18\x0c \x01(\t\x12\x13\n\x0boriginalRef\x18\r \x01(\r\x12\x1a\n\x12goldCorefClusterID\x18\x0e \x01(\x05\x12\x16\n\x0e\x63orefClusterID\x18\x0f \x01(\x05\x12\x12\n\nmentionNum\x18\x10 \x01(\r\x12\x0f\n\x07sentNum\x18\x11 \x01(\r\x12\r\n\x05utter\x18\x12 \x01(\r\x12\x11\n\tparagraph\x18\x13 \x01(\r\x12\x11\n\tisSubject\x18\x14 \x01(\x08\x12\x16\n\x0eisDirectObject\x18\x15 \x01(\x08\x12\x18\n\x10isIndirectObject\x18\x16 \x01(\x08\x12\x1b\n\x13isPrepositionObject\x18\x17 \x01(\x08\x12\x0f\n\x07hasTwin\x18\x18 \x01(\x08\x12\x0f\n\x07generic\x18\x19 \x01(\x08\x12\x13\n\x0bisSingleton\x18\x1a \x01(\x08\x12\x1a\n\x12hasBasicDependency\x18\x1b \x01(\x08\x12\x1d\n\x15hasEnhancedDepenedncy\x18\x1c \x01(\x08\x12\x1b\n\x13hasContextParseTree\x18\x1d \x01(\x08\x12?\n\x0fheadIndexedWord\x18\x1e \x01(\x0b\x32&.edu.stanford.nlp.pipeline.IndexedWord\x12=\n\rdependingVerb\x18\x1f \x01(\x0b\x32&.edu.stanford.nlp.pipeline.IndexedWord\x12\x38\n\x08headWord\x18 \x01(\x0b\x32&.edu.stanford.nlp.pipeline.IndexedWord\x12;\n\x0bspeakerInfo\x18! \x01(\x0b\x32&.edu.stanford.nlp.pipeline.SpeakerInfo\x12=\n\rsentenceWords\x18\x32 \x03(\x0b\x32&.edu.stanford.nlp.pipeline.IndexedWord\x12<\n\x0coriginalSpan\x18\x33 \x03(\x0b\x32&.edu.stanford.nlp.pipeline.IndexedWord\x12\x12\n\ndependents\x18\x34 \x03(\t\x12\x19\n\x11preprocessedTerms\x18\x35 \x03(\t\x12\x13\n\x0b\x61ppositions\x18\x36 \x03(\x05\x12\x1c\n\x14predicateNominatives\x18\x37 \x03(\x05\x12\x18\n\x10relativePronouns\x18\x38 \x03(\x05\x12\x13\n\x0blistMembers\x18\x39 \x03(\x05\x12\x15\n\rbelongToLists\x18: \x03(\x05\"X\n\x0bIndexedWord\x12\x13\n\x0bsentenceNum\x18\x01 \x01(\r\x12\x12\n\ntokenIndex\x18\x02 \x01(\r\x12\r\n\x05\x64ocID\x18\x03 \x01(\r\x12\x11\n\tcopyCount\x18\x04 \x01(\r\"4\n\x0bSpeakerInfo\x12\x13\n\x0bspeakerName\x18\x01 \x01(\t\x12\x10\n\x08mentions\x18\x02 \x03(\x05\"\"\n\x04Span\x12\r\n\x05\x62\x65gin\x18\x01 \x02(\r\x12\x0b\n\x03\x65nd\x18\x02 \x02(\r\"w\n\x05Timex\x12\r\n\x05value\x18\x01 \x01(\t\x12\x10\n\x08\x61ltValue\x18\x02 \x01(\t\x12\x0c\n\x04text\x18\x03 \x01(\t\x12\x0c\n\x04type\x18\x04 \x01(\t\x12\x0b\n\x03tid\x18\x05 \x01(\t\x12\x12\n\nbeginPoint\x18\x06 \x01(\r\x12\x10\n\x08\x65ndPoint\x18\x07 \x01(\r\"\xdb\x01\n\x06\x45ntity\x12\x11\n\theadStart\x18\x06 \x01(\r\x12\x0f\n\x07headEnd\x18\x07 \x01(\r\x12\x13\n\x0bmentionType\x18\x08 \x01(\t\x12\x16\n\x0enormalizedName\x18\t \x01(\t\x12\x16\n\x0eheadTokenIndex\x18\n \x01(\r\x12\x0f\n\x07\x63orefID\x18\x0b \x01(\t\x12\x10\n\x08objectID\x18\x01 \x01(\t\x12\x13\n\x0b\x65xtentStart\x18\x02 \x01(\r\x12\x11\n\textentEnd\x18\x03 \x01(\r\x12\x0c\n\x04type\x18\x04 \x01(\t\x12\x0f\n\x07subtype\x18\x05 \x01(\t\"\xb7\x01\n\x08Relation\x12\x0f\n\x07\x61rgName\x18\x06 \x03(\t\x12.\n\x03\x61rg\x18\x07 \x03(\x0b\x32!.edu.stanford.nlp.pipeline.Entity\x12\x11\n\tsignature\x18\x08 \x01(\t\x12\x10\n\x08objectID\x18\x01 \x01(\t\x12\x13\n\x0b\x65xtentStart\x18\x02 \x01(\r\x12\x11\n\textentEnd\x18\x03 \x01(\r\x12\x0c\n\x04type\x18\x04 \x01(\t\x12\x0f\n\x07subtype\x18\x05 \x01(\t\"\xb2\x01\n\x08Operator\x12\x0c\n\x04name\x18\x01 \x02(\t\x12\x1b\n\x13quantifierSpanBegin\x18\x02 \x02(\x05\x12\x19\n\x11quantifierSpanEnd\x18\x03 \x02(\x05\x12\x18\n\x10subjectSpanBegin\x18\x04 \x02(\x05\x12\x16\n\x0esubjectSpanEnd\x18\x05 \x02(\x05\x12\x17\n\x0fobjectSpanBegin\x18\x06 \x02(\x05\x12\x15\n\robjectSpanEnd\x18\x07 \x02(\x05\"\xa9\x04\n\x08Polarity\x12K\n\x12projectEquivalence\x18\x01 \x02(\x0e\x32/.edu.stanford.nlp.pipeline.NaturalLogicRelation\x12Q\n\x18projectForwardEntailment\x18\x02 \x02(\x0e\x32/.edu.stanford.nlp.pipeline.NaturalLogicRelation\x12Q\n\x18projectReverseEntailment\x18\x03 \x02(\x0e\x32/.edu.stanford.nlp.pipeline.NaturalLogicRelation\x12H\n\x0fprojectNegation\x18\x04 \x02(\x0e\x32/.edu.stanford.nlp.pipeline.NaturalLogicRelation\x12K\n\x12projectAlternation\x18\x05 \x02(\x0e\x32/.edu.stanford.nlp.pipeline.NaturalLogicRelation\x12\x45\n\x0cprojectCover\x18\x06 \x02(\x0e\x32/.edu.stanford.nlp.pipeline.NaturalLogicRelation\x12L\n\x13projectIndependence\x18\x07 \x02(\x0e\x32/.edu.stanford.nlp.pipeline.NaturalLogicRelation\"\xdd\x02\n\nNERMention\x12\x15\n\rsentenceIndex\x18\x01 \x01(\r\x12%\n\x1dtokenStartInSentenceInclusive\x18\x02 \x02(\r\x12#\n\x1btokenEndInSentenceExclusive\x18\x03 \x02(\r\x12\x0b\n\x03ner\x18\x04 \x02(\t\x12\x15\n\rnormalizedNER\x18\x05 \x01(\t\x12\x12\n\nentityType\x18\x06 \x01(\t\x12/\n\x05timex\x18\x07 \x01(\x0b\x32 .edu.stanford.nlp.pipeline.Timex\x12\x17\n\x0fwikipediaEntity\x18\x08 \x01(\t\x12\x0e\n\x06gender\x18\t \x01(\t\x12\x1a\n\x12\x65ntityMentionIndex\x18\n \x01(\r\x12#\n\x1b\x63\x61nonicalEntityMentionIndex\x18\x0b \x01(\r\x12\x19\n\x11\x65ntityMentionText\x18\x0c \x01(\t\"Y\n\x10SentenceFragment\x12\x12\n\ntokenIndex\x18\x01 \x03(\r\x12\x0c\n\x04root\x18\x02 \x01(\r\x12\x14\n\x0c\x61ssumedTruth\x18\x03 \x01(\x08\x12\r\n\x05score\x18\x04 \x01(\x01\":\n\rTokenLocation\x12\x15\n\rsentenceIndex\x18\x01 \x01(\r\x12\x12\n\ntokenIndex\x18\x02 \x01(\r\"\x9a\x03\n\x0eRelationTriple\x12\x0f\n\x07subject\x18\x01 \x01(\t\x12\x10\n\x08relation\x18\x02 \x01(\t\x12\x0e\n\x06object\x18\x03 \x01(\t\x12\x12\n\nconfidence\x18\x04 \x01(\x01\x12?\n\rsubjectTokens\x18\r \x03(\x0b\x32(.edu.stanford.nlp.pipeline.TokenLocation\x12@\n\x0erelationTokens\x18\x0e \x03(\x0b\x32(.edu.stanford.nlp.pipeline.TokenLocation\x12>\n\x0cobjectTokens\x18\x0f \x03(\x0b\x32(.edu.stanford.nlp.pipeline.TokenLocation\x12\x38\n\x04tree\x18\x08 \x01(\x0b\x32*.edu.stanford.nlp.pipeline.DependencyGraph\x12\x0e\n\x06istmod\x18\t \x01(\x08\x12\x10\n\x08prefixBe\x18\n \x01(\x08\x12\x10\n\x08suffixBe\x18\x0b \x01(\x08\x12\x10\n\x08suffixOf\x18\x0c \x01(\x08\"-\n\x0fMapStringString\x12\x0b\n\x03key\x18\x01 \x03(\t\x12\r\n\x05value\x18\x02 \x03(\t\"*\n\x0cMapIntString\x12\x0b\n\x03key\x18\x01 \x03(\r\x12\r\n\x05value\x18\x02 \x03(\t\"\xfc\x01\n\x07Section\x12\x11\n\tcharBegin\x18\x01 \x02(\r\x12\x0f\n\x07\x63harEnd\x18\x02 \x02(\r\x12\x0e\n\x06\x61uthor\x18\x03 \x01(\t\x12\x17\n\x0fsentenceIndexes\x18\x04 \x03(\r\x12\x10\n\x08\x64\x61tetime\x18\x05 \x01(\t\x12\x30\n\x06quotes\x18\x06 \x03(\x0b\x32 .edu.stanford.nlp.pipeline.Quote\x12\x17\n\x0f\x61uthorCharBegin\x18\x07 \x01(\r\x12\x15\n\rauthorCharEnd\x18\x08 \x01(\r\x12\x30\n\x06xmlTag\x18\t \x02(\x0b\x32 .edu.stanford.nlp.pipeline.Token*\xa3\x01\n\x08Language\x12\x0b\n\x07Unknown\x10\x00\x12\x07\n\x03\x41ny\x10\x01\x12\n\n\x06\x41rabic\x10\x02\x12\x0b\n\x07\x43hinese\x10\x03\x12\x0b\n\x07\x45nglish\x10\x04\x12\n\n\x06German\x10\x05\x12\n\n\x06\x46rench\x10\x06\x12\n\n\x06Hebrew\x10\x07\x12\x0b\n\x07Spanish\x10\x08\x12\x14\n\x10UniversalEnglish\x10\t\x12\x14\n\x10UniversalChinese\x10\n*h\n\tSentiment\x12\x13\n\x0fSTRONG_NEGATIVE\x10\x00\x12\x11\n\rWEAK_NEGATIVE\x10\x01\x12\x0b\n\x07NEUTRAL\x10\x02\x12\x11\n\rWEAK_POSITIVE\x10\x03\x12\x13\n\x0fSTRONG_POSITIVE\x10\x04*\x93\x01\n\x14NaturalLogicRelation\x12\x0f\n\x0b\x45QUIVALENCE\x10\x00\x12\x16\n\x12\x46ORWARD_ENTAILMENT\x10\x01\x12\x16\n\x12REVERSE_ENTAILMENT\x10\x02\x12\x0c\n\x08NEGATION\x10\x03\x12\x0f\n\x0b\x41LTERNATION\x10\x04\x12\t\n\x05\x43OVER\x10\x05\x12\x10\n\x0cINDEPENDENCE\x10\x06\x42*\n\x19\x65\x64u.stanford.nlp.pipelineB\rCoreNLPProtos') 24 | ) 25 | 26 | _LANGUAGE = _descriptor.EnumDescriptor( 27 | name='Language', 28 | full_name='edu.stanford.nlp.pipeline.Language', 29 | filename=None, 30 | file=DESCRIPTOR, 31 | values=[ 32 | _descriptor.EnumValueDescriptor( 33 | name='Unknown', index=0, number=0, 34 | options=None, 35 | type=None), 36 | _descriptor.EnumValueDescriptor( 37 | name='Any', index=1, number=1, 38 | options=None, 39 | type=None), 40 | _descriptor.EnumValueDescriptor( 41 | name='Arabic', index=2, number=2, 42 | options=None, 43 | type=None), 44 | _descriptor.EnumValueDescriptor( 45 | name='Chinese', index=3, number=3, 46 | options=None, 47 | type=None), 48 | _descriptor.EnumValueDescriptor( 49 | name='English', index=4, number=4, 50 | options=None, 51 | type=None), 52 | _descriptor.EnumValueDescriptor( 53 | name='German', index=5, number=5, 54 | options=None, 55 | type=None), 56 | _descriptor.EnumValueDescriptor( 57 | name='French', index=6, number=6, 58 | options=None, 59 | type=None), 60 | _descriptor.EnumValueDescriptor( 61 | name='Hebrew', index=7, number=7, 62 | options=None, 63 | type=None), 64 | _descriptor.EnumValueDescriptor( 65 | name='Spanish', index=8, number=8, 66 | options=None, 67 | type=None), 68 | _descriptor.EnumValueDescriptor( 69 | name='UniversalEnglish', index=9, number=9, 70 | options=None, 71 | type=None), 72 | _descriptor.EnumValueDescriptor( 73 | name='UniversalChinese', index=10, number=10, 74 | options=None, 75 | type=None), 76 | ], 77 | containing_type=None, 78 | options=None, 79 | serialized_start=9323, 80 | serialized_end=9486, 81 | ) 82 | _sym_db.RegisterEnumDescriptor(_LANGUAGE) 83 | 84 | Language = enum_type_wrapper.EnumTypeWrapper(_LANGUAGE) 85 | _SENTIMENT = _descriptor.EnumDescriptor( 86 | name='Sentiment', 87 | full_name='edu.stanford.nlp.pipeline.Sentiment', 88 | filename=None, 89 | file=DESCRIPTOR, 90 | values=[ 91 | _descriptor.EnumValueDescriptor( 92 | name='STRONG_NEGATIVE', index=0, number=0, 93 | options=None, 94 | type=None), 95 | _descriptor.EnumValueDescriptor( 96 | name='WEAK_NEGATIVE', index=1, number=1, 97 | options=None, 98 | type=None), 99 | _descriptor.EnumValueDescriptor( 100 | name='NEUTRAL', index=2, number=2, 101 | options=None, 102 | type=None), 103 | _descriptor.EnumValueDescriptor( 104 | name='WEAK_POSITIVE', index=3, number=3, 105 | options=None, 106 | type=None), 107 | _descriptor.EnumValueDescriptor( 108 | name='STRONG_POSITIVE', index=4, number=4, 109 | options=None, 110 | type=None), 111 | ], 112 | containing_type=None, 113 | options=None, 114 | serialized_start=9488, 115 | serialized_end=9592, 116 | ) 117 | _sym_db.RegisterEnumDescriptor(_SENTIMENT) 118 | 119 | Sentiment = enum_type_wrapper.EnumTypeWrapper(_SENTIMENT) 120 | _NATURALLOGICRELATION = _descriptor.EnumDescriptor( 121 | name='NaturalLogicRelation', 122 | full_name='edu.stanford.nlp.pipeline.NaturalLogicRelation', 123 | filename=None, 124 | file=DESCRIPTOR, 125 | values=[ 126 | _descriptor.EnumValueDescriptor( 127 | name='EQUIVALENCE', index=0, number=0, 128 | options=None, 129 | type=None), 130 | _descriptor.EnumValueDescriptor( 131 | name='FORWARD_ENTAILMENT', index=1, number=1, 132 | options=None, 133 | type=None), 134 | _descriptor.EnumValueDescriptor( 135 | name='REVERSE_ENTAILMENT', index=2, number=2, 136 | options=None, 137 | type=None), 138 | _descriptor.EnumValueDescriptor( 139 | name='NEGATION', index=3, number=3, 140 | options=None, 141 | type=None), 142 | _descriptor.EnumValueDescriptor( 143 | name='ALTERNATION', index=4, number=4, 144 | options=None, 145 | type=None), 146 | _descriptor.EnumValueDescriptor( 147 | name='COVER', index=5, number=5, 148 | options=None, 149 | type=None), 150 | _descriptor.EnumValueDescriptor( 151 | name='INDEPENDENCE', index=6, number=6, 152 | options=None, 153 | type=None), 154 | ], 155 | containing_type=None, 156 | options=None, 157 | serialized_start=9595, 158 | serialized_end=9742, 159 | ) 160 | _sym_db.RegisterEnumDescriptor(_NATURALLOGICRELATION) 161 | 162 | NaturalLogicRelation = enum_type_wrapper.EnumTypeWrapper(_NATURALLOGICRELATION) 163 | Unknown = 0 164 | Any = 1 165 | Arabic = 2 166 | Chinese = 3 167 | English = 4 168 | German = 5 169 | French = 6 170 | Hebrew = 7 171 | Spanish = 8 172 | UniversalEnglish = 9 173 | UniversalChinese = 10 174 | STRONG_NEGATIVE = 0 175 | WEAK_NEGATIVE = 1 176 | NEUTRAL = 2 177 | WEAK_POSITIVE = 3 178 | STRONG_POSITIVE = 4 179 | EQUIVALENCE = 0 180 | FORWARD_ENTAILMENT = 1 181 | REVERSE_ENTAILMENT = 2 182 | NEGATION = 3 183 | ALTERNATION = 4 184 | COVER = 5 185 | INDEPENDENCE = 6 186 | 187 | 188 | 189 | _DOCUMENT = _descriptor.Descriptor( 190 | name='Document', 191 | full_name='edu.stanford.nlp.pipeline.Document', 192 | filename=None, 193 | file=DESCRIPTOR, 194 | containing_type=None, 195 | fields=[ 196 | _descriptor.FieldDescriptor( 197 | name='text', full_name='edu.stanford.nlp.pipeline.Document.text', index=0, 198 | number=1, type=9, cpp_type=9, label=2, 199 | has_default_value=False, default_value=_b("").decode('utf-8'), 200 | message_type=None, enum_type=None, containing_type=None, 201 | is_extension=False, extension_scope=None, 202 | options=None, file=DESCRIPTOR), 203 | _descriptor.FieldDescriptor( 204 | name='sentence', full_name='edu.stanford.nlp.pipeline.Document.sentence', index=1, 205 | number=2, type=11, cpp_type=10, label=3, 206 | has_default_value=False, default_value=[], 207 | message_type=None, enum_type=None, containing_type=None, 208 | is_extension=False, extension_scope=None, 209 | options=None, file=DESCRIPTOR), 210 | _descriptor.FieldDescriptor( 211 | name='corefChain', full_name='edu.stanford.nlp.pipeline.Document.corefChain', index=2, 212 | number=3, type=11, cpp_type=10, label=3, 213 | has_default_value=False, default_value=[], 214 | message_type=None, enum_type=None, containing_type=None, 215 | is_extension=False, extension_scope=None, 216 | options=None, file=DESCRIPTOR), 217 | _descriptor.FieldDescriptor( 218 | name='docID', full_name='edu.stanford.nlp.pipeline.Document.docID', index=3, 219 | number=4, type=9, cpp_type=9, label=1, 220 | has_default_value=False, default_value=_b("").decode('utf-8'), 221 | message_type=None, enum_type=None, containing_type=None, 222 | is_extension=False, extension_scope=None, 223 | options=None, file=DESCRIPTOR), 224 | _descriptor.FieldDescriptor( 225 | name='docDate', full_name='edu.stanford.nlp.pipeline.Document.docDate', index=4, 226 | number=7, type=9, cpp_type=9, label=1, 227 | has_default_value=False, default_value=_b("").decode('utf-8'), 228 | message_type=None, enum_type=None, containing_type=None, 229 | is_extension=False, extension_scope=None, 230 | options=None, file=DESCRIPTOR), 231 | _descriptor.FieldDescriptor( 232 | name='calendar', full_name='edu.stanford.nlp.pipeline.Document.calendar', index=5, 233 | number=8, type=4, cpp_type=4, label=1, 234 | has_default_value=False, default_value=0, 235 | message_type=None, enum_type=None, containing_type=None, 236 | is_extension=False, extension_scope=None, 237 | options=None, file=DESCRIPTOR), 238 | _descriptor.FieldDescriptor( 239 | name='sentencelessToken', full_name='edu.stanford.nlp.pipeline.Document.sentencelessToken', index=6, 240 | number=5, type=11, cpp_type=10, label=3, 241 | has_default_value=False, default_value=[], 242 | message_type=None, enum_type=None, containing_type=None, 243 | is_extension=False, extension_scope=None, 244 | options=None, file=DESCRIPTOR), 245 | _descriptor.FieldDescriptor( 246 | name='character', full_name='edu.stanford.nlp.pipeline.Document.character', index=7, 247 | number=10, type=11, cpp_type=10, label=3, 248 | has_default_value=False, default_value=[], 249 | message_type=None, enum_type=None, containing_type=None, 250 | is_extension=False, extension_scope=None, 251 | options=None, file=DESCRIPTOR), 252 | _descriptor.FieldDescriptor( 253 | name='quote', full_name='edu.stanford.nlp.pipeline.Document.quote', index=8, 254 | number=6, type=11, cpp_type=10, label=3, 255 | has_default_value=False, default_value=[], 256 | message_type=None, enum_type=None, containing_type=None, 257 | is_extension=False, extension_scope=None, 258 | options=None, file=DESCRIPTOR), 259 | _descriptor.FieldDescriptor( 260 | name='mentions', full_name='edu.stanford.nlp.pipeline.Document.mentions', index=9, 261 | number=9, type=11, cpp_type=10, label=3, 262 | has_default_value=False, default_value=[], 263 | message_type=None, enum_type=None, containing_type=None, 264 | is_extension=False, extension_scope=None, 265 | options=None, file=DESCRIPTOR), 266 | _descriptor.FieldDescriptor( 267 | name='hasEntityMentionsAnnotation', full_name='edu.stanford.nlp.pipeline.Document.hasEntityMentionsAnnotation', index=10, 268 | number=13, type=8, cpp_type=7, label=1, 269 | has_default_value=False, default_value=False, 270 | message_type=None, enum_type=None, containing_type=None, 271 | is_extension=False, extension_scope=None, 272 | options=None, file=DESCRIPTOR), 273 | _descriptor.FieldDescriptor( 274 | name='xmlDoc', full_name='edu.stanford.nlp.pipeline.Document.xmlDoc', index=11, 275 | number=11, type=8, cpp_type=7, label=1, 276 | has_default_value=False, default_value=False, 277 | message_type=None, enum_type=None, containing_type=None, 278 | is_extension=False, extension_scope=None, 279 | options=None, file=DESCRIPTOR), 280 | _descriptor.FieldDescriptor( 281 | name='sections', full_name='edu.stanford.nlp.pipeline.Document.sections', index=12, 282 | number=12, type=11, cpp_type=10, label=3, 283 | has_default_value=False, default_value=[], 284 | message_type=None, enum_type=None, containing_type=None, 285 | is_extension=False, extension_scope=None, 286 | options=None, file=DESCRIPTOR), 287 | _descriptor.FieldDescriptor( 288 | name='mentionsForCoref', full_name='edu.stanford.nlp.pipeline.Document.mentionsForCoref', index=13, 289 | number=14, type=11, cpp_type=10, label=3, 290 | has_default_value=False, default_value=[], 291 | message_type=None, enum_type=None, containing_type=None, 292 | is_extension=False, extension_scope=None, 293 | options=None, file=DESCRIPTOR), 294 | _descriptor.FieldDescriptor( 295 | name='hasCorefMentionAnnotation', full_name='edu.stanford.nlp.pipeline.Document.hasCorefMentionAnnotation', index=14, 296 | number=15, type=8, cpp_type=7, label=1, 297 | has_default_value=False, default_value=False, 298 | message_type=None, enum_type=None, containing_type=None, 299 | is_extension=False, extension_scope=None, 300 | options=None, file=DESCRIPTOR), 301 | _descriptor.FieldDescriptor( 302 | name='hasCorefAnnotation', full_name='edu.stanford.nlp.pipeline.Document.hasCorefAnnotation', index=15, 303 | number=16, type=8, cpp_type=7, label=1, 304 | has_default_value=False, default_value=False, 305 | message_type=None, enum_type=None, containing_type=None, 306 | is_extension=False, extension_scope=None, 307 | options=None, file=DESCRIPTOR), 308 | _descriptor.FieldDescriptor( 309 | name='corefMentionToEntityMentionMappings', full_name='edu.stanford.nlp.pipeline.Document.corefMentionToEntityMentionMappings', index=16, 310 | number=17, type=13, cpp_type=3, label=3, 311 | has_default_value=False, default_value=[], 312 | message_type=None, enum_type=None, containing_type=None, 313 | is_extension=False, extension_scope=None, 314 | options=None, file=DESCRIPTOR), 315 | _descriptor.FieldDescriptor( 316 | name='entityMentionToCorefMentionMappings', full_name='edu.stanford.nlp.pipeline.Document.entityMentionToCorefMentionMappings', index=17, 317 | number=18, type=13, cpp_type=3, label=3, 318 | has_default_value=False, default_value=[], 319 | message_type=None, enum_type=None, containing_type=None, 320 | is_extension=False, extension_scope=None, 321 | options=None, file=DESCRIPTOR), 322 | ], 323 | extensions=[ 324 | ], 325 | nested_types=[], 326 | enum_types=[ 327 | ], 328 | options=None, 329 | is_extendable=True, 330 | syntax='proto2', 331 | extension_ranges=[(100, 256), ], 332 | oneofs=[ 333 | ], 334 | serialized_start=45, 335 | serialized_end=782, 336 | ) 337 | 338 | 339 | _SENTENCE = _descriptor.Descriptor( 340 | name='Sentence', 341 | full_name='edu.stanford.nlp.pipeline.Sentence', 342 | filename=None, 343 | file=DESCRIPTOR, 344 | containing_type=None, 345 | fields=[ 346 | _descriptor.FieldDescriptor( 347 | name='token', full_name='edu.stanford.nlp.pipeline.Sentence.token', index=0, 348 | number=1, type=11, cpp_type=10, label=3, 349 | has_default_value=False, default_value=[], 350 | message_type=None, enum_type=None, containing_type=None, 351 | is_extension=False, extension_scope=None, 352 | options=None, file=DESCRIPTOR), 353 | _descriptor.FieldDescriptor( 354 | name='tokenOffsetBegin', full_name='edu.stanford.nlp.pipeline.Sentence.tokenOffsetBegin', index=1, 355 | number=2, type=13, cpp_type=3, label=2, 356 | has_default_value=False, default_value=0, 357 | message_type=None, enum_type=None, containing_type=None, 358 | is_extension=False, extension_scope=None, 359 | options=None, file=DESCRIPTOR), 360 | _descriptor.FieldDescriptor( 361 | name='tokenOffsetEnd', full_name='edu.stanford.nlp.pipeline.Sentence.tokenOffsetEnd', index=2, 362 | number=3, type=13, cpp_type=3, label=2, 363 | has_default_value=False, default_value=0, 364 | message_type=None, enum_type=None, containing_type=None, 365 | is_extension=False, extension_scope=None, 366 | options=None, file=DESCRIPTOR), 367 | _descriptor.FieldDescriptor( 368 | name='sentenceIndex', full_name='edu.stanford.nlp.pipeline.Sentence.sentenceIndex', index=3, 369 | number=4, type=13, cpp_type=3, label=1, 370 | has_default_value=False, default_value=0, 371 | message_type=None, enum_type=None, containing_type=None, 372 | is_extension=False, extension_scope=None, 373 | options=None, file=DESCRIPTOR), 374 | _descriptor.FieldDescriptor( 375 | name='characterOffsetBegin', full_name='edu.stanford.nlp.pipeline.Sentence.characterOffsetBegin', index=4, 376 | number=5, type=13, cpp_type=3, label=1, 377 | has_default_value=False, default_value=0, 378 | message_type=None, enum_type=None, containing_type=None, 379 | is_extension=False, extension_scope=None, 380 | options=None, file=DESCRIPTOR), 381 | _descriptor.FieldDescriptor( 382 | name='characterOffsetEnd', full_name='edu.stanford.nlp.pipeline.Sentence.characterOffsetEnd', index=5, 383 | number=6, type=13, cpp_type=3, label=1, 384 | has_default_value=False, default_value=0, 385 | message_type=None, enum_type=None, containing_type=None, 386 | is_extension=False, extension_scope=None, 387 | options=None, file=DESCRIPTOR), 388 | _descriptor.FieldDescriptor( 389 | name='parseTree', full_name='edu.stanford.nlp.pipeline.Sentence.parseTree', index=6, 390 | number=7, type=11, cpp_type=10, label=1, 391 | has_default_value=False, default_value=None, 392 | message_type=None, enum_type=None, containing_type=None, 393 | is_extension=False, extension_scope=None, 394 | options=None, file=DESCRIPTOR), 395 | _descriptor.FieldDescriptor( 396 | name='binarizedParseTree', full_name='edu.stanford.nlp.pipeline.Sentence.binarizedParseTree', index=7, 397 | number=31, type=11, cpp_type=10, label=1, 398 | has_default_value=False, default_value=None, 399 | message_type=None, enum_type=None, containing_type=None, 400 | is_extension=False, extension_scope=None, 401 | options=None, file=DESCRIPTOR), 402 | _descriptor.FieldDescriptor( 403 | name='annotatedParseTree', full_name='edu.stanford.nlp.pipeline.Sentence.annotatedParseTree', index=8, 404 | number=32, type=11, cpp_type=10, label=1, 405 | has_default_value=False, default_value=None, 406 | message_type=None, enum_type=None, containing_type=None, 407 | is_extension=False, extension_scope=None, 408 | options=None, file=DESCRIPTOR), 409 | _descriptor.FieldDescriptor( 410 | name='sentiment', full_name='edu.stanford.nlp.pipeline.Sentence.sentiment', index=9, 411 | number=33, type=9, cpp_type=9, label=1, 412 | has_default_value=False, default_value=_b("").decode('utf-8'), 413 | message_type=None, enum_type=None, containing_type=None, 414 | is_extension=False, extension_scope=None, 415 | options=None, file=DESCRIPTOR), 416 | _descriptor.FieldDescriptor( 417 | name='kBestParseTrees', full_name='edu.stanford.nlp.pipeline.Sentence.kBestParseTrees', index=10, 418 | number=34, type=11, cpp_type=10, label=3, 419 | has_default_value=False, default_value=[], 420 | message_type=None, enum_type=None, containing_type=None, 421 | is_extension=False, extension_scope=None, 422 | options=None, file=DESCRIPTOR), 423 | _descriptor.FieldDescriptor( 424 | name='basicDependencies', full_name='edu.stanford.nlp.pipeline.Sentence.basicDependencies', index=11, 425 | number=8, type=11, cpp_type=10, label=1, 426 | has_default_value=False, default_value=None, 427 | message_type=None, enum_type=None, containing_type=None, 428 | is_extension=False, extension_scope=None, 429 | options=None, file=DESCRIPTOR), 430 | _descriptor.FieldDescriptor( 431 | name='collapsedDependencies', full_name='edu.stanford.nlp.pipeline.Sentence.collapsedDependencies', index=12, 432 | number=9, type=11, cpp_type=10, label=1, 433 | has_default_value=False, default_value=None, 434 | message_type=None, enum_type=None, containing_type=None, 435 | is_extension=False, extension_scope=None, 436 | options=None, file=DESCRIPTOR), 437 | _descriptor.FieldDescriptor( 438 | name='collapsedCCProcessedDependencies', full_name='edu.stanford.nlp.pipeline.Sentence.collapsedCCProcessedDependencies', index=13, 439 | number=10, type=11, cpp_type=10, label=1, 440 | has_default_value=False, default_value=None, 441 | message_type=None, enum_type=None, containing_type=None, 442 | is_extension=False, extension_scope=None, 443 | options=None, file=DESCRIPTOR), 444 | _descriptor.FieldDescriptor( 445 | name='alternativeDependencies', full_name='edu.stanford.nlp.pipeline.Sentence.alternativeDependencies', index=14, 446 | number=13, type=11, cpp_type=10, label=1, 447 | has_default_value=False, default_value=None, 448 | message_type=None, enum_type=None, containing_type=None, 449 | is_extension=False, extension_scope=None, 450 | options=None, file=DESCRIPTOR), 451 | _descriptor.FieldDescriptor( 452 | name='openieTriple', full_name='edu.stanford.nlp.pipeline.Sentence.openieTriple', index=15, 453 | number=14, type=11, cpp_type=10, label=3, 454 | has_default_value=False, default_value=[], 455 | message_type=None, enum_type=None, containing_type=None, 456 | is_extension=False, extension_scope=None, 457 | options=None, file=DESCRIPTOR), 458 | _descriptor.FieldDescriptor( 459 | name='kbpTriple', full_name='edu.stanford.nlp.pipeline.Sentence.kbpTriple', index=16, 460 | number=16, type=11, cpp_type=10, label=3, 461 | has_default_value=False, default_value=[], 462 | message_type=None, enum_type=None, containing_type=None, 463 | is_extension=False, extension_scope=None, 464 | options=None, file=DESCRIPTOR), 465 | _descriptor.FieldDescriptor( 466 | name='entailedSentence', full_name='edu.stanford.nlp.pipeline.Sentence.entailedSentence', index=17, 467 | number=15, type=11, cpp_type=10, label=3, 468 | has_default_value=False, default_value=[], 469 | message_type=None, enum_type=None, containing_type=None, 470 | is_extension=False, extension_scope=None, 471 | options=None, file=DESCRIPTOR), 472 | _descriptor.FieldDescriptor( 473 | name='entailedClause', full_name='edu.stanford.nlp.pipeline.Sentence.entailedClause', index=18, 474 | number=35, type=11, cpp_type=10, label=3, 475 | has_default_value=False, default_value=[], 476 | message_type=None, enum_type=None, containing_type=None, 477 | is_extension=False, extension_scope=None, 478 | options=None, file=DESCRIPTOR), 479 | _descriptor.FieldDescriptor( 480 | name='enhancedDependencies', full_name='edu.stanford.nlp.pipeline.Sentence.enhancedDependencies', index=19, 481 | number=17, type=11, cpp_type=10, label=1, 482 | has_default_value=False, default_value=None, 483 | message_type=None, enum_type=None, containing_type=None, 484 | is_extension=False, extension_scope=None, 485 | options=None, file=DESCRIPTOR), 486 | _descriptor.FieldDescriptor( 487 | name='enhancedPlusPlusDependencies', full_name='edu.stanford.nlp.pipeline.Sentence.enhancedPlusPlusDependencies', index=20, 488 | number=18, type=11, cpp_type=10, label=1, 489 | has_default_value=False, default_value=None, 490 | message_type=None, enum_type=None, containing_type=None, 491 | is_extension=False, extension_scope=None, 492 | options=None, file=DESCRIPTOR), 493 | _descriptor.FieldDescriptor( 494 | name='character', full_name='edu.stanford.nlp.pipeline.Sentence.character', index=21, 495 | number=19, type=11, cpp_type=10, label=3, 496 | has_default_value=False, default_value=[], 497 | message_type=None, enum_type=None, containing_type=None, 498 | is_extension=False, extension_scope=None, 499 | options=None, file=DESCRIPTOR), 500 | _descriptor.FieldDescriptor( 501 | name='paragraph', full_name='edu.stanford.nlp.pipeline.Sentence.paragraph', index=22, 502 | number=11, type=13, cpp_type=3, label=1, 503 | has_default_value=False, default_value=0, 504 | message_type=None, enum_type=None, containing_type=None, 505 | is_extension=False, extension_scope=None, 506 | options=None, file=DESCRIPTOR), 507 | _descriptor.FieldDescriptor( 508 | name='text', full_name='edu.stanford.nlp.pipeline.Sentence.text', index=23, 509 | number=12, type=9, cpp_type=9, label=1, 510 | has_default_value=False, default_value=_b("").decode('utf-8'), 511 | message_type=None, enum_type=None, containing_type=None, 512 | is_extension=False, extension_scope=None, 513 | options=None, file=DESCRIPTOR), 514 | _descriptor.FieldDescriptor( 515 | name='lineNumber', full_name='edu.stanford.nlp.pipeline.Sentence.lineNumber', index=24, 516 | number=20, type=13, cpp_type=3, label=1, 517 | has_default_value=False, default_value=0, 518 | message_type=None, enum_type=None, containing_type=None, 519 | is_extension=False, extension_scope=None, 520 | options=None, file=DESCRIPTOR), 521 | _descriptor.FieldDescriptor( 522 | name='hasRelationAnnotations', full_name='edu.stanford.nlp.pipeline.Sentence.hasRelationAnnotations', index=25, 523 | number=51, type=8, cpp_type=7, label=1, 524 | has_default_value=False, default_value=False, 525 | message_type=None, enum_type=None, containing_type=None, 526 | is_extension=False, extension_scope=None, 527 | options=None, file=DESCRIPTOR), 528 | _descriptor.FieldDescriptor( 529 | name='entity', full_name='edu.stanford.nlp.pipeline.Sentence.entity', index=26, 530 | number=52, type=11, cpp_type=10, label=3, 531 | has_default_value=False, default_value=[], 532 | message_type=None, enum_type=None, containing_type=None, 533 | is_extension=False, extension_scope=None, 534 | options=None, file=DESCRIPTOR), 535 | _descriptor.FieldDescriptor( 536 | name='relation', full_name='edu.stanford.nlp.pipeline.Sentence.relation', index=27, 537 | number=53, type=11, cpp_type=10, label=3, 538 | has_default_value=False, default_value=[], 539 | message_type=None, enum_type=None, containing_type=None, 540 | is_extension=False, extension_scope=None, 541 | options=None, file=DESCRIPTOR), 542 | _descriptor.FieldDescriptor( 543 | name='hasNumerizedTokensAnnotation', full_name='edu.stanford.nlp.pipeline.Sentence.hasNumerizedTokensAnnotation', index=28, 544 | number=54, type=8, cpp_type=7, label=1, 545 | has_default_value=False, default_value=False, 546 | message_type=None, enum_type=None, containing_type=None, 547 | is_extension=False, extension_scope=None, 548 | options=None, file=DESCRIPTOR), 549 | _descriptor.FieldDescriptor( 550 | name='mentions', full_name='edu.stanford.nlp.pipeline.Sentence.mentions', index=29, 551 | number=55, type=11, cpp_type=10, label=3, 552 | has_default_value=False, default_value=[], 553 | message_type=None, enum_type=None, containing_type=None, 554 | is_extension=False, extension_scope=None, 555 | options=None, file=DESCRIPTOR), 556 | _descriptor.FieldDescriptor( 557 | name='mentionsForCoref', full_name='edu.stanford.nlp.pipeline.Sentence.mentionsForCoref', index=30, 558 | number=56, type=11, cpp_type=10, label=3, 559 | has_default_value=False, default_value=[], 560 | message_type=None, enum_type=None, containing_type=None, 561 | is_extension=False, extension_scope=None, 562 | options=None, file=DESCRIPTOR), 563 | _descriptor.FieldDescriptor( 564 | name='hasCorefMentionsAnnotation', full_name='edu.stanford.nlp.pipeline.Sentence.hasCorefMentionsAnnotation', index=31, 565 | number=57, type=8, cpp_type=7, label=1, 566 | has_default_value=False, default_value=False, 567 | message_type=None, enum_type=None, containing_type=None, 568 | is_extension=False, extension_scope=None, 569 | options=None, file=DESCRIPTOR), 570 | _descriptor.FieldDescriptor( 571 | name='sentenceID', full_name='edu.stanford.nlp.pipeline.Sentence.sentenceID', index=32, 572 | number=58, type=9, cpp_type=9, label=1, 573 | has_default_value=False, default_value=_b("").decode('utf-8'), 574 | message_type=None, enum_type=None, containing_type=None, 575 | is_extension=False, extension_scope=None, 576 | options=None, file=DESCRIPTOR), 577 | _descriptor.FieldDescriptor( 578 | name='sectionDate', full_name='edu.stanford.nlp.pipeline.Sentence.sectionDate', index=33, 579 | number=59, type=9, cpp_type=9, label=1, 580 | has_default_value=False, default_value=_b("").decode('utf-8'), 581 | message_type=None, enum_type=None, containing_type=None, 582 | is_extension=False, extension_scope=None, 583 | options=None, file=DESCRIPTOR), 584 | _descriptor.FieldDescriptor( 585 | name='sectionIndex', full_name='edu.stanford.nlp.pipeline.Sentence.sectionIndex', index=34, 586 | number=60, type=13, cpp_type=3, label=1, 587 | has_default_value=False, default_value=0, 588 | message_type=None, enum_type=None, containing_type=None, 589 | is_extension=False, extension_scope=None, 590 | options=None, file=DESCRIPTOR), 591 | _descriptor.FieldDescriptor( 592 | name='sectionName', full_name='edu.stanford.nlp.pipeline.Sentence.sectionName', index=35, 593 | number=61, type=9, cpp_type=9, label=1, 594 | has_default_value=False, default_value=_b("").decode('utf-8'), 595 | message_type=None, enum_type=None, containing_type=None, 596 | is_extension=False, extension_scope=None, 597 | options=None, file=DESCRIPTOR), 598 | _descriptor.FieldDescriptor( 599 | name='sectionAuthor', full_name='edu.stanford.nlp.pipeline.Sentence.sectionAuthor', index=36, 600 | number=62, type=9, cpp_type=9, label=1, 601 | has_default_value=False, default_value=_b("").decode('utf-8'), 602 | message_type=None, enum_type=None, containing_type=None, 603 | is_extension=False, extension_scope=None, 604 | options=None, file=DESCRIPTOR), 605 | _descriptor.FieldDescriptor( 606 | name='docID', full_name='edu.stanford.nlp.pipeline.Sentence.docID', index=37, 607 | number=63, type=9, cpp_type=9, label=1, 608 | has_default_value=False, default_value=_b("").decode('utf-8'), 609 | message_type=None, enum_type=None, containing_type=None, 610 | is_extension=False, extension_scope=None, 611 | options=None, file=DESCRIPTOR), 612 | _descriptor.FieldDescriptor( 613 | name='sectionQuoted', full_name='edu.stanford.nlp.pipeline.Sentence.sectionQuoted', index=38, 614 | number=64, type=8, cpp_type=7, label=1, 615 | has_default_value=False, default_value=False, 616 | message_type=None, enum_type=None, containing_type=None, 617 | is_extension=False, extension_scope=None, 618 | options=None, file=DESCRIPTOR), 619 | _descriptor.FieldDescriptor( 620 | name='hasEntityMentionsAnnotation', full_name='edu.stanford.nlp.pipeline.Sentence.hasEntityMentionsAnnotation', index=39, 621 | number=65, type=8, cpp_type=7, label=1, 622 | has_default_value=False, default_value=False, 623 | message_type=None, enum_type=None, containing_type=None, 624 | is_extension=False, extension_scope=None, 625 | options=None, file=DESCRIPTOR), 626 | _descriptor.FieldDescriptor( 627 | name='hasKBPTriplesAnnotation', full_name='edu.stanford.nlp.pipeline.Sentence.hasKBPTriplesAnnotation', index=40, 628 | number=68, type=8, cpp_type=7, label=1, 629 | has_default_value=False, default_value=False, 630 | message_type=None, enum_type=None, containing_type=None, 631 | is_extension=False, extension_scope=None, 632 | options=None, file=DESCRIPTOR), 633 | _descriptor.FieldDescriptor( 634 | name='hasOpenieTriplesAnnotation', full_name='edu.stanford.nlp.pipeline.Sentence.hasOpenieTriplesAnnotation', index=41, 635 | number=69, type=8, cpp_type=7, label=1, 636 | has_default_value=False, default_value=False, 637 | message_type=None, enum_type=None, containing_type=None, 638 | is_extension=False, extension_scope=None, 639 | options=None, file=DESCRIPTOR), 640 | _descriptor.FieldDescriptor( 641 | name='chapterIndex', full_name='edu.stanford.nlp.pipeline.Sentence.chapterIndex', index=42, 642 | number=66, type=13, cpp_type=3, label=1, 643 | has_default_value=False, default_value=0, 644 | message_type=None, enum_type=None, containing_type=None, 645 | is_extension=False, extension_scope=None, 646 | options=None, file=DESCRIPTOR), 647 | _descriptor.FieldDescriptor( 648 | name='paragraphIndex', full_name='edu.stanford.nlp.pipeline.Sentence.paragraphIndex', index=43, 649 | number=67, type=13, cpp_type=3, label=1, 650 | has_default_value=False, default_value=0, 651 | message_type=None, enum_type=None, containing_type=None, 652 | is_extension=False, extension_scope=None, 653 | options=None, file=DESCRIPTOR), 654 | ], 655 | extensions=[ 656 | ], 657 | nested_types=[], 658 | enum_types=[ 659 | ], 660 | options=None, 661 | is_extendable=True, 662 | syntax='proto2', 663 | extension_ranges=[(100, 256), ], 664 | oneofs=[ 665 | ], 666 | serialized_start=785, 667 | serialized_end=2719, 668 | ) 669 | 670 | 671 | _TOKEN = _descriptor.Descriptor( 672 | name='Token', 673 | full_name='edu.stanford.nlp.pipeline.Token', 674 | filename=None, 675 | file=DESCRIPTOR, 676 | containing_type=None, 677 | fields=[ 678 | _descriptor.FieldDescriptor( 679 | name='word', full_name='edu.stanford.nlp.pipeline.Token.word', index=0, 680 | number=1, type=9, cpp_type=9, label=1, 681 | has_default_value=False, default_value=_b("").decode('utf-8'), 682 | message_type=None, enum_type=None, containing_type=None, 683 | is_extension=False, extension_scope=None, 684 | options=None, file=DESCRIPTOR), 685 | _descriptor.FieldDescriptor( 686 | name='pos', full_name='edu.stanford.nlp.pipeline.Token.pos', index=1, 687 | number=2, type=9, cpp_type=9, label=1, 688 | has_default_value=False, default_value=_b("").decode('utf-8'), 689 | message_type=None, enum_type=None, containing_type=None, 690 | is_extension=False, extension_scope=None, 691 | options=None, file=DESCRIPTOR), 692 | _descriptor.FieldDescriptor( 693 | name='value', full_name='edu.stanford.nlp.pipeline.Token.value', index=2, 694 | number=3, type=9, cpp_type=9, label=1, 695 | has_default_value=False, default_value=_b("").decode('utf-8'), 696 | message_type=None, enum_type=None, containing_type=None, 697 | is_extension=False, extension_scope=None, 698 | options=None, file=DESCRIPTOR), 699 | _descriptor.FieldDescriptor( 700 | name='category', full_name='edu.stanford.nlp.pipeline.Token.category', index=3, 701 | number=4, type=9, cpp_type=9, label=1, 702 | has_default_value=False, default_value=_b("").decode('utf-8'), 703 | message_type=None, enum_type=None, containing_type=None, 704 | is_extension=False, extension_scope=None, 705 | options=None, file=DESCRIPTOR), 706 | _descriptor.FieldDescriptor( 707 | name='before', full_name='edu.stanford.nlp.pipeline.Token.before', index=4, 708 | number=5, type=9, cpp_type=9, label=1, 709 | has_default_value=False, default_value=_b("").decode('utf-8'), 710 | message_type=None, enum_type=None, containing_type=None, 711 | is_extension=False, extension_scope=None, 712 | options=None, file=DESCRIPTOR), 713 | _descriptor.FieldDescriptor( 714 | name='after', full_name='edu.stanford.nlp.pipeline.Token.after', index=5, 715 | number=6, type=9, cpp_type=9, label=1, 716 | has_default_value=False, default_value=_b("").decode('utf-8'), 717 | message_type=None, enum_type=None, containing_type=None, 718 | is_extension=False, extension_scope=None, 719 | options=None, file=DESCRIPTOR), 720 | _descriptor.FieldDescriptor( 721 | name='originalText', full_name='edu.stanford.nlp.pipeline.Token.originalText', index=6, 722 | number=7, type=9, cpp_type=9, label=1, 723 | has_default_value=False, default_value=_b("").decode('utf-8'), 724 | message_type=None, enum_type=None, containing_type=None, 725 | is_extension=False, extension_scope=None, 726 | options=None, file=DESCRIPTOR), 727 | _descriptor.FieldDescriptor( 728 | name='ner', full_name='edu.stanford.nlp.pipeline.Token.ner', index=7, 729 | number=8, type=9, cpp_type=9, label=1, 730 | has_default_value=False, default_value=_b("").decode('utf-8'), 731 | message_type=None, enum_type=None, containing_type=None, 732 | is_extension=False, extension_scope=None, 733 | options=None, file=DESCRIPTOR), 734 | _descriptor.FieldDescriptor( 735 | name='coarseNER', full_name='edu.stanford.nlp.pipeline.Token.coarseNER', index=8, 736 | number=62, type=9, cpp_type=9, label=1, 737 | has_default_value=False, default_value=_b("").decode('utf-8'), 738 | message_type=None, enum_type=None, containing_type=None, 739 | is_extension=False, extension_scope=None, 740 | options=None, file=DESCRIPTOR), 741 | _descriptor.FieldDescriptor( 742 | name='fineGrainedNER', full_name='edu.stanford.nlp.pipeline.Token.fineGrainedNER', index=9, 743 | number=63, type=9, cpp_type=9, label=1, 744 | has_default_value=False, default_value=_b("").decode('utf-8'), 745 | message_type=None, enum_type=None, containing_type=None, 746 | is_extension=False, extension_scope=None, 747 | options=None, file=DESCRIPTOR), 748 | _descriptor.FieldDescriptor( 749 | name='normalizedNER', full_name='edu.stanford.nlp.pipeline.Token.normalizedNER', index=10, 750 | number=9, type=9, cpp_type=9, label=1, 751 | has_default_value=False, default_value=_b("").decode('utf-8'), 752 | message_type=None, enum_type=None, containing_type=None, 753 | is_extension=False, extension_scope=None, 754 | options=None, file=DESCRIPTOR), 755 | _descriptor.FieldDescriptor( 756 | name='lemma', full_name='edu.stanford.nlp.pipeline.Token.lemma', index=11, 757 | number=10, type=9, cpp_type=9, label=1, 758 | has_default_value=False, default_value=_b("").decode('utf-8'), 759 | message_type=None, enum_type=None, containing_type=None, 760 | is_extension=False, extension_scope=None, 761 | options=None, file=DESCRIPTOR), 762 | _descriptor.FieldDescriptor( 763 | name='beginChar', full_name='edu.stanford.nlp.pipeline.Token.beginChar', index=12, 764 | number=11, type=13, cpp_type=3, label=1, 765 | has_default_value=False, default_value=0, 766 | message_type=None, enum_type=None, containing_type=None, 767 | is_extension=False, extension_scope=None, 768 | options=None, file=DESCRIPTOR), 769 | _descriptor.FieldDescriptor( 770 | name='endChar', full_name='edu.stanford.nlp.pipeline.Token.endChar', index=13, 771 | number=12, type=13, cpp_type=3, label=1, 772 | has_default_value=False, default_value=0, 773 | message_type=None, enum_type=None, containing_type=None, 774 | is_extension=False, extension_scope=None, 775 | options=None, file=DESCRIPTOR), 776 | _descriptor.FieldDescriptor( 777 | name='utterance', full_name='edu.stanford.nlp.pipeline.Token.utterance', index=14, 778 | number=13, type=13, cpp_type=3, label=1, 779 | has_default_value=False, default_value=0, 780 | message_type=None, enum_type=None, containing_type=None, 781 | is_extension=False, extension_scope=None, 782 | options=None, file=DESCRIPTOR), 783 | _descriptor.FieldDescriptor( 784 | name='speaker', full_name='edu.stanford.nlp.pipeline.Token.speaker', index=15, 785 | number=14, type=9, cpp_type=9, label=1, 786 | has_default_value=False, default_value=_b("").decode('utf-8'), 787 | message_type=None, enum_type=None, containing_type=None, 788 | is_extension=False, extension_scope=None, 789 | options=None, file=DESCRIPTOR), 790 | _descriptor.FieldDescriptor( 791 | name='beginIndex', full_name='edu.stanford.nlp.pipeline.Token.beginIndex', index=16, 792 | number=15, type=13, cpp_type=3, label=1, 793 | has_default_value=False, default_value=0, 794 | message_type=None, enum_type=None, containing_type=None, 795 | is_extension=False, extension_scope=None, 796 | options=None, file=DESCRIPTOR), 797 | _descriptor.FieldDescriptor( 798 | name='endIndex', full_name='edu.stanford.nlp.pipeline.Token.endIndex', index=17, 799 | number=16, type=13, cpp_type=3, label=1, 800 | has_default_value=False, default_value=0, 801 | message_type=None, enum_type=None, containing_type=None, 802 | is_extension=False, extension_scope=None, 803 | options=None, file=DESCRIPTOR), 804 | _descriptor.FieldDescriptor( 805 | name='tokenBeginIndex', full_name='edu.stanford.nlp.pipeline.Token.tokenBeginIndex', index=18, 806 | number=17, type=13, cpp_type=3, label=1, 807 | has_default_value=False, default_value=0, 808 | message_type=None, enum_type=None, containing_type=None, 809 | is_extension=False, extension_scope=None, 810 | options=None, file=DESCRIPTOR), 811 | _descriptor.FieldDescriptor( 812 | name='tokenEndIndex', full_name='edu.stanford.nlp.pipeline.Token.tokenEndIndex', index=19, 813 | number=18, type=13, cpp_type=3, label=1, 814 | has_default_value=False, default_value=0, 815 | message_type=None, enum_type=None, containing_type=None, 816 | is_extension=False, extension_scope=None, 817 | options=None, file=DESCRIPTOR), 818 | _descriptor.FieldDescriptor( 819 | name='timexValue', full_name='edu.stanford.nlp.pipeline.Token.timexValue', index=20, 820 | number=19, type=11, cpp_type=10, label=1, 821 | has_default_value=False, default_value=None, 822 | message_type=None, enum_type=None, containing_type=None, 823 | is_extension=False, extension_scope=None, 824 | options=None, file=DESCRIPTOR), 825 | _descriptor.FieldDescriptor( 826 | name='hasXmlContext', full_name='edu.stanford.nlp.pipeline.Token.hasXmlContext', index=21, 827 | number=21, type=8, cpp_type=7, label=1, 828 | has_default_value=False, default_value=False, 829 | message_type=None, enum_type=None, containing_type=None, 830 | is_extension=False, extension_scope=None, 831 | options=None, file=DESCRIPTOR), 832 | _descriptor.FieldDescriptor( 833 | name='xmlContext', full_name='edu.stanford.nlp.pipeline.Token.xmlContext', index=22, 834 | number=22, type=9, cpp_type=9, label=3, 835 | has_default_value=False, default_value=[], 836 | message_type=None, enum_type=None, containing_type=None, 837 | is_extension=False, extension_scope=None, 838 | options=None, file=DESCRIPTOR), 839 | _descriptor.FieldDescriptor( 840 | name='corefClusterID', full_name='edu.stanford.nlp.pipeline.Token.corefClusterID', index=23, 841 | number=23, type=13, cpp_type=3, label=1, 842 | has_default_value=False, default_value=0, 843 | message_type=None, enum_type=None, containing_type=None, 844 | is_extension=False, extension_scope=None, 845 | options=None, file=DESCRIPTOR), 846 | _descriptor.FieldDescriptor( 847 | name='answer', full_name='edu.stanford.nlp.pipeline.Token.answer', index=24, 848 | number=24, type=9, cpp_type=9, label=1, 849 | has_default_value=False, default_value=_b("").decode('utf-8'), 850 | message_type=None, enum_type=None, containing_type=None, 851 | is_extension=False, extension_scope=None, 852 | options=None, file=DESCRIPTOR), 853 | _descriptor.FieldDescriptor( 854 | name='headWordIndex', full_name='edu.stanford.nlp.pipeline.Token.headWordIndex', index=25, 855 | number=26, type=13, cpp_type=3, label=1, 856 | has_default_value=False, default_value=0, 857 | message_type=None, enum_type=None, containing_type=None, 858 | is_extension=False, extension_scope=None, 859 | options=None, file=DESCRIPTOR), 860 | _descriptor.FieldDescriptor( 861 | name='operator', full_name='edu.stanford.nlp.pipeline.Token.operator', index=26, 862 | number=27, type=11, cpp_type=10, label=1, 863 | has_default_value=False, default_value=None, 864 | message_type=None, enum_type=None, containing_type=None, 865 | is_extension=False, extension_scope=None, 866 | options=None, file=DESCRIPTOR), 867 | _descriptor.FieldDescriptor( 868 | name='polarity', full_name='edu.stanford.nlp.pipeline.Token.polarity', index=27, 869 | number=28, type=11, cpp_type=10, label=1, 870 | has_default_value=False, default_value=None, 871 | message_type=None, enum_type=None, containing_type=None, 872 | is_extension=False, extension_scope=None, 873 | options=None, file=DESCRIPTOR), 874 | _descriptor.FieldDescriptor( 875 | name='polarity_dir', full_name='edu.stanford.nlp.pipeline.Token.polarity_dir', index=28, 876 | number=39, type=9, cpp_type=9, label=1, 877 | has_default_value=False, default_value=_b("").decode('utf-8'), 878 | message_type=None, enum_type=None, containing_type=None, 879 | is_extension=False, extension_scope=None, 880 | options=None, file=DESCRIPTOR), 881 | _descriptor.FieldDescriptor( 882 | name='span', full_name='edu.stanford.nlp.pipeline.Token.span', index=29, 883 | number=29, type=11, cpp_type=10, label=1, 884 | has_default_value=False, default_value=None, 885 | message_type=None, enum_type=None, containing_type=None, 886 | is_extension=False, extension_scope=None, 887 | options=None, file=DESCRIPTOR), 888 | _descriptor.FieldDescriptor( 889 | name='sentiment', full_name='edu.stanford.nlp.pipeline.Token.sentiment', index=30, 890 | number=30, type=9, cpp_type=9, label=1, 891 | has_default_value=False, default_value=_b("").decode('utf-8'), 892 | message_type=None, enum_type=None, containing_type=None, 893 | is_extension=False, extension_scope=None, 894 | options=None, file=DESCRIPTOR), 895 | _descriptor.FieldDescriptor( 896 | name='quotationIndex', full_name='edu.stanford.nlp.pipeline.Token.quotationIndex', index=31, 897 | number=31, type=5, cpp_type=1, label=1, 898 | has_default_value=False, default_value=0, 899 | message_type=None, enum_type=None, containing_type=None, 900 | is_extension=False, extension_scope=None, 901 | options=None, file=DESCRIPTOR), 902 | _descriptor.FieldDescriptor( 903 | name='conllUFeatures', full_name='edu.stanford.nlp.pipeline.Token.conllUFeatures', index=32, 904 | number=32, type=11, cpp_type=10, label=1, 905 | has_default_value=False, default_value=None, 906 | message_type=None, enum_type=None, containing_type=None, 907 | is_extension=False, extension_scope=None, 908 | options=None, file=DESCRIPTOR), 909 | _descriptor.FieldDescriptor( 910 | name='coarseTag', full_name='edu.stanford.nlp.pipeline.Token.coarseTag', index=33, 911 | number=33, type=9, cpp_type=9, label=1, 912 | has_default_value=False, default_value=_b("").decode('utf-8'), 913 | message_type=None, enum_type=None, containing_type=None, 914 | is_extension=False, extension_scope=None, 915 | options=None, file=DESCRIPTOR), 916 | _descriptor.FieldDescriptor( 917 | name='conllUTokenSpan', full_name='edu.stanford.nlp.pipeline.Token.conllUTokenSpan', index=34, 918 | number=34, type=11, cpp_type=10, label=1, 919 | has_default_value=False, default_value=None, 920 | message_type=None, enum_type=None, containing_type=None, 921 | is_extension=False, extension_scope=None, 922 | options=None, file=DESCRIPTOR), 923 | _descriptor.FieldDescriptor( 924 | name='conllUMisc', full_name='edu.stanford.nlp.pipeline.Token.conllUMisc', index=35, 925 | number=35, type=9, cpp_type=9, label=1, 926 | has_default_value=False, default_value=_b("").decode('utf-8'), 927 | message_type=None, enum_type=None, containing_type=None, 928 | is_extension=False, extension_scope=None, 929 | options=None, file=DESCRIPTOR), 930 | _descriptor.FieldDescriptor( 931 | name='conllUSecondaryDeps', full_name='edu.stanford.nlp.pipeline.Token.conllUSecondaryDeps', index=36, 932 | number=36, type=11, cpp_type=10, label=1, 933 | has_default_value=False, default_value=None, 934 | message_type=None, enum_type=None, containing_type=None, 935 | is_extension=False, extension_scope=None, 936 | options=None, file=DESCRIPTOR), 937 | _descriptor.FieldDescriptor( 938 | name='wikipediaEntity', full_name='edu.stanford.nlp.pipeline.Token.wikipediaEntity', index=37, 939 | number=37, type=9, cpp_type=9, label=1, 940 | has_default_value=False, default_value=_b("").decode('utf-8'), 941 | message_type=None, enum_type=None, containing_type=None, 942 | is_extension=False, extension_scope=None, 943 | options=None, file=DESCRIPTOR), 944 | _descriptor.FieldDescriptor( 945 | name='isNewline', full_name='edu.stanford.nlp.pipeline.Token.isNewline', index=38, 946 | number=38, type=8, cpp_type=7, label=1, 947 | has_default_value=False, default_value=False, 948 | message_type=None, enum_type=None, containing_type=None, 949 | is_extension=False, extension_scope=None, 950 | options=None, file=DESCRIPTOR), 951 | _descriptor.FieldDescriptor( 952 | name='gender', full_name='edu.stanford.nlp.pipeline.Token.gender', index=39, 953 | number=51, type=9, cpp_type=9, label=1, 954 | has_default_value=False, default_value=_b("").decode('utf-8'), 955 | message_type=None, enum_type=None, containing_type=None, 956 | is_extension=False, extension_scope=None, 957 | options=None, file=DESCRIPTOR), 958 | _descriptor.FieldDescriptor( 959 | name='trueCase', full_name='edu.stanford.nlp.pipeline.Token.trueCase', index=40, 960 | number=52, type=9, cpp_type=9, label=1, 961 | has_default_value=False, default_value=_b("").decode('utf-8'), 962 | message_type=None, enum_type=None, containing_type=None, 963 | is_extension=False, extension_scope=None, 964 | options=None, file=DESCRIPTOR), 965 | _descriptor.FieldDescriptor( 966 | name='trueCaseText', full_name='edu.stanford.nlp.pipeline.Token.trueCaseText', index=41, 967 | number=53, type=9, cpp_type=9, label=1, 968 | has_default_value=False, default_value=_b("").decode('utf-8'), 969 | message_type=None, enum_type=None, containing_type=None, 970 | is_extension=False, extension_scope=None, 971 | options=None, file=DESCRIPTOR), 972 | _descriptor.FieldDescriptor( 973 | name='chineseChar', full_name='edu.stanford.nlp.pipeline.Token.chineseChar', index=42, 974 | number=54, type=9, cpp_type=9, label=1, 975 | has_default_value=False, default_value=_b("").decode('utf-8'), 976 | message_type=None, enum_type=None, containing_type=None, 977 | is_extension=False, extension_scope=None, 978 | options=None, file=DESCRIPTOR), 979 | _descriptor.FieldDescriptor( 980 | name='chineseSeg', full_name='edu.stanford.nlp.pipeline.Token.chineseSeg', index=43, 981 | number=55, type=9, cpp_type=9, label=1, 982 | has_default_value=False, default_value=_b("").decode('utf-8'), 983 | message_type=None, enum_type=None, containing_type=None, 984 | is_extension=False, extension_scope=None, 985 | options=None, file=DESCRIPTOR), 986 | _descriptor.FieldDescriptor( 987 | name='chineseXMLChar', full_name='edu.stanford.nlp.pipeline.Token.chineseXMLChar', index=44, 988 | number=60, type=9, cpp_type=9, label=1, 989 | has_default_value=False, default_value=_b("").decode('utf-8'), 990 | message_type=None, enum_type=None, containing_type=None, 991 | is_extension=False, extension_scope=None, 992 | options=None, file=DESCRIPTOR), 993 | _descriptor.FieldDescriptor( 994 | name='sectionName', full_name='edu.stanford.nlp.pipeline.Token.sectionName', index=45, 995 | number=56, type=9, cpp_type=9, label=1, 996 | has_default_value=False, default_value=_b("").decode('utf-8'), 997 | message_type=None, enum_type=None, containing_type=None, 998 | is_extension=False, extension_scope=None, 999 | options=None, file=DESCRIPTOR), 1000 | _descriptor.FieldDescriptor( 1001 | name='sectionAuthor', full_name='edu.stanford.nlp.pipeline.Token.sectionAuthor', index=46, 1002 | number=57, type=9, cpp_type=9, label=1, 1003 | has_default_value=False, default_value=_b("").decode('utf-8'), 1004 | message_type=None, enum_type=None, containing_type=None, 1005 | is_extension=False, extension_scope=None, 1006 | options=None, file=DESCRIPTOR), 1007 | _descriptor.FieldDescriptor( 1008 | name='sectionDate', full_name='edu.stanford.nlp.pipeline.Token.sectionDate', index=47, 1009 | number=58, type=9, cpp_type=9, label=1, 1010 | has_default_value=False, default_value=_b("").decode('utf-8'), 1011 | message_type=None, enum_type=None, containing_type=None, 1012 | is_extension=False, extension_scope=None, 1013 | options=None, file=DESCRIPTOR), 1014 | _descriptor.FieldDescriptor( 1015 | name='sectionEndLabel', full_name='edu.stanford.nlp.pipeline.Token.sectionEndLabel', index=48, 1016 | number=59, type=9, cpp_type=9, label=1, 1017 | has_default_value=False, default_value=_b("").decode('utf-8'), 1018 | message_type=None, enum_type=None, containing_type=None, 1019 | is_extension=False, extension_scope=None, 1020 | options=None, file=DESCRIPTOR), 1021 | _descriptor.FieldDescriptor( 1022 | name='parent', full_name='edu.stanford.nlp.pipeline.Token.parent', index=49, 1023 | number=61, type=9, cpp_type=9, label=1, 1024 | has_default_value=False, default_value=_b("").decode('utf-8'), 1025 | message_type=None, enum_type=None, containing_type=None, 1026 | is_extension=False, extension_scope=None, 1027 | options=None, file=DESCRIPTOR), 1028 | _descriptor.FieldDescriptor( 1029 | name='corefMentionIndex', full_name='edu.stanford.nlp.pipeline.Token.corefMentionIndex', index=50, 1030 | number=64, type=13, cpp_type=3, label=3, 1031 | has_default_value=False, default_value=[], 1032 | message_type=None, enum_type=None, containing_type=None, 1033 | is_extension=False, extension_scope=None, 1034 | options=None, file=DESCRIPTOR), 1035 | _descriptor.FieldDescriptor( 1036 | name='entityMentionIndex', full_name='edu.stanford.nlp.pipeline.Token.entityMentionIndex', index=51, 1037 | number=65, type=13, cpp_type=3, label=1, 1038 | has_default_value=False, default_value=0, 1039 | message_type=None, enum_type=None, containing_type=None, 1040 | is_extension=False, extension_scope=None, 1041 | options=None, file=DESCRIPTOR), 1042 | ], 1043 | extensions=[ 1044 | ], 1045 | nested_types=[], 1046 | enum_types=[ 1047 | ], 1048 | options=None, 1049 | is_extendable=True, 1050 | syntax='proto2', 1051 | extension_ranges=[(100, 256), ], 1052 | oneofs=[ 1053 | ], 1054 | serialized_start=2722, 1055 | serialized_end=4047, 1056 | ) 1057 | 1058 | 1059 | _QUOTE = _descriptor.Descriptor( 1060 | name='Quote', 1061 | full_name='edu.stanford.nlp.pipeline.Quote', 1062 | filename=None, 1063 | file=DESCRIPTOR, 1064 | containing_type=None, 1065 | fields=[ 1066 | _descriptor.FieldDescriptor( 1067 | name='text', full_name='edu.stanford.nlp.pipeline.Quote.text', index=0, 1068 | number=1, type=9, cpp_type=9, label=1, 1069 | has_default_value=False, default_value=_b("").decode('utf-8'), 1070 | message_type=None, enum_type=None, containing_type=None, 1071 | is_extension=False, extension_scope=None, 1072 | options=None, file=DESCRIPTOR), 1073 | _descriptor.FieldDescriptor( 1074 | name='begin', full_name='edu.stanford.nlp.pipeline.Quote.begin', index=1, 1075 | number=2, type=13, cpp_type=3, label=1, 1076 | has_default_value=False, default_value=0, 1077 | message_type=None, enum_type=None, containing_type=None, 1078 | is_extension=False, extension_scope=None, 1079 | options=None, file=DESCRIPTOR), 1080 | _descriptor.FieldDescriptor( 1081 | name='end', full_name='edu.stanford.nlp.pipeline.Quote.end', index=2, 1082 | number=3, type=13, cpp_type=3, label=1, 1083 | has_default_value=False, default_value=0, 1084 | message_type=None, enum_type=None, containing_type=None, 1085 | is_extension=False, extension_scope=None, 1086 | options=None, file=DESCRIPTOR), 1087 | _descriptor.FieldDescriptor( 1088 | name='sentenceBegin', full_name='edu.stanford.nlp.pipeline.Quote.sentenceBegin', index=3, 1089 | number=5, type=13, cpp_type=3, label=1, 1090 | has_default_value=False, default_value=0, 1091 | message_type=None, enum_type=None, containing_type=None, 1092 | is_extension=False, extension_scope=None, 1093 | options=None, file=DESCRIPTOR), 1094 | _descriptor.FieldDescriptor( 1095 | name='sentenceEnd', full_name='edu.stanford.nlp.pipeline.Quote.sentenceEnd', index=4, 1096 | number=6, type=13, cpp_type=3, label=1, 1097 | has_default_value=False, default_value=0, 1098 | message_type=None, enum_type=None, containing_type=None, 1099 | is_extension=False, extension_scope=None, 1100 | options=None, file=DESCRIPTOR), 1101 | _descriptor.FieldDescriptor( 1102 | name='tokenBegin', full_name='edu.stanford.nlp.pipeline.Quote.tokenBegin', index=5, 1103 | number=7, type=13, cpp_type=3, label=1, 1104 | has_default_value=False, default_value=0, 1105 | message_type=None, enum_type=None, containing_type=None, 1106 | is_extension=False, extension_scope=None, 1107 | options=None, file=DESCRIPTOR), 1108 | _descriptor.FieldDescriptor( 1109 | name='tokenEnd', full_name='edu.stanford.nlp.pipeline.Quote.tokenEnd', index=6, 1110 | number=8, type=13, cpp_type=3, label=1, 1111 | has_default_value=False, default_value=0, 1112 | message_type=None, enum_type=None, containing_type=None, 1113 | is_extension=False, extension_scope=None, 1114 | options=None, file=DESCRIPTOR), 1115 | _descriptor.FieldDescriptor( 1116 | name='docid', full_name='edu.stanford.nlp.pipeline.Quote.docid', index=7, 1117 | number=9, type=9, cpp_type=9, label=1, 1118 | has_default_value=False, default_value=_b("").decode('utf-8'), 1119 | message_type=None, enum_type=None, containing_type=None, 1120 | is_extension=False, extension_scope=None, 1121 | options=None, file=DESCRIPTOR), 1122 | _descriptor.FieldDescriptor( 1123 | name='index', full_name='edu.stanford.nlp.pipeline.Quote.index', index=8, 1124 | number=10, type=13, cpp_type=3, label=1, 1125 | has_default_value=False, default_value=0, 1126 | message_type=None, enum_type=None, containing_type=None, 1127 | is_extension=False, extension_scope=None, 1128 | options=None, file=DESCRIPTOR), 1129 | _descriptor.FieldDescriptor( 1130 | name='author', full_name='edu.stanford.nlp.pipeline.Quote.author', index=9, 1131 | number=11, type=9, cpp_type=9, label=1, 1132 | has_default_value=False, default_value=_b("").decode('utf-8'), 1133 | message_type=None, enum_type=None, containing_type=None, 1134 | is_extension=False, extension_scope=None, 1135 | options=None, file=DESCRIPTOR), 1136 | _descriptor.FieldDescriptor( 1137 | name='mention', full_name='edu.stanford.nlp.pipeline.Quote.mention', index=10, 1138 | number=12, type=9, cpp_type=9, label=1, 1139 | has_default_value=False, default_value=_b("").decode('utf-8'), 1140 | message_type=None, enum_type=None, containing_type=None, 1141 | is_extension=False, extension_scope=None, 1142 | options=None, file=DESCRIPTOR), 1143 | _descriptor.FieldDescriptor( 1144 | name='mentionBegin', full_name='edu.stanford.nlp.pipeline.Quote.mentionBegin', index=11, 1145 | number=13, type=13, cpp_type=3, label=1, 1146 | has_default_value=False, default_value=0, 1147 | message_type=None, enum_type=None, containing_type=None, 1148 | is_extension=False, extension_scope=None, 1149 | options=None, file=DESCRIPTOR), 1150 | _descriptor.FieldDescriptor( 1151 | name='mentionEnd', full_name='edu.stanford.nlp.pipeline.Quote.mentionEnd', index=12, 1152 | number=14, type=13, cpp_type=3, label=1, 1153 | has_default_value=False, default_value=0, 1154 | message_type=None, enum_type=None, containing_type=None, 1155 | is_extension=False, extension_scope=None, 1156 | options=None, file=DESCRIPTOR), 1157 | _descriptor.FieldDescriptor( 1158 | name='mentionType', full_name='edu.stanford.nlp.pipeline.Quote.mentionType', index=13, 1159 | number=15, type=9, cpp_type=9, label=1, 1160 | has_default_value=False, default_value=_b("").decode('utf-8'), 1161 | message_type=None, enum_type=None, containing_type=None, 1162 | is_extension=False, extension_scope=None, 1163 | options=None, file=DESCRIPTOR), 1164 | _descriptor.FieldDescriptor( 1165 | name='mentionSieve', full_name='edu.stanford.nlp.pipeline.Quote.mentionSieve', index=14, 1166 | number=16, type=9, cpp_type=9, label=1, 1167 | has_default_value=False, default_value=_b("").decode('utf-8'), 1168 | message_type=None, enum_type=None, containing_type=None, 1169 | is_extension=False, extension_scope=None, 1170 | options=None, file=DESCRIPTOR), 1171 | _descriptor.FieldDescriptor( 1172 | name='speaker', full_name='edu.stanford.nlp.pipeline.Quote.speaker', index=15, 1173 | number=17, type=9, cpp_type=9, label=1, 1174 | has_default_value=False, default_value=_b("").decode('utf-8'), 1175 | message_type=None, enum_type=None, containing_type=None, 1176 | is_extension=False, extension_scope=None, 1177 | options=None, file=DESCRIPTOR), 1178 | _descriptor.FieldDescriptor( 1179 | name='speakerSieve', full_name='edu.stanford.nlp.pipeline.Quote.speakerSieve', index=16, 1180 | number=18, type=9, cpp_type=9, label=1, 1181 | has_default_value=False, default_value=_b("").decode('utf-8'), 1182 | message_type=None, enum_type=None, containing_type=None, 1183 | is_extension=False, extension_scope=None, 1184 | options=None, file=DESCRIPTOR), 1185 | _descriptor.FieldDescriptor( 1186 | name='canonicalMention', full_name='edu.stanford.nlp.pipeline.Quote.canonicalMention', index=17, 1187 | number=19, type=9, cpp_type=9, label=1, 1188 | has_default_value=False, default_value=_b("").decode('utf-8'), 1189 | message_type=None, enum_type=None, containing_type=None, 1190 | is_extension=False, extension_scope=None, 1191 | options=None, file=DESCRIPTOR), 1192 | _descriptor.FieldDescriptor( 1193 | name='canonicalMentionBegin', full_name='edu.stanford.nlp.pipeline.Quote.canonicalMentionBegin', index=18, 1194 | number=20, type=13, cpp_type=3, label=1, 1195 | has_default_value=False, default_value=0, 1196 | message_type=None, enum_type=None, containing_type=None, 1197 | is_extension=False, extension_scope=None, 1198 | options=None, file=DESCRIPTOR), 1199 | _descriptor.FieldDescriptor( 1200 | name='canonicalMentionEnd', full_name='edu.stanford.nlp.pipeline.Quote.canonicalMentionEnd', index=19, 1201 | number=21, type=13, cpp_type=3, label=1, 1202 | has_default_value=False, default_value=0, 1203 | message_type=None, enum_type=None, containing_type=None, 1204 | is_extension=False, extension_scope=None, 1205 | options=None, file=DESCRIPTOR), 1206 | _descriptor.FieldDescriptor( 1207 | name='attributionDependencyGraph', full_name='edu.stanford.nlp.pipeline.Quote.attributionDependencyGraph', index=20, 1208 | number=22, type=11, cpp_type=10, label=1, 1209 | has_default_value=False, default_value=None, 1210 | message_type=None, enum_type=None, containing_type=None, 1211 | is_extension=False, extension_scope=None, 1212 | options=None, file=DESCRIPTOR), 1213 | ], 1214 | extensions=[ 1215 | ], 1216 | nested_types=[], 1217 | enum_types=[ 1218 | ], 1219 | options=None, 1220 | is_extendable=False, 1221 | syntax='proto2', 1222 | extension_ranges=[], 1223 | oneofs=[ 1224 | ], 1225 | serialized_start=4050, 1226 | serialized_end=4534, 1227 | ) 1228 | 1229 | 1230 | _PARSETREE = _descriptor.Descriptor( 1231 | name='ParseTree', 1232 | full_name='edu.stanford.nlp.pipeline.ParseTree', 1233 | filename=None, 1234 | file=DESCRIPTOR, 1235 | containing_type=None, 1236 | fields=[ 1237 | _descriptor.FieldDescriptor( 1238 | name='child', full_name='edu.stanford.nlp.pipeline.ParseTree.child', index=0, 1239 | number=1, type=11, cpp_type=10, label=3, 1240 | has_default_value=False, default_value=[], 1241 | message_type=None, enum_type=None, containing_type=None, 1242 | is_extension=False, extension_scope=None, 1243 | options=None, file=DESCRIPTOR), 1244 | _descriptor.FieldDescriptor( 1245 | name='value', full_name='edu.stanford.nlp.pipeline.ParseTree.value', index=1, 1246 | number=2, type=9, cpp_type=9, label=1, 1247 | has_default_value=False, default_value=_b("").decode('utf-8'), 1248 | message_type=None, enum_type=None, containing_type=None, 1249 | is_extension=False, extension_scope=None, 1250 | options=None, file=DESCRIPTOR), 1251 | _descriptor.FieldDescriptor( 1252 | name='yieldBeginIndex', full_name='edu.stanford.nlp.pipeline.ParseTree.yieldBeginIndex', index=2, 1253 | number=3, type=13, cpp_type=3, label=1, 1254 | has_default_value=False, default_value=0, 1255 | message_type=None, enum_type=None, containing_type=None, 1256 | is_extension=False, extension_scope=None, 1257 | options=None, file=DESCRIPTOR), 1258 | _descriptor.FieldDescriptor( 1259 | name='yieldEndIndex', full_name='edu.stanford.nlp.pipeline.ParseTree.yieldEndIndex', index=3, 1260 | number=4, type=13, cpp_type=3, label=1, 1261 | has_default_value=False, default_value=0, 1262 | message_type=None, enum_type=None, containing_type=None, 1263 | is_extension=False, extension_scope=None, 1264 | options=None, file=DESCRIPTOR), 1265 | _descriptor.FieldDescriptor( 1266 | name='score', full_name='edu.stanford.nlp.pipeline.ParseTree.score', index=4, 1267 | number=5, type=1, cpp_type=5, label=1, 1268 | has_default_value=False, default_value=float(0), 1269 | message_type=None, enum_type=None, containing_type=None, 1270 | is_extension=False, extension_scope=None, 1271 | options=None, file=DESCRIPTOR), 1272 | _descriptor.FieldDescriptor( 1273 | name='sentiment', full_name='edu.stanford.nlp.pipeline.ParseTree.sentiment', index=5, 1274 | number=6, type=14, cpp_type=8, label=1, 1275 | has_default_value=False, default_value=0, 1276 | message_type=None, enum_type=None, containing_type=None, 1277 | is_extension=False, extension_scope=None, 1278 | options=None, file=DESCRIPTOR), 1279 | ], 1280 | extensions=[ 1281 | ], 1282 | nested_types=[], 1283 | enum_types=[ 1284 | ], 1285 | options=None, 1286 | is_extendable=False, 1287 | syntax='proto2', 1288 | extension_ranges=[], 1289 | oneofs=[ 1290 | ], 1291 | serialized_start=4537, 1292 | serialized_end=4736, 1293 | ) 1294 | 1295 | 1296 | _DEPENDENCYGRAPH_NODE = _descriptor.Descriptor( 1297 | name='Node', 1298 | full_name='edu.stanford.nlp.pipeline.DependencyGraph.Node', 1299 | filename=None, 1300 | file=DESCRIPTOR, 1301 | containing_type=None, 1302 | fields=[ 1303 | _descriptor.FieldDescriptor( 1304 | name='sentenceIndex', full_name='edu.stanford.nlp.pipeline.DependencyGraph.Node.sentenceIndex', index=0, 1305 | number=1, type=13, cpp_type=3, label=2, 1306 | has_default_value=False, default_value=0, 1307 | message_type=None, enum_type=None, containing_type=None, 1308 | is_extension=False, extension_scope=None, 1309 | options=None, file=DESCRIPTOR), 1310 | _descriptor.FieldDescriptor( 1311 | name='index', full_name='edu.stanford.nlp.pipeline.DependencyGraph.Node.index', index=1, 1312 | number=2, type=13, cpp_type=3, label=2, 1313 | has_default_value=False, default_value=0, 1314 | message_type=None, enum_type=None, containing_type=None, 1315 | is_extension=False, extension_scope=None, 1316 | options=None, file=DESCRIPTOR), 1317 | _descriptor.FieldDescriptor( 1318 | name='copyAnnotation', full_name='edu.stanford.nlp.pipeline.DependencyGraph.Node.copyAnnotation', index=2, 1319 | number=3, type=13, cpp_type=3, label=1, 1320 | has_default_value=False, default_value=0, 1321 | message_type=None, enum_type=None, containing_type=None, 1322 | is_extension=False, extension_scope=None, 1323 | options=None, file=DESCRIPTOR), 1324 | ], 1325 | extensions=[ 1326 | ], 1327 | nested_types=[], 1328 | enum_types=[ 1329 | ], 1330 | options=None, 1331 | is_extendable=False, 1332 | syntax='proto2', 1333 | extension_ranges=[], 1334 | oneofs=[ 1335 | ], 1336 | serialized_start=4902, 1337 | serialized_end=4970, 1338 | ) 1339 | 1340 | _DEPENDENCYGRAPH_EDGE = _descriptor.Descriptor( 1341 | name='Edge', 1342 | full_name='edu.stanford.nlp.pipeline.DependencyGraph.Edge', 1343 | filename=None, 1344 | file=DESCRIPTOR, 1345 | containing_type=None, 1346 | fields=[ 1347 | _descriptor.FieldDescriptor( 1348 | name='source', full_name='edu.stanford.nlp.pipeline.DependencyGraph.Edge.source', index=0, 1349 | number=1, type=13, cpp_type=3, label=2, 1350 | has_default_value=False, default_value=0, 1351 | message_type=None, enum_type=None, containing_type=None, 1352 | is_extension=False, extension_scope=None, 1353 | options=None, file=DESCRIPTOR), 1354 | _descriptor.FieldDescriptor( 1355 | name='target', full_name='edu.stanford.nlp.pipeline.DependencyGraph.Edge.target', index=1, 1356 | number=2, type=13, cpp_type=3, label=2, 1357 | has_default_value=False, default_value=0, 1358 | message_type=None, enum_type=None, containing_type=None, 1359 | is_extension=False, extension_scope=None, 1360 | options=None, file=DESCRIPTOR), 1361 | _descriptor.FieldDescriptor( 1362 | name='dep', full_name='edu.stanford.nlp.pipeline.DependencyGraph.Edge.dep', index=2, 1363 | number=3, type=9, cpp_type=9, label=1, 1364 | has_default_value=False, default_value=_b("").decode('utf-8'), 1365 | message_type=None, enum_type=None, containing_type=None, 1366 | is_extension=False, extension_scope=None, 1367 | options=None, file=DESCRIPTOR), 1368 | _descriptor.FieldDescriptor( 1369 | name='isExtra', full_name='edu.stanford.nlp.pipeline.DependencyGraph.Edge.isExtra', index=3, 1370 | number=4, type=8, cpp_type=7, label=1, 1371 | has_default_value=False, default_value=False, 1372 | message_type=None, enum_type=None, containing_type=None, 1373 | is_extension=False, extension_scope=None, 1374 | options=None, file=DESCRIPTOR), 1375 | _descriptor.FieldDescriptor( 1376 | name='sourceCopy', full_name='edu.stanford.nlp.pipeline.DependencyGraph.Edge.sourceCopy', index=4, 1377 | number=5, type=13, cpp_type=3, label=1, 1378 | has_default_value=False, default_value=0, 1379 | message_type=None, enum_type=None, containing_type=None, 1380 | is_extension=False, extension_scope=None, 1381 | options=None, file=DESCRIPTOR), 1382 | _descriptor.FieldDescriptor( 1383 | name='targetCopy', full_name='edu.stanford.nlp.pipeline.DependencyGraph.Edge.targetCopy', index=5, 1384 | number=6, type=13, cpp_type=3, label=1, 1385 | has_default_value=False, default_value=0, 1386 | message_type=None, enum_type=None, containing_type=None, 1387 | is_extension=False, extension_scope=None, 1388 | options=None, file=DESCRIPTOR), 1389 | _descriptor.FieldDescriptor( 1390 | name='language', full_name='edu.stanford.nlp.pipeline.DependencyGraph.Edge.language', index=6, 1391 | number=7, type=14, cpp_type=8, label=1, 1392 | has_default_value=True, default_value=0, 1393 | message_type=None, enum_type=None, containing_type=None, 1394 | is_extension=False, extension_scope=None, 1395 | options=None, file=DESCRIPTOR), 1396 | ], 1397 | extensions=[ 1398 | ], 1399 | nested_types=[], 1400 | enum_types=[ 1401 | ], 1402 | options=None, 1403 | is_extendable=False, 1404 | syntax='proto2', 1405 | extension_ranges=[], 1406 | oneofs=[ 1407 | ], 1408 | serialized_start=4973, 1409 | serialized_end=5145, 1410 | ) 1411 | 1412 | _DEPENDENCYGRAPH = _descriptor.Descriptor( 1413 | name='DependencyGraph', 1414 | full_name='edu.stanford.nlp.pipeline.DependencyGraph', 1415 | filename=None, 1416 | file=DESCRIPTOR, 1417 | containing_type=None, 1418 | fields=[ 1419 | _descriptor.FieldDescriptor( 1420 | name='node', full_name='edu.stanford.nlp.pipeline.DependencyGraph.node', index=0, 1421 | number=1, type=11, cpp_type=10, label=3, 1422 | has_default_value=False, default_value=[], 1423 | message_type=None, enum_type=None, containing_type=None, 1424 | is_extension=False, extension_scope=None, 1425 | options=None, file=DESCRIPTOR), 1426 | _descriptor.FieldDescriptor( 1427 | name='edge', full_name='edu.stanford.nlp.pipeline.DependencyGraph.edge', index=1, 1428 | number=2, type=11, cpp_type=10, label=3, 1429 | has_default_value=False, default_value=[], 1430 | message_type=None, enum_type=None, containing_type=None, 1431 | is_extension=False, extension_scope=None, 1432 | options=None, file=DESCRIPTOR), 1433 | _descriptor.FieldDescriptor( 1434 | name='root', full_name='edu.stanford.nlp.pipeline.DependencyGraph.root', index=2, 1435 | number=3, type=13, cpp_type=3, label=3, 1436 | has_default_value=False, default_value=[], 1437 | message_type=None, enum_type=None, containing_type=None, 1438 | is_extension=False, extension_scope=None, 1439 | options=_descriptor._ParseOptions(descriptor_pb2.FieldOptions(), _b('\020\001')), file=DESCRIPTOR), 1440 | ], 1441 | extensions=[ 1442 | ], 1443 | nested_types=[_DEPENDENCYGRAPH_NODE, _DEPENDENCYGRAPH_EDGE, ], 1444 | enum_types=[ 1445 | ], 1446 | options=None, 1447 | is_extendable=False, 1448 | syntax='proto2', 1449 | extension_ranges=[], 1450 | oneofs=[ 1451 | ], 1452 | serialized_start=4739, 1453 | serialized_end=5145, 1454 | ) 1455 | 1456 | 1457 | _COREFCHAIN_COREFMENTION = _descriptor.Descriptor( 1458 | name='CorefMention', 1459 | full_name='edu.stanford.nlp.pipeline.CorefChain.CorefMention', 1460 | filename=None, 1461 | file=DESCRIPTOR, 1462 | containing_type=None, 1463 | fields=[ 1464 | _descriptor.FieldDescriptor( 1465 | name='mentionID', full_name='edu.stanford.nlp.pipeline.CorefChain.CorefMention.mentionID', index=0, 1466 | number=1, type=5, cpp_type=1, label=1, 1467 | has_default_value=False, default_value=0, 1468 | message_type=None, enum_type=None, containing_type=None, 1469 | is_extension=False, extension_scope=None, 1470 | options=None, file=DESCRIPTOR), 1471 | _descriptor.FieldDescriptor( 1472 | name='mentionType', full_name='edu.stanford.nlp.pipeline.CorefChain.CorefMention.mentionType', index=1, 1473 | number=2, type=9, cpp_type=9, label=1, 1474 | has_default_value=False, default_value=_b("").decode('utf-8'), 1475 | message_type=None, enum_type=None, containing_type=None, 1476 | is_extension=False, extension_scope=None, 1477 | options=None, file=DESCRIPTOR), 1478 | _descriptor.FieldDescriptor( 1479 | name='number', full_name='edu.stanford.nlp.pipeline.CorefChain.CorefMention.number', index=2, 1480 | number=3, type=9, cpp_type=9, label=1, 1481 | has_default_value=False, default_value=_b("").decode('utf-8'), 1482 | message_type=None, enum_type=None, containing_type=None, 1483 | is_extension=False, extension_scope=None, 1484 | options=None, file=DESCRIPTOR), 1485 | _descriptor.FieldDescriptor( 1486 | name='gender', full_name='edu.stanford.nlp.pipeline.CorefChain.CorefMention.gender', index=3, 1487 | number=4, type=9, cpp_type=9, label=1, 1488 | has_default_value=False, default_value=_b("").decode('utf-8'), 1489 | message_type=None, enum_type=None, containing_type=None, 1490 | is_extension=False, extension_scope=None, 1491 | options=None, file=DESCRIPTOR), 1492 | _descriptor.FieldDescriptor( 1493 | name='animacy', full_name='edu.stanford.nlp.pipeline.CorefChain.CorefMention.animacy', index=4, 1494 | number=5, type=9, cpp_type=9, label=1, 1495 | has_default_value=False, default_value=_b("").decode('utf-8'), 1496 | message_type=None, enum_type=None, containing_type=None, 1497 | is_extension=False, extension_scope=None, 1498 | options=None, file=DESCRIPTOR), 1499 | _descriptor.FieldDescriptor( 1500 | name='beginIndex', full_name='edu.stanford.nlp.pipeline.CorefChain.CorefMention.beginIndex', index=5, 1501 | number=6, type=13, cpp_type=3, label=1, 1502 | has_default_value=False, default_value=0, 1503 | message_type=None, enum_type=None, containing_type=None, 1504 | is_extension=False, extension_scope=None, 1505 | options=None, file=DESCRIPTOR), 1506 | _descriptor.FieldDescriptor( 1507 | name='endIndex', full_name='edu.stanford.nlp.pipeline.CorefChain.CorefMention.endIndex', index=6, 1508 | number=7, type=13, cpp_type=3, label=1, 1509 | has_default_value=False, default_value=0, 1510 | message_type=None, enum_type=None, containing_type=None, 1511 | is_extension=False, extension_scope=None, 1512 | options=None, file=DESCRIPTOR), 1513 | _descriptor.FieldDescriptor( 1514 | name='headIndex', full_name='edu.stanford.nlp.pipeline.CorefChain.CorefMention.headIndex', index=7, 1515 | number=9, type=13, cpp_type=3, label=1, 1516 | has_default_value=False, default_value=0, 1517 | message_type=None, enum_type=None, containing_type=None, 1518 | is_extension=False, extension_scope=None, 1519 | options=None, file=DESCRIPTOR), 1520 | _descriptor.FieldDescriptor( 1521 | name='sentenceIndex', full_name='edu.stanford.nlp.pipeline.CorefChain.CorefMention.sentenceIndex', index=8, 1522 | number=10, type=13, cpp_type=3, label=1, 1523 | has_default_value=False, default_value=0, 1524 | message_type=None, enum_type=None, containing_type=None, 1525 | is_extension=False, extension_scope=None, 1526 | options=None, file=DESCRIPTOR), 1527 | _descriptor.FieldDescriptor( 1528 | name='position', full_name='edu.stanford.nlp.pipeline.CorefChain.CorefMention.position', index=9, 1529 | number=11, type=13, cpp_type=3, label=1, 1530 | has_default_value=False, default_value=0, 1531 | message_type=None, enum_type=None, containing_type=None, 1532 | is_extension=False, extension_scope=None, 1533 | options=None, file=DESCRIPTOR), 1534 | ], 1535 | extensions=[ 1536 | ], 1537 | nested_types=[], 1538 | enum_types=[ 1539 | ], 1540 | options=None, 1541 | is_extendable=False, 1542 | syntax='proto2', 1543 | extension_ranges=[], 1544 | oneofs=[ 1545 | ], 1546 | serialized_start=5273, 1547 | serialized_end=5474, 1548 | ) 1549 | 1550 | _COREFCHAIN = _descriptor.Descriptor( 1551 | name='CorefChain', 1552 | full_name='edu.stanford.nlp.pipeline.CorefChain', 1553 | filename=None, 1554 | file=DESCRIPTOR, 1555 | containing_type=None, 1556 | fields=[ 1557 | _descriptor.FieldDescriptor( 1558 | name='chainID', full_name='edu.stanford.nlp.pipeline.CorefChain.chainID', index=0, 1559 | number=1, type=5, cpp_type=1, label=2, 1560 | has_default_value=False, default_value=0, 1561 | message_type=None, enum_type=None, containing_type=None, 1562 | is_extension=False, extension_scope=None, 1563 | options=None, file=DESCRIPTOR), 1564 | _descriptor.FieldDescriptor( 1565 | name='mention', full_name='edu.stanford.nlp.pipeline.CorefChain.mention', index=1, 1566 | number=2, type=11, cpp_type=10, label=3, 1567 | has_default_value=False, default_value=[], 1568 | message_type=None, enum_type=None, containing_type=None, 1569 | is_extension=False, extension_scope=None, 1570 | options=None, file=DESCRIPTOR), 1571 | _descriptor.FieldDescriptor( 1572 | name='representative', full_name='edu.stanford.nlp.pipeline.CorefChain.representative', index=2, 1573 | number=3, type=13, cpp_type=3, label=2, 1574 | has_default_value=False, default_value=0, 1575 | message_type=None, enum_type=None, containing_type=None, 1576 | is_extension=False, extension_scope=None, 1577 | options=None, file=DESCRIPTOR), 1578 | ], 1579 | extensions=[ 1580 | ], 1581 | nested_types=[_COREFCHAIN_COREFMENTION, ], 1582 | enum_types=[ 1583 | ], 1584 | options=None, 1585 | is_extendable=False, 1586 | syntax='proto2', 1587 | extension_ranges=[], 1588 | oneofs=[ 1589 | ], 1590 | serialized_start=5148, 1591 | serialized_end=5474, 1592 | ) 1593 | 1594 | 1595 | _MENTION = _descriptor.Descriptor( 1596 | name='Mention', 1597 | full_name='edu.stanford.nlp.pipeline.Mention', 1598 | filename=None, 1599 | file=DESCRIPTOR, 1600 | containing_type=None, 1601 | fields=[ 1602 | _descriptor.FieldDescriptor( 1603 | name='mentionID', full_name='edu.stanford.nlp.pipeline.Mention.mentionID', index=0, 1604 | number=1, type=5, cpp_type=1, label=1, 1605 | has_default_value=False, default_value=0, 1606 | message_type=None, enum_type=None, containing_type=None, 1607 | is_extension=False, extension_scope=None, 1608 | options=None, file=DESCRIPTOR), 1609 | _descriptor.FieldDescriptor( 1610 | name='mentionType', full_name='edu.stanford.nlp.pipeline.Mention.mentionType', index=1, 1611 | number=2, type=9, cpp_type=9, label=1, 1612 | has_default_value=False, default_value=_b("").decode('utf-8'), 1613 | message_type=None, enum_type=None, containing_type=None, 1614 | is_extension=False, extension_scope=None, 1615 | options=None, file=DESCRIPTOR), 1616 | _descriptor.FieldDescriptor( 1617 | name='number', full_name='edu.stanford.nlp.pipeline.Mention.number', index=2, 1618 | number=3, type=9, cpp_type=9, label=1, 1619 | has_default_value=False, default_value=_b("").decode('utf-8'), 1620 | message_type=None, enum_type=None, containing_type=None, 1621 | is_extension=False, extension_scope=None, 1622 | options=None, file=DESCRIPTOR), 1623 | _descriptor.FieldDescriptor( 1624 | name='gender', full_name='edu.stanford.nlp.pipeline.Mention.gender', index=3, 1625 | number=4, type=9, cpp_type=9, label=1, 1626 | has_default_value=False, default_value=_b("").decode('utf-8'), 1627 | message_type=None, enum_type=None, containing_type=None, 1628 | is_extension=False, extension_scope=None, 1629 | options=None, file=DESCRIPTOR), 1630 | _descriptor.FieldDescriptor( 1631 | name='animacy', full_name='edu.stanford.nlp.pipeline.Mention.animacy', index=4, 1632 | number=5, type=9, cpp_type=9, label=1, 1633 | has_default_value=False, default_value=_b("").decode('utf-8'), 1634 | message_type=None, enum_type=None, containing_type=None, 1635 | is_extension=False, extension_scope=None, 1636 | options=None, file=DESCRIPTOR), 1637 | _descriptor.FieldDescriptor( 1638 | name='person', full_name='edu.stanford.nlp.pipeline.Mention.person', index=5, 1639 | number=6, type=9, cpp_type=9, label=1, 1640 | has_default_value=False, default_value=_b("").decode('utf-8'), 1641 | message_type=None, enum_type=None, containing_type=None, 1642 | is_extension=False, extension_scope=None, 1643 | options=None, file=DESCRIPTOR), 1644 | _descriptor.FieldDescriptor( 1645 | name='startIndex', full_name='edu.stanford.nlp.pipeline.Mention.startIndex', index=6, 1646 | number=7, type=13, cpp_type=3, label=1, 1647 | has_default_value=False, default_value=0, 1648 | message_type=None, enum_type=None, containing_type=None, 1649 | is_extension=False, extension_scope=None, 1650 | options=None, file=DESCRIPTOR), 1651 | _descriptor.FieldDescriptor( 1652 | name='endIndex', full_name='edu.stanford.nlp.pipeline.Mention.endIndex', index=7, 1653 | number=9, type=13, cpp_type=3, label=1, 1654 | has_default_value=False, default_value=0, 1655 | message_type=None, enum_type=None, containing_type=None, 1656 | is_extension=False, extension_scope=None, 1657 | options=None, file=DESCRIPTOR), 1658 | _descriptor.FieldDescriptor( 1659 | name='headIndex', full_name='edu.stanford.nlp.pipeline.Mention.headIndex', index=8, 1660 | number=10, type=13, cpp_type=3, label=1, 1661 | has_default_value=False, default_value=0, 1662 | message_type=None, enum_type=None, containing_type=None, 1663 | is_extension=False, extension_scope=None, 1664 | options=None, file=DESCRIPTOR), 1665 | _descriptor.FieldDescriptor( 1666 | name='headString', full_name='edu.stanford.nlp.pipeline.Mention.headString', index=9, 1667 | number=11, type=9, cpp_type=9, label=1, 1668 | has_default_value=False, default_value=_b("").decode('utf-8'), 1669 | message_type=None, enum_type=None, containing_type=None, 1670 | is_extension=False, extension_scope=None, 1671 | options=None, file=DESCRIPTOR), 1672 | _descriptor.FieldDescriptor( 1673 | name='nerString', full_name='edu.stanford.nlp.pipeline.Mention.nerString', index=10, 1674 | number=12, type=9, cpp_type=9, label=1, 1675 | has_default_value=False, default_value=_b("").decode('utf-8'), 1676 | message_type=None, enum_type=None, containing_type=None, 1677 | is_extension=False, extension_scope=None, 1678 | options=None, file=DESCRIPTOR), 1679 | _descriptor.FieldDescriptor( 1680 | name='originalRef', full_name='edu.stanford.nlp.pipeline.Mention.originalRef', index=11, 1681 | number=13, type=13, cpp_type=3, label=1, 1682 | has_default_value=False, default_value=0, 1683 | message_type=None, enum_type=None, containing_type=None, 1684 | is_extension=False, extension_scope=None, 1685 | options=None, file=DESCRIPTOR), 1686 | _descriptor.FieldDescriptor( 1687 | name='goldCorefClusterID', full_name='edu.stanford.nlp.pipeline.Mention.goldCorefClusterID', index=12, 1688 | number=14, type=5, cpp_type=1, label=1, 1689 | has_default_value=False, default_value=0, 1690 | message_type=None, enum_type=None, containing_type=None, 1691 | is_extension=False, extension_scope=None, 1692 | options=None, file=DESCRIPTOR), 1693 | _descriptor.FieldDescriptor( 1694 | name='corefClusterID', full_name='edu.stanford.nlp.pipeline.Mention.corefClusterID', index=13, 1695 | number=15, type=5, cpp_type=1, label=1, 1696 | has_default_value=False, default_value=0, 1697 | message_type=None, enum_type=None, containing_type=None, 1698 | is_extension=False, extension_scope=None, 1699 | options=None, file=DESCRIPTOR), 1700 | _descriptor.FieldDescriptor( 1701 | name='mentionNum', full_name='edu.stanford.nlp.pipeline.Mention.mentionNum', index=14, 1702 | number=16, type=13, cpp_type=3, label=1, 1703 | has_default_value=False, default_value=0, 1704 | message_type=None, enum_type=None, containing_type=None, 1705 | is_extension=False, extension_scope=None, 1706 | options=None, file=DESCRIPTOR), 1707 | _descriptor.FieldDescriptor( 1708 | name='sentNum', full_name='edu.stanford.nlp.pipeline.Mention.sentNum', index=15, 1709 | number=17, type=13, cpp_type=3, label=1, 1710 | has_default_value=False, default_value=0, 1711 | message_type=None, enum_type=None, containing_type=None, 1712 | is_extension=False, extension_scope=None, 1713 | options=None, file=DESCRIPTOR), 1714 | _descriptor.FieldDescriptor( 1715 | name='utter', full_name='edu.stanford.nlp.pipeline.Mention.utter', index=16, 1716 | number=18, type=13, cpp_type=3, label=1, 1717 | has_default_value=False, default_value=0, 1718 | message_type=None, enum_type=None, containing_type=None, 1719 | is_extension=False, extension_scope=None, 1720 | options=None, file=DESCRIPTOR), 1721 | _descriptor.FieldDescriptor( 1722 | name='paragraph', full_name='edu.stanford.nlp.pipeline.Mention.paragraph', index=17, 1723 | number=19, type=13, cpp_type=3, label=1, 1724 | has_default_value=False, default_value=0, 1725 | message_type=None, enum_type=None, containing_type=None, 1726 | is_extension=False, extension_scope=None, 1727 | options=None, file=DESCRIPTOR), 1728 | _descriptor.FieldDescriptor( 1729 | name='isSubject', full_name='edu.stanford.nlp.pipeline.Mention.isSubject', index=18, 1730 | number=20, type=8, cpp_type=7, label=1, 1731 | has_default_value=False, default_value=False, 1732 | message_type=None, enum_type=None, containing_type=None, 1733 | is_extension=False, extension_scope=None, 1734 | options=None, file=DESCRIPTOR), 1735 | _descriptor.FieldDescriptor( 1736 | name='isDirectObject', full_name='edu.stanford.nlp.pipeline.Mention.isDirectObject', index=19, 1737 | number=21, type=8, cpp_type=7, label=1, 1738 | has_default_value=False, default_value=False, 1739 | message_type=None, enum_type=None, containing_type=None, 1740 | is_extension=False, extension_scope=None, 1741 | options=None, file=DESCRIPTOR), 1742 | _descriptor.FieldDescriptor( 1743 | name='isIndirectObject', full_name='edu.stanford.nlp.pipeline.Mention.isIndirectObject', index=20, 1744 | number=22, type=8, cpp_type=7, label=1, 1745 | has_default_value=False, default_value=False, 1746 | message_type=None, enum_type=None, containing_type=None, 1747 | is_extension=False, extension_scope=None, 1748 | options=None, file=DESCRIPTOR), 1749 | _descriptor.FieldDescriptor( 1750 | name='isPrepositionObject', full_name='edu.stanford.nlp.pipeline.Mention.isPrepositionObject', index=21, 1751 | number=23, type=8, cpp_type=7, label=1, 1752 | has_default_value=False, default_value=False, 1753 | message_type=None, enum_type=None, containing_type=None, 1754 | is_extension=False, extension_scope=None, 1755 | options=None, file=DESCRIPTOR), 1756 | _descriptor.FieldDescriptor( 1757 | name='hasTwin', full_name='edu.stanford.nlp.pipeline.Mention.hasTwin', index=22, 1758 | number=24, type=8, cpp_type=7, label=1, 1759 | has_default_value=False, default_value=False, 1760 | message_type=None, enum_type=None, containing_type=None, 1761 | is_extension=False, extension_scope=None, 1762 | options=None, file=DESCRIPTOR), 1763 | _descriptor.FieldDescriptor( 1764 | name='generic', full_name='edu.stanford.nlp.pipeline.Mention.generic', index=23, 1765 | number=25, type=8, cpp_type=7, label=1, 1766 | has_default_value=False, default_value=False, 1767 | message_type=None, enum_type=None, containing_type=None, 1768 | is_extension=False, extension_scope=None, 1769 | options=None, file=DESCRIPTOR), 1770 | _descriptor.FieldDescriptor( 1771 | name='isSingleton', full_name='edu.stanford.nlp.pipeline.Mention.isSingleton', index=24, 1772 | number=26, type=8, cpp_type=7, label=1, 1773 | has_default_value=False, default_value=False, 1774 | message_type=None, enum_type=None, containing_type=None, 1775 | is_extension=False, extension_scope=None, 1776 | options=None, file=DESCRIPTOR), 1777 | _descriptor.FieldDescriptor( 1778 | name='hasBasicDependency', full_name='edu.stanford.nlp.pipeline.Mention.hasBasicDependency', index=25, 1779 | number=27, type=8, cpp_type=7, label=1, 1780 | has_default_value=False, default_value=False, 1781 | message_type=None, enum_type=None, containing_type=None, 1782 | is_extension=False, extension_scope=None, 1783 | options=None, file=DESCRIPTOR), 1784 | _descriptor.FieldDescriptor( 1785 | name='hasEnhancedDepenedncy', full_name='edu.stanford.nlp.pipeline.Mention.hasEnhancedDepenedncy', index=26, 1786 | number=28, type=8, cpp_type=7, label=1, 1787 | has_default_value=False, default_value=False, 1788 | message_type=None, enum_type=None, containing_type=None, 1789 | is_extension=False, extension_scope=None, 1790 | options=None, file=DESCRIPTOR), 1791 | _descriptor.FieldDescriptor( 1792 | name='hasContextParseTree', full_name='edu.stanford.nlp.pipeline.Mention.hasContextParseTree', index=27, 1793 | number=29, type=8, cpp_type=7, label=1, 1794 | has_default_value=False, default_value=False, 1795 | message_type=None, enum_type=None, containing_type=None, 1796 | is_extension=False, extension_scope=None, 1797 | options=None, file=DESCRIPTOR), 1798 | _descriptor.FieldDescriptor( 1799 | name='headIndexedWord', full_name='edu.stanford.nlp.pipeline.Mention.headIndexedWord', index=28, 1800 | number=30, type=11, cpp_type=10, label=1, 1801 | has_default_value=False, default_value=None, 1802 | message_type=None, enum_type=None, containing_type=None, 1803 | is_extension=False, extension_scope=None, 1804 | options=None, file=DESCRIPTOR), 1805 | _descriptor.FieldDescriptor( 1806 | name='dependingVerb', full_name='edu.stanford.nlp.pipeline.Mention.dependingVerb', index=29, 1807 | number=31, type=11, cpp_type=10, label=1, 1808 | has_default_value=False, default_value=None, 1809 | message_type=None, enum_type=None, containing_type=None, 1810 | is_extension=False, extension_scope=None, 1811 | options=None, file=DESCRIPTOR), 1812 | _descriptor.FieldDescriptor( 1813 | name='headWord', full_name='edu.stanford.nlp.pipeline.Mention.headWord', index=30, 1814 | number=32, type=11, cpp_type=10, label=1, 1815 | has_default_value=False, default_value=None, 1816 | message_type=None, enum_type=None, containing_type=None, 1817 | is_extension=False, extension_scope=None, 1818 | options=None, file=DESCRIPTOR), 1819 | _descriptor.FieldDescriptor( 1820 | name='speakerInfo', full_name='edu.stanford.nlp.pipeline.Mention.speakerInfo', index=31, 1821 | number=33, type=11, cpp_type=10, label=1, 1822 | has_default_value=False, default_value=None, 1823 | message_type=None, enum_type=None, containing_type=None, 1824 | is_extension=False, extension_scope=None, 1825 | options=None, file=DESCRIPTOR), 1826 | _descriptor.FieldDescriptor( 1827 | name='sentenceWords', full_name='edu.stanford.nlp.pipeline.Mention.sentenceWords', index=32, 1828 | number=50, type=11, cpp_type=10, label=3, 1829 | has_default_value=False, default_value=[], 1830 | message_type=None, enum_type=None, containing_type=None, 1831 | is_extension=False, extension_scope=None, 1832 | options=None, file=DESCRIPTOR), 1833 | _descriptor.FieldDescriptor( 1834 | name='originalSpan', full_name='edu.stanford.nlp.pipeline.Mention.originalSpan', index=33, 1835 | number=51, type=11, cpp_type=10, label=3, 1836 | has_default_value=False, default_value=[], 1837 | message_type=None, enum_type=None, containing_type=None, 1838 | is_extension=False, extension_scope=None, 1839 | options=None, file=DESCRIPTOR), 1840 | _descriptor.FieldDescriptor( 1841 | name='dependents', full_name='edu.stanford.nlp.pipeline.Mention.dependents', index=34, 1842 | number=52, type=9, cpp_type=9, label=3, 1843 | has_default_value=False, default_value=[], 1844 | message_type=None, enum_type=None, containing_type=None, 1845 | is_extension=False, extension_scope=None, 1846 | options=None, file=DESCRIPTOR), 1847 | _descriptor.FieldDescriptor( 1848 | name='preprocessedTerms', full_name='edu.stanford.nlp.pipeline.Mention.preprocessedTerms', index=35, 1849 | number=53, type=9, cpp_type=9, label=3, 1850 | has_default_value=False, default_value=[], 1851 | message_type=None, enum_type=None, containing_type=None, 1852 | is_extension=False, extension_scope=None, 1853 | options=None, file=DESCRIPTOR), 1854 | _descriptor.FieldDescriptor( 1855 | name='appositions', full_name='edu.stanford.nlp.pipeline.Mention.appositions', index=36, 1856 | number=54, type=5, cpp_type=1, label=3, 1857 | has_default_value=False, default_value=[], 1858 | message_type=None, enum_type=None, containing_type=None, 1859 | is_extension=False, extension_scope=None, 1860 | options=None, file=DESCRIPTOR), 1861 | _descriptor.FieldDescriptor( 1862 | name='predicateNominatives', full_name='edu.stanford.nlp.pipeline.Mention.predicateNominatives', index=37, 1863 | number=55, type=5, cpp_type=1, label=3, 1864 | has_default_value=False, default_value=[], 1865 | message_type=None, enum_type=None, containing_type=None, 1866 | is_extension=False, extension_scope=None, 1867 | options=None, file=DESCRIPTOR), 1868 | _descriptor.FieldDescriptor( 1869 | name='relativePronouns', full_name='edu.stanford.nlp.pipeline.Mention.relativePronouns', index=38, 1870 | number=56, type=5, cpp_type=1, label=3, 1871 | has_default_value=False, default_value=[], 1872 | message_type=None, enum_type=None, containing_type=None, 1873 | is_extension=False, extension_scope=None, 1874 | options=None, file=DESCRIPTOR), 1875 | _descriptor.FieldDescriptor( 1876 | name='listMembers', full_name='edu.stanford.nlp.pipeline.Mention.listMembers', index=39, 1877 | number=57, type=5, cpp_type=1, label=3, 1878 | has_default_value=False, default_value=[], 1879 | message_type=None, enum_type=None, containing_type=None, 1880 | is_extension=False, extension_scope=None, 1881 | options=None, file=DESCRIPTOR), 1882 | _descriptor.FieldDescriptor( 1883 | name='belongToLists', full_name='edu.stanford.nlp.pipeline.Mention.belongToLists', index=40, 1884 | number=58, type=5, cpp_type=1, label=3, 1885 | has_default_value=False, default_value=[], 1886 | message_type=None, enum_type=None, containing_type=None, 1887 | is_extension=False, extension_scope=None, 1888 | options=None, file=DESCRIPTOR), 1889 | ], 1890 | extensions=[ 1891 | ], 1892 | nested_types=[], 1893 | enum_types=[ 1894 | ], 1895 | options=None, 1896 | is_extendable=False, 1897 | syntax='proto2', 1898 | extension_ranges=[], 1899 | oneofs=[ 1900 | ], 1901 | serialized_start=5477, 1902 | serialized_end=6612, 1903 | ) 1904 | 1905 | 1906 | _INDEXEDWORD = _descriptor.Descriptor( 1907 | name='IndexedWord', 1908 | full_name='edu.stanford.nlp.pipeline.IndexedWord', 1909 | filename=None, 1910 | file=DESCRIPTOR, 1911 | containing_type=None, 1912 | fields=[ 1913 | _descriptor.FieldDescriptor( 1914 | name='sentenceNum', full_name='edu.stanford.nlp.pipeline.IndexedWord.sentenceNum', index=0, 1915 | number=1, type=13, cpp_type=3, label=1, 1916 | has_default_value=False, default_value=0, 1917 | message_type=None, enum_type=None, containing_type=None, 1918 | is_extension=False, extension_scope=None, 1919 | options=None, file=DESCRIPTOR), 1920 | _descriptor.FieldDescriptor( 1921 | name='tokenIndex', full_name='edu.stanford.nlp.pipeline.IndexedWord.tokenIndex', index=1, 1922 | number=2, type=13, cpp_type=3, label=1, 1923 | has_default_value=False, default_value=0, 1924 | message_type=None, enum_type=None, containing_type=None, 1925 | is_extension=False, extension_scope=None, 1926 | options=None, file=DESCRIPTOR), 1927 | _descriptor.FieldDescriptor( 1928 | name='docID', full_name='edu.stanford.nlp.pipeline.IndexedWord.docID', index=2, 1929 | number=3, type=13, cpp_type=3, label=1, 1930 | has_default_value=False, default_value=0, 1931 | message_type=None, enum_type=None, containing_type=None, 1932 | is_extension=False, extension_scope=None, 1933 | options=None, file=DESCRIPTOR), 1934 | _descriptor.FieldDescriptor( 1935 | name='copyCount', full_name='edu.stanford.nlp.pipeline.IndexedWord.copyCount', index=3, 1936 | number=4, type=13, cpp_type=3, label=1, 1937 | has_default_value=False, default_value=0, 1938 | message_type=None, enum_type=None, containing_type=None, 1939 | is_extension=False, extension_scope=None, 1940 | options=None, file=DESCRIPTOR), 1941 | ], 1942 | extensions=[ 1943 | ], 1944 | nested_types=[], 1945 | enum_types=[ 1946 | ], 1947 | options=None, 1948 | is_extendable=False, 1949 | syntax='proto2', 1950 | extension_ranges=[], 1951 | oneofs=[ 1952 | ], 1953 | serialized_start=6614, 1954 | serialized_end=6702, 1955 | ) 1956 | 1957 | 1958 | _SPEAKERINFO = _descriptor.Descriptor( 1959 | name='SpeakerInfo', 1960 | full_name='edu.stanford.nlp.pipeline.SpeakerInfo', 1961 | filename=None, 1962 | file=DESCRIPTOR, 1963 | containing_type=None, 1964 | fields=[ 1965 | _descriptor.FieldDescriptor( 1966 | name='speakerName', full_name='edu.stanford.nlp.pipeline.SpeakerInfo.speakerName', index=0, 1967 | number=1, type=9, cpp_type=9, label=1, 1968 | has_default_value=False, default_value=_b("").decode('utf-8'), 1969 | message_type=None, enum_type=None, containing_type=None, 1970 | is_extension=False, extension_scope=None, 1971 | options=None, file=DESCRIPTOR), 1972 | _descriptor.FieldDescriptor( 1973 | name='mentions', full_name='edu.stanford.nlp.pipeline.SpeakerInfo.mentions', index=1, 1974 | number=2, type=5, cpp_type=1, label=3, 1975 | has_default_value=False, default_value=[], 1976 | message_type=None, enum_type=None, containing_type=None, 1977 | is_extension=False, extension_scope=None, 1978 | options=None, file=DESCRIPTOR), 1979 | ], 1980 | extensions=[ 1981 | ], 1982 | nested_types=[], 1983 | enum_types=[ 1984 | ], 1985 | options=None, 1986 | is_extendable=False, 1987 | syntax='proto2', 1988 | extension_ranges=[], 1989 | oneofs=[ 1990 | ], 1991 | serialized_start=6704, 1992 | serialized_end=6756, 1993 | ) 1994 | 1995 | 1996 | _SPAN = _descriptor.Descriptor( 1997 | name='Span', 1998 | full_name='edu.stanford.nlp.pipeline.Span', 1999 | filename=None, 2000 | file=DESCRIPTOR, 2001 | containing_type=None, 2002 | fields=[ 2003 | _descriptor.FieldDescriptor( 2004 | name='begin', full_name='edu.stanford.nlp.pipeline.Span.begin', index=0, 2005 | number=1, type=13, cpp_type=3, label=2, 2006 | has_default_value=False, default_value=0, 2007 | message_type=None, enum_type=None, containing_type=None, 2008 | is_extension=False, extension_scope=None, 2009 | options=None, file=DESCRIPTOR), 2010 | _descriptor.FieldDescriptor( 2011 | name='end', full_name='edu.stanford.nlp.pipeline.Span.end', index=1, 2012 | number=2, type=13, cpp_type=3, label=2, 2013 | has_default_value=False, default_value=0, 2014 | message_type=None, enum_type=None, containing_type=None, 2015 | is_extension=False, extension_scope=None, 2016 | options=None, file=DESCRIPTOR), 2017 | ], 2018 | extensions=[ 2019 | ], 2020 | nested_types=[], 2021 | enum_types=[ 2022 | ], 2023 | options=None, 2024 | is_extendable=False, 2025 | syntax='proto2', 2026 | extension_ranges=[], 2027 | oneofs=[ 2028 | ], 2029 | serialized_start=6758, 2030 | serialized_end=6792, 2031 | ) 2032 | 2033 | 2034 | _TIMEX = _descriptor.Descriptor( 2035 | name='Timex', 2036 | full_name='edu.stanford.nlp.pipeline.Timex', 2037 | filename=None, 2038 | file=DESCRIPTOR, 2039 | containing_type=None, 2040 | fields=[ 2041 | _descriptor.FieldDescriptor( 2042 | name='value', full_name='edu.stanford.nlp.pipeline.Timex.value', index=0, 2043 | number=1, type=9, cpp_type=9, label=1, 2044 | has_default_value=False, default_value=_b("").decode('utf-8'), 2045 | message_type=None, enum_type=None, containing_type=None, 2046 | is_extension=False, extension_scope=None, 2047 | options=None, file=DESCRIPTOR), 2048 | _descriptor.FieldDescriptor( 2049 | name='altValue', full_name='edu.stanford.nlp.pipeline.Timex.altValue', index=1, 2050 | number=2, type=9, cpp_type=9, label=1, 2051 | has_default_value=False, default_value=_b("").decode('utf-8'), 2052 | message_type=None, enum_type=None, containing_type=None, 2053 | is_extension=False, extension_scope=None, 2054 | options=None, file=DESCRIPTOR), 2055 | _descriptor.FieldDescriptor( 2056 | name='text', full_name='edu.stanford.nlp.pipeline.Timex.text', index=2, 2057 | number=3, type=9, cpp_type=9, label=1, 2058 | has_default_value=False, default_value=_b("").decode('utf-8'), 2059 | message_type=None, enum_type=None, containing_type=None, 2060 | is_extension=False, extension_scope=None, 2061 | options=None, file=DESCRIPTOR), 2062 | _descriptor.FieldDescriptor( 2063 | name='type', full_name='edu.stanford.nlp.pipeline.Timex.type', index=3, 2064 | number=4, type=9, cpp_type=9, label=1, 2065 | has_default_value=False, default_value=_b("").decode('utf-8'), 2066 | message_type=None, enum_type=None, containing_type=None, 2067 | is_extension=False, extension_scope=None, 2068 | options=None, file=DESCRIPTOR), 2069 | _descriptor.FieldDescriptor( 2070 | name='tid', full_name='edu.stanford.nlp.pipeline.Timex.tid', index=4, 2071 | number=5, type=9, cpp_type=9, label=1, 2072 | has_default_value=False, default_value=_b("").decode('utf-8'), 2073 | message_type=None, enum_type=None, containing_type=None, 2074 | is_extension=False, extension_scope=None, 2075 | options=None, file=DESCRIPTOR), 2076 | _descriptor.FieldDescriptor( 2077 | name='beginPoint', full_name='edu.stanford.nlp.pipeline.Timex.beginPoint', index=5, 2078 | number=6, type=13, cpp_type=3, label=1, 2079 | has_default_value=False, default_value=0, 2080 | message_type=None, enum_type=None, containing_type=None, 2081 | is_extension=False, extension_scope=None, 2082 | options=None, file=DESCRIPTOR), 2083 | _descriptor.FieldDescriptor( 2084 | name='endPoint', full_name='edu.stanford.nlp.pipeline.Timex.endPoint', index=6, 2085 | number=7, type=13, cpp_type=3, label=1, 2086 | has_default_value=False, default_value=0, 2087 | message_type=None, enum_type=None, containing_type=None, 2088 | is_extension=False, extension_scope=None, 2089 | options=None, file=DESCRIPTOR), 2090 | ], 2091 | extensions=[ 2092 | ], 2093 | nested_types=[], 2094 | enum_types=[ 2095 | ], 2096 | options=None, 2097 | is_extendable=False, 2098 | syntax='proto2', 2099 | extension_ranges=[], 2100 | oneofs=[ 2101 | ], 2102 | serialized_start=6794, 2103 | serialized_end=6913, 2104 | ) 2105 | 2106 | 2107 | _ENTITY = _descriptor.Descriptor( 2108 | name='Entity', 2109 | full_name='edu.stanford.nlp.pipeline.Entity', 2110 | filename=None, 2111 | file=DESCRIPTOR, 2112 | containing_type=None, 2113 | fields=[ 2114 | _descriptor.FieldDescriptor( 2115 | name='headStart', full_name='edu.stanford.nlp.pipeline.Entity.headStart', index=0, 2116 | number=6, type=13, cpp_type=3, label=1, 2117 | has_default_value=False, default_value=0, 2118 | message_type=None, enum_type=None, containing_type=None, 2119 | is_extension=False, extension_scope=None, 2120 | options=None, file=DESCRIPTOR), 2121 | _descriptor.FieldDescriptor( 2122 | name='headEnd', full_name='edu.stanford.nlp.pipeline.Entity.headEnd', index=1, 2123 | number=7, type=13, cpp_type=3, label=1, 2124 | has_default_value=False, default_value=0, 2125 | message_type=None, enum_type=None, containing_type=None, 2126 | is_extension=False, extension_scope=None, 2127 | options=None, file=DESCRIPTOR), 2128 | _descriptor.FieldDescriptor( 2129 | name='mentionType', full_name='edu.stanford.nlp.pipeline.Entity.mentionType', index=2, 2130 | number=8, type=9, cpp_type=9, label=1, 2131 | has_default_value=False, default_value=_b("").decode('utf-8'), 2132 | message_type=None, enum_type=None, containing_type=None, 2133 | is_extension=False, extension_scope=None, 2134 | options=None, file=DESCRIPTOR), 2135 | _descriptor.FieldDescriptor( 2136 | name='normalizedName', full_name='edu.stanford.nlp.pipeline.Entity.normalizedName', index=3, 2137 | number=9, type=9, cpp_type=9, label=1, 2138 | has_default_value=False, default_value=_b("").decode('utf-8'), 2139 | message_type=None, enum_type=None, containing_type=None, 2140 | is_extension=False, extension_scope=None, 2141 | options=None, file=DESCRIPTOR), 2142 | _descriptor.FieldDescriptor( 2143 | name='headTokenIndex', full_name='edu.stanford.nlp.pipeline.Entity.headTokenIndex', index=4, 2144 | number=10, type=13, cpp_type=3, label=1, 2145 | has_default_value=False, default_value=0, 2146 | message_type=None, enum_type=None, containing_type=None, 2147 | is_extension=False, extension_scope=None, 2148 | options=None, file=DESCRIPTOR), 2149 | _descriptor.FieldDescriptor( 2150 | name='corefID', full_name='edu.stanford.nlp.pipeline.Entity.corefID', index=5, 2151 | number=11, type=9, cpp_type=9, label=1, 2152 | has_default_value=False, default_value=_b("").decode('utf-8'), 2153 | message_type=None, enum_type=None, containing_type=None, 2154 | is_extension=False, extension_scope=None, 2155 | options=None, file=DESCRIPTOR), 2156 | _descriptor.FieldDescriptor( 2157 | name='objectID', full_name='edu.stanford.nlp.pipeline.Entity.objectID', index=6, 2158 | number=1, type=9, cpp_type=9, label=1, 2159 | has_default_value=False, default_value=_b("").decode('utf-8'), 2160 | message_type=None, enum_type=None, containing_type=None, 2161 | is_extension=False, extension_scope=None, 2162 | options=None, file=DESCRIPTOR), 2163 | _descriptor.FieldDescriptor( 2164 | name='extentStart', full_name='edu.stanford.nlp.pipeline.Entity.extentStart', index=7, 2165 | number=2, type=13, cpp_type=3, label=1, 2166 | has_default_value=False, default_value=0, 2167 | message_type=None, enum_type=None, containing_type=None, 2168 | is_extension=False, extension_scope=None, 2169 | options=None, file=DESCRIPTOR), 2170 | _descriptor.FieldDescriptor( 2171 | name='extentEnd', full_name='edu.stanford.nlp.pipeline.Entity.extentEnd', index=8, 2172 | number=3, type=13, cpp_type=3, label=1, 2173 | has_default_value=False, default_value=0, 2174 | message_type=None, enum_type=None, containing_type=None, 2175 | is_extension=False, extension_scope=None, 2176 | options=None, file=DESCRIPTOR), 2177 | _descriptor.FieldDescriptor( 2178 | name='type', full_name='edu.stanford.nlp.pipeline.Entity.type', index=9, 2179 | number=4, type=9, cpp_type=9, label=1, 2180 | has_default_value=False, default_value=_b("").decode('utf-8'), 2181 | message_type=None, enum_type=None, containing_type=None, 2182 | is_extension=False, extension_scope=None, 2183 | options=None, file=DESCRIPTOR), 2184 | _descriptor.FieldDescriptor( 2185 | name='subtype', full_name='edu.stanford.nlp.pipeline.Entity.subtype', index=10, 2186 | number=5, type=9, cpp_type=9, label=1, 2187 | has_default_value=False, default_value=_b("").decode('utf-8'), 2188 | message_type=None, enum_type=None, containing_type=None, 2189 | is_extension=False, extension_scope=None, 2190 | options=None, file=DESCRIPTOR), 2191 | ], 2192 | extensions=[ 2193 | ], 2194 | nested_types=[], 2195 | enum_types=[ 2196 | ], 2197 | options=None, 2198 | is_extendable=False, 2199 | syntax='proto2', 2200 | extension_ranges=[], 2201 | oneofs=[ 2202 | ], 2203 | serialized_start=6916, 2204 | serialized_end=7135, 2205 | ) 2206 | 2207 | 2208 | _RELATION = _descriptor.Descriptor( 2209 | name='Relation', 2210 | full_name='edu.stanford.nlp.pipeline.Relation', 2211 | filename=None, 2212 | file=DESCRIPTOR, 2213 | containing_type=None, 2214 | fields=[ 2215 | _descriptor.FieldDescriptor( 2216 | name='argName', full_name='edu.stanford.nlp.pipeline.Relation.argName', index=0, 2217 | number=6, type=9, cpp_type=9, label=3, 2218 | has_default_value=False, default_value=[], 2219 | message_type=None, enum_type=None, containing_type=None, 2220 | is_extension=False, extension_scope=None, 2221 | options=None, file=DESCRIPTOR), 2222 | _descriptor.FieldDescriptor( 2223 | name='arg', full_name='edu.stanford.nlp.pipeline.Relation.arg', index=1, 2224 | number=7, type=11, cpp_type=10, label=3, 2225 | has_default_value=False, default_value=[], 2226 | message_type=None, enum_type=None, containing_type=None, 2227 | is_extension=False, extension_scope=None, 2228 | options=None, file=DESCRIPTOR), 2229 | _descriptor.FieldDescriptor( 2230 | name='signature', full_name='edu.stanford.nlp.pipeline.Relation.signature', index=2, 2231 | number=8, type=9, cpp_type=9, label=1, 2232 | has_default_value=False, default_value=_b("").decode('utf-8'), 2233 | message_type=None, enum_type=None, containing_type=None, 2234 | is_extension=False, extension_scope=None, 2235 | options=None, file=DESCRIPTOR), 2236 | _descriptor.FieldDescriptor( 2237 | name='objectID', full_name='edu.stanford.nlp.pipeline.Relation.objectID', index=3, 2238 | number=1, type=9, cpp_type=9, label=1, 2239 | has_default_value=False, default_value=_b("").decode('utf-8'), 2240 | message_type=None, enum_type=None, containing_type=None, 2241 | is_extension=False, extension_scope=None, 2242 | options=None, file=DESCRIPTOR), 2243 | _descriptor.FieldDescriptor( 2244 | name='extentStart', full_name='edu.stanford.nlp.pipeline.Relation.extentStart', index=4, 2245 | number=2, type=13, cpp_type=3, label=1, 2246 | has_default_value=False, default_value=0, 2247 | message_type=None, enum_type=None, containing_type=None, 2248 | is_extension=False, extension_scope=None, 2249 | options=None, file=DESCRIPTOR), 2250 | _descriptor.FieldDescriptor( 2251 | name='extentEnd', full_name='edu.stanford.nlp.pipeline.Relation.extentEnd', index=5, 2252 | number=3, type=13, cpp_type=3, label=1, 2253 | has_default_value=False, default_value=0, 2254 | message_type=None, enum_type=None, containing_type=None, 2255 | is_extension=False, extension_scope=None, 2256 | options=None, file=DESCRIPTOR), 2257 | _descriptor.FieldDescriptor( 2258 | name='type', full_name='edu.stanford.nlp.pipeline.Relation.type', index=6, 2259 | number=4, type=9, cpp_type=9, label=1, 2260 | has_default_value=False, default_value=_b("").decode('utf-8'), 2261 | message_type=None, enum_type=None, containing_type=None, 2262 | is_extension=False, extension_scope=None, 2263 | options=None, file=DESCRIPTOR), 2264 | _descriptor.FieldDescriptor( 2265 | name='subtype', full_name='edu.stanford.nlp.pipeline.Relation.subtype', index=7, 2266 | number=5, type=9, cpp_type=9, label=1, 2267 | has_default_value=False, default_value=_b("").decode('utf-8'), 2268 | message_type=None, enum_type=None, containing_type=None, 2269 | is_extension=False, extension_scope=None, 2270 | options=None, file=DESCRIPTOR), 2271 | ], 2272 | extensions=[ 2273 | ], 2274 | nested_types=[], 2275 | enum_types=[ 2276 | ], 2277 | options=None, 2278 | is_extendable=False, 2279 | syntax='proto2', 2280 | extension_ranges=[], 2281 | oneofs=[ 2282 | ], 2283 | serialized_start=7138, 2284 | serialized_end=7321, 2285 | ) 2286 | 2287 | 2288 | _OPERATOR = _descriptor.Descriptor( 2289 | name='Operator', 2290 | full_name='edu.stanford.nlp.pipeline.Operator', 2291 | filename=None, 2292 | file=DESCRIPTOR, 2293 | containing_type=None, 2294 | fields=[ 2295 | _descriptor.FieldDescriptor( 2296 | name='name', full_name='edu.stanford.nlp.pipeline.Operator.name', index=0, 2297 | number=1, type=9, cpp_type=9, label=2, 2298 | has_default_value=False, default_value=_b("").decode('utf-8'), 2299 | message_type=None, enum_type=None, containing_type=None, 2300 | is_extension=False, extension_scope=None, 2301 | options=None, file=DESCRIPTOR), 2302 | _descriptor.FieldDescriptor( 2303 | name='quantifierSpanBegin', full_name='edu.stanford.nlp.pipeline.Operator.quantifierSpanBegin', index=1, 2304 | number=2, type=5, cpp_type=1, label=2, 2305 | has_default_value=False, default_value=0, 2306 | message_type=None, enum_type=None, containing_type=None, 2307 | is_extension=False, extension_scope=None, 2308 | options=None, file=DESCRIPTOR), 2309 | _descriptor.FieldDescriptor( 2310 | name='quantifierSpanEnd', full_name='edu.stanford.nlp.pipeline.Operator.quantifierSpanEnd', index=2, 2311 | number=3, type=5, cpp_type=1, label=2, 2312 | has_default_value=False, default_value=0, 2313 | message_type=None, enum_type=None, containing_type=None, 2314 | is_extension=False, extension_scope=None, 2315 | options=None, file=DESCRIPTOR), 2316 | _descriptor.FieldDescriptor( 2317 | name='subjectSpanBegin', full_name='edu.stanford.nlp.pipeline.Operator.subjectSpanBegin', index=3, 2318 | number=4, type=5, cpp_type=1, label=2, 2319 | has_default_value=False, default_value=0, 2320 | message_type=None, enum_type=None, containing_type=None, 2321 | is_extension=False, extension_scope=None, 2322 | options=None, file=DESCRIPTOR), 2323 | _descriptor.FieldDescriptor( 2324 | name='subjectSpanEnd', full_name='edu.stanford.nlp.pipeline.Operator.subjectSpanEnd', index=4, 2325 | number=5, type=5, cpp_type=1, label=2, 2326 | has_default_value=False, default_value=0, 2327 | message_type=None, enum_type=None, containing_type=None, 2328 | is_extension=False, extension_scope=None, 2329 | options=None, file=DESCRIPTOR), 2330 | _descriptor.FieldDescriptor( 2331 | name='objectSpanBegin', full_name='edu.stanford.nlp.pipeline.Operator.objectSpanBegin', index=5, 2332 | number=6, type=5, cpp_type=1, label=2, 2333 | has_default_value=False, default_value=0, 2334 | message_type=None, enum_type=None, containing_type=None, 2335 | is_extension=False, extension_scope=None, 2336 | options=None, file=DESCRIPTOR), 2337 | _descriptor.FieldDescriptor( 2338 | name='objectSpanEnd', full_name='edu.stanford.nlp.pipeline.Operator.objectSpanEnd', index=6, 2339 | number=7, type=5, cpp_type=1, label=2, 2340 | has_default_value=False, default_value=0, 2341 | message_type=None, enum_type=None, containing_type=None, 2342 | is_extension=False, extension_scope=None, 2343 | options=None, file=DESCRIPTOR), 2344 | ], 2345 | extensions=[ 2346 | ], 2347 | nested_types=[], 2348 | enum_types=[ 2349 | ], 2350 | options=None, 2351 | is_extendable=False, 2352 | syntax='proto2', 2353 | extension_ranges=[], 2354 | oneofs=[ 2355 | ], 2356 | serialized_start=7324, 2357 | serialized_end=7502, 2358 | ) 2359 | 2360 | 2361 | _POLARITY = _descriptor.Descriptor( 2362 | name='Polarity', 2363 | full_name='edu.stanford.nlp.pipeline.Polarity', 2364 | filename=None, 2365 | file=DESCRIPTOR, 2366 | containing_type=None, 2367 | fields=[ 2368 | _descriptor.FieldDescriptor( 2369 | name='projectEquivalence', full_name='edu.stanford.nlp.pipeline.Polarity.projectEquivalence', index=0, 2370 | number=1, type=14, cpp_type=8, label=2, 2371 | has_default_value=False, default_value=0, 2372 | message_type=None, enum_type=None, containing_type=None, 2373 | is_extension=False, extension_scope=None, 2374 | options=None, file=DESCRIPTOR), 2375 | _descriptor.FieldDescriptor( 2376 | name='projectForwardEntailment', full_name='edu.stanford.nlp.pipeline.Polarity.projectForwardEntailment', index=1, 2377 | number=2, type=14, cpp_type=8, label=2, 2378 | has_default_value=False, default_value=0, 2379 | message_type=None, enum_type=None, containing_type=None, 2380 | is_extension=False, extension_scope=None, 2381 | options=None, file=DESCRIPTOR), 2382 | _descriptor.FieldDescriptor( 2383 | name='projectReverseEntailment', full_name='edu.stanford.nlp.pipeline.Polarity.projectReverseEntailment', index=2, 2384 | number=3, type=14, cpp_type=8, label=2, 2385 | has_default_value=False, default_value=0, 2386 | message_type=None, enum_type=None, containing_type=None, 2387 | is_extension=False, extension_scope=None, 2388 | options=None, file=DESCRIPTOR), 2389 | _descriptor.FieldDescriptor( 2390 | name='projectNegation', full_name='edu.stanford.nlp.pipeline.Polarity.projectNegation', index=3, 2391 | number=4, type=14, cpp_type=8, label=2, 2392 | has_default_value=False, default_value=0, 2393 | message_type=None, enum_type=None, containing_type=None, 2394 | is_extension=False, extension_scope=None, 2395 | options=None, file=DESCRIPTOR), 2396 | _descriptor.FieldDescriptor( 2397 | name='projectAlternation', full_name='edu.stanford.nlp.pipeline.Polarity.projectAlternation', index=4, 2398 | number=5, type=14, cpp_type=8, label=2, 2399 | has_default_value=False, default_value=0, 2400 | message_type=None, enum_type=None, containing_type=None, 2401 | is_extension=False, extension_scope=None, 2402 | options=None, file=DESCRIPTOR), 2403 | _descriptor.FieldDescriptor( 2404 | name='projectCover', full_name='edu.stanford.nlp.pipeline.Polarity.projectCover', index=5, 2405 | number=6, type=14, cpp_type=8, label=2, 2406 | has_default_value=False, default_value=0, 2407 | message_type=None, enum_type=None, containing_type=None, 2408 | is_extension=False, extension_scope=None, 2409 | options=None, file=DESCRIPTOR), 2410 | _descriptor.FieldDescriptor( 2411 | name='projectIndependence', full_name='edu.stanford.nlp.pipeline.Polarity.projectIndependence', index=6, 2412 | number=7, type=14, cpp_type=8, label=2, 2413 | has_default_value=False, default_value=0, 2414 | message_type=None, enum_type=None, containing_type=None, 2415 | is_extension=False, extension_scope=None, 2416 | options=None, file=DESCRIPTOR), 2417 | ], 2418 | extensions=[ 2419 | ], 2420 | nested_types=[], 2421 | enum_types=[ 2422 | ], 2423 | options=None, 2424 | is_extendable=False, 2425 | syntax='proto2', 2426 | extension_ranges=[], 2427 | oneofs=[ 2428 | ], 2429 | serialized_start=7505, 2430 | serialized_end=8058, 2431 | ) 2432 | 2433 | 2434 | _NERMENTION = _descriptor.Descriptor( 2435 | name='NERMention', 2436 | full_name='edu.stanford.nlp.pipeline.NERMention', 2437 | filename=None, 2438 | file=DESCRIPTOR, 2439 | containing_type=None, 2440 | fields=[ 2441 | _descriptor.FieldDescriptor( 2442 | name='sentenceIndex', full_name='edu.stanford.nlp.pipeline.NERMention.sentenceIndex', index=0, 2443 | number=1, type=13, cpp_type=3, label=1, 2444 | has_default_value=False, default_value=0, 2445 | message_type=None, enum_type=None, containing_type=None, 2446 | is_extension=False, extension_scope=None, 2447 | options=None, file=DESCRIPTOR), 2448 | _descriptor.FieldDescriptor( 2449 | name='tokenStartInSentenceInclusive', full_name='edu.stanford.nlp.pipeline.NERMention.tokenStartInSentenceInclusive', index=1, 2450 | number=2, type=13, cpp_type=3, label=2, 2451 | has_default_value=False, default_value=0, 2452 | message_type=None, enum_type=None, containing_type=None, 2453 | is_extension=False, extension_scope=None, 2454 | options=None, file=DESCRIPTOR), 2455 | _descriptor.FieldDescriptor( 2456 | name='tokenEndInSentenceExclusive', full_name='edu.stanford.nlp.pipeline.NERMention.tokenEndInSentenceExclusive', index=2, 2457 | number=3, type=13, cpp_type=3, label=2, 2458 | has_default_value=False, default_value=0, 2459 | message_type=None, enum_type=None, containing_type=None, 2460 | is_extension=False, extension_scope=None, 2461 | options=None, file=DESCRIPTOR), 2462 | _descriptor.FieldDescriptor( 2463 | name='ner', full_name='edu.stanford.nlp.pipeline.NERMention.ner', index=3, 2464 | number=4, type=9, cpp_type=9, label=2, 2465 | has_default_value=False, default_value=_b("").decode('utf-8'), 2466 | message_type=None, enum_type=None, containing_type=None, 2467 | is_extension=False, extension_scope=None, 2468 | options=None, file=DESCRIPTOR), 2469 | _descriptor.FieldDescriptor( 2470 | name='normalizedNER', full_name='edu.stanford.nlp.pipeline.NERMention.normalizedNER', index=4, 2471 | number=5, type=9, cpp_type=9, label=1, 2472 | has_default_value=False, default_value=_b("").decode('utf-8'), 2473 | message_type=None, enum_type=None, containing_type=None, 2474 | is_extension=False, extension_scope=None, 2475 | options=None, file=DESCRIPTOR), 2476 | _descriptor.FieldDescriptor( 2477 | name='entityType', full_name='edu.stanford.nlp.pipeline.NERMention.entityType', index=5, 2478 | number=6, type=9, cpp_type=9, label=1, 2479 | has_default_value=False, default_value=_b("").decode('utf-8'), 2480 | message_type=None, enum_type=None, containing_type=None, 2481 | is_extension=False, extension_scope=None, 2482 | options=None, file=DESCRIPTOR), 2483 | _descriptor.FieldDescriptor( 2484 | name='timex', full_name='edu.stanford.nlp.pipeline.NERMention.timex', index=6, 2485 | number=7, type=11, cpp_type=10, label=1, 2486 | has_default_value=False, default_value=None, 2487 | message_type=None, enum_type=None, containing_type=None, 2488 | is_extension=False, extension_scope=None, 2489 | options=None, file=DESCRIPTOR), 2490 | _descriptor.FieldDescriptor( 2491 | name='wikipediaEntity', full_name='edu.stanford.nlp.pipeline.NERMention.wikipediaEntity', index=7, 2492 | number=8, type=9, cpp_type=9, label=1, 2493 | has_default_value=False, default_value=_b("").decode('utf-8'), 2494 | message_type=None, enum_type=None, containing_type=None, 2495 | is_extension=False, extension_scope=None, 2496 | options=None, file=DESCRIPTOR), 2497 | _descriptor.FieldDescriptor( 2498 | name='gender', full_name='edu.stanford.nlp.pipeline.NERMention.gender', index=8, 2499 | number=9, type=9, cpp_type=9, label=1, 2500 | has_default_value=False, default_value=_b("").decode('utf-8'), 2501 | message_type=None, enum_type=None, containing_type=None, 2502 | is_extension=False, extension_scope=None, 2503 | options=None, file=DESCRIPTOR), 2504 | _descriptor.FieldDescriptor( 2505 | name='entityMentionIndex', full_name='edu.stanford.nlp.pipeline.NERMention.entityMentionIndex', index=9, 2506 | number=10, type=13, cpp_type=3, label=1, 2507 | has_default_value=False, default_value=0, 2508 | message_type=None, enum_type=None, containing_type=None, 2509 | is_extension=False, extension_scope=None, 2510 | options=None, file=DESCRIPTOR), 2511 | _descriptor.FieldDescriptor( 2512 | name='canonicalEntityMentionIndex', full_name='edu.stanford.nlp.pipeline.NERMention.canonicalEntityMentionIndex', index=10, 2513 | number=11, type=13, cpp_type=3, label=1, 2514 | has_default_value=False, default_value=0, 2515 | message_type=None, enum_type=None, containing_type=None, 2516 | is_extension=False, extension_scope=None, 2517 | options=None, file=DESCRIPTOR), 2518 | _descriptor.FieldDescriptor( 2519 | name='entityMentionText', full_name='edu.stanford.nlp.pipeline.NERMention.entityMentionText', index=11, 2520 | number=12, type=9, cpp_type=9, label=1, 2521 | has_default_value=False, default_value=_b("").decode('utf-8'), 2522 | message_type=None, enum_type=None, containing_type=None, 2523 | is_extension=False, extension_scope=None, 2524 | options=None, file=DESCRIPTOR), 2525 | ], 2526 | extensions=[ 2527 | ], 2528 | nested_types=[], 2529 | enum_types=[ 2530 | ], 2531 | options=None, 2532 | is_extendable=False, 2533 | syntax='proto2', 2534 | extension_ranges=[], 2535 | oneofs=[ 2536 | ], 2537 | serialized_start=8061, 2538 | serialized_end=8410, 2539 | ) 2540 | 2541 | 2542 | _SENTENCEFRAGMENT = _descriptor.Descriptor( 2543 | name='SentenceFragment', 2544 | full_name='edu.stanford.nlp.pipeline.SentenceFragment', 2545 | filename=None, 2546 | file=DESCRIPTOR, 2547 | containing_type=None, 2548 | fields=[ 2549 | _descriptor.FieldDescriptor( 2550 | name='tokenIndex', full_name='edu.stanford.nlp.pipeline.SentenceFragment.tokenIndex', index=0, 2551 | number=1, type=13, cpp_type=3, label=3, 2552 | has_default_value=False, default_value=[], 2553 | message_type=None, enum_type=None, containing_type=None, 2554 | is_extension=False, extension_scope=None, 2555 | options=None, file=DESCRIPTOR), 2556 | _descriptor.FieldDescriptor( 2557 | name='root', full_name='edu.stanford.nlp.pipeline.SentenceFragment.root', index=1, 2558 | number=2, type=13, cpp_type=3, label=1, 2559 | has_default_value=False, default_value=0, 2560 | message_type=None, enum_type=None, containing_type=None, 2561 | is_extension=False, extension_scope=None, 2562 | options=None, file=DESCRIPTOR), 2563 | _descriptor.FieldDescriptor( 2564 | name='assumedTruth', full_name='edu.stanford.nlp.pipeline.SentenceFragment.assumedTruth', index=2, 2565 | number=3, type=8, cpp_type=7, label=1, 2566 | has_default_value=False, default_value=False, 2567 | message_type=None, enum_type=None, containing_type=None, 2568 | is_extension=False, extension_scope=None, 2569 | options=None, file=DESCRIPTOR), 2570 | _descriptor.FieldDescriptor( 2571 | name='score', full_name='edu.stanford.nlp.pipeline.SentenceFragment.score', index=3, 2572 | number=4, type=1, cpp_type=5, label=1, 2573 | has_default_value=False, default_value=float(0), 2574 | message_type=None, enum_type=None, containing_type=None, 2575 | is_extension=False, extension_scope=None, 2576 | options=None, file=DESCRIPTOR), 2577 | ], 2578 | extensions=[ 2579 | ], 2580 | nested_types=[], 2581 | enum_types=[ 2582 | ], 2583 | options=None, 2584 | is_extendable=False, 2585 | syntax='proto2', 2586 | extension_ranges=[], 2587 | oneofs=[ 2588 | ], 2589 | serialized_start=8412, 2590 | serialized_end=8501, 2591 | ) 2592 | 2593 | 2594 | _TOKENLOCATION = _descriptor.Descriptor( 2595 | name='TokenLocation', 2596 | full_name='edu.stanford.nlp.pipeline.TokenLocation', 2597 | filename=None, 2598 | file=DESCRIPTOR, 2599 | containing_type=None, 2600 | fields=[ 2601 | _descriptor.FieldDescriptor( 2602 | name='sentenceIndex', full_name='edu.stanford.nlp.pipeline.TokenLocation.sentenceIndex', index=0, 2603 | number=1, type=13, cpp_type=3, label=1, 2604 | has_default_value=False, default_value=0, 2605 | message_type=None, enum_type=None, containing_type=None, 2606 | is_extension=False, extension_scope=None, 2607 | options=None, file=DESCRIPTOR), 2608 | _descriptor.FieldDescriptor( 2609 | name='tokenIndex', full_name='edu.stanford.nlp.pipeline.TokenLocation.tokenIndex', index=1, 2610 | number=2, type=13, cpp_type=3, label=1, 2611 | has_default_value=False, default_value=0, 2612 | message_type=None, enum_type=None, containing_type=None, 2613 | is_extension=False, extension_scope=None, 2614 | options=None, file=DESCRIPTOR), 2615 | ], 2616 | extensions=[ 2617 | ], 2618 | nested_types=[], 2619 | enum_types=[ 2620 | ], 2621 | options=None, 2622 | is_extendable=False, 2623 | syntax='proto2', 2624 | extension_ranges=[], 2625 | oneofs=[ 2626 | ], 2627 | serialized_start=8503, 2628 | serialized_end=8561, 2629 | ) 2630 | 2631 | 2632 | _RELATIONTRIPLE = _descriptor.Descriptor( 2633 | name='RelationTriple', 2634 | full_name='edu.stanford.nlp.pipeline.RelationTriple', 2635 | filename=None, 2636 | file=DESCRIPTOR, 2637 | containing_type=None, 2638 | fields=[ 2639 | _descriptor.FieldDescriptor( 2640 | name='subject', full_name='edu.stanford.nlp.pipeline.RelationTriple.subject', index=0, 2641 | number=1, type=9, cpp_type=9, label=1, 2642 | has_default_value=False, default_value=_b("").decode('utf-8'), 2643 | message_type=None, enum_type=None, containing_type=None, 2644 | is_extension=False, extension_scope=None, 2645 | options=None, file=DESCRIPTOR), 2646 | _descriptor.FieldDescriptor( 2647 | name='relation', full_name='edu.stanford.nlp.pipeline.RelationTriple.relation', index=1, 2648 | number=2, type=9, cpp_type=9, label=1, 2649 | has_default_value=False, default_value=_b("").decode('utf-8'), 2650 | message_type=None, enum_type=None, containing_type=None, 2651 | is_extension=False, extension_scope=None, 2652 | options=None, file=DESCRIPTOR), 2653 | _descriptor.FieldDescriptor( 2654 | name='object', full_name='edu.stanford.nlp.pipeline.RelationTriple.object', index=2, 2655 | number=3, type=9, cpp_type=9, label=1, 2656 | has_default_value=False, default_value=_b("").decode('utf-8'), 2657 | message_type=None, enum_type=None, containing_type=None, 2658 | is_extension=False, extension_scope=None, 2659 | options=None, file=DESCRIPTOR), 2660 | _descriptor.FieldDescriptor( 2661 | name='confidence', full_name='edu.stanford.nlp.pipeline.RelationTriple.confidence', index=3, 2662 | number=4, type=1, cpp_type=5, label=1, 2663 | has_default_value=False, default_value=float(0), 2664 | message_type=None, enum_type=None, containing_type=None, 2665 | is_extension=False, extension_scope=None, 2666 | options=None, file=DESCRIPTOR), 2667 | _descriptor.FieldDescriptor( 2668 | name='subjectTokens', full_name='edu.stanford.nlp.pipeline.RelationTriple.subjectTokens', index=4, 2669 | number=13, type=11, cpp_type=10, label=3, 2670 | has_default_value=False, default_value=[], 2671 | message_type=None, enum_type=None, containing_type=None, 2672 | is_extension=False, extension_scope=None, 2673 | options=None, file=DESCRIPTOR), 2674 | _descriptor.FieldDescriptor( 2675 | name='relationTokens', full_name='edu.stanford.nlp.pipeline.RelationTriple.relationTokens', index=5, 2676 | number=14, type=11, cpp_type=10, label=3, 2677 | has_default_value=False, default_value=[], 2678 | message_type=None, enum_type=None, containing_type=None, 2679 | is_extension=False, extension_scope=None, 2680 | options=None, file=DESCRIPTOR), 2681 | _descriptor.FieldDescriptor( 2682 | name='objectTokens', full_name='edu.stanford.nlp.pipeline.RelationTriple.objectTokens', index=6, 2683 | number=15, type=11, cpp_type=10, label=3, 2684 | has_default_value=False, default_value=[], 2685 | message_type=None, enum_type=None, containing_type=None, 2686 | is_extension=False, extension_scope=None, 2687 | options=None, file=DESCRIPTOR), 2688 | _descriptor.FieldDescriptor( 2689 | name='tree', full_name='edu.stanford.nlp.pipeline.RelationTriple.tree', index=7, 2690 | number=8, type=11, cpp_type=10, label=1, 2691 | has_default_value=False, default_value=None, 2692 | message_type=None, enum_type=None, containing_type=None, 2693 | is_extension=False, extension_scope=None, 2694 | options=None, file=DESCRIPTOR), 2695 | _descriptor.FieldDescriptor( 2696 | name='istmod', full_name='edu.stanford.nlp.pipeline.RelationTriple.istmod', index=8, 2697 | number=9, type=8, cpp_type=7, label=1, 2698 | has_default_value=False, default_value=False, 2699 | message_type=None, enum_type=None, containing_type=None, 2700 | is_extension=False, extension_scope=None, 2701 | options=None, file=DESCRIPTOR), 2702 | _descriptor.FieldDescriptor( 2703 | name='prefixBe', full_name='edu.stanford.nlp.pipeline.RelationTriple.prefixBe', index=9, 2704 | number=10, type=8, cpp_type=7, label=1, 2705 | has_default_value=False, default_value=False, 2706 | message_type=None, enum_type=None, containing_type=None, 2707 | is_extension=False, extension_scope=None, 2708 | options=None, file=DESCRIPTOR), 2709 | _descriptor.FieldDescriptor( 2710 | name='suffixBe', full_name='edu.stanford.nlp.pipeline.RelationTriple.suffixBe', index=10, 2711 | number=11, type=8, cpp_type=7, label=1, 2712 | has_default_value=False, default_value=False, 2713 | message_type=None, enum_type=None, containing_type=None, 2714 | is_extension=False, extension_scope=None, 2715 | options=None, file=DESCRIPTOR), 2716 | _descriptor.FieldDescriptor( 2717 | name='suffixOf', full_name='edu.stanford.nlp.pipeline.RelationTriple.suffixOf', index=11, 2718 | number=12, type=8, cpp_type=7, label=1, 2719 | has_default_value=False, default_value=False, 2720 | message_type=None, enum_type=None, containing_type=None, 2721 | is_extension=False, extension_scope=None, 2722 | options=None, file=DESCRIPTOR), 2723 | ], 2724 | extensions=[ 2725 | ], 2726 | nested_types=[], 2727 | enum_types=[ 2728 | ], 2729 | options=None, 2730 | is_extendable=False, 2731 | syntax='proto2', 2732 | extension_ranges=[], 2733 | oneofs=[ 2734 | ], 2735 | serialized_start=8564, 2736 | serialized_end=8974, 2737 | ) 2738 | 2739 | 2740 | _MAPSTRINGSTRING = _descriptor.Descriptor( 2741 | name='MapStringString', 2742 | full_name='edu.stanford.nlp.pipeline.MapStringString', 2743 | filename=None, 2744 | file=DESCRIPTOR, 2745 | containing_type=None, 2746 | fields=[ 2747 | _descriptor.FieldDescriptor( 2748 | name='key', full_name='edu.stanford.nlp.pipeline.MapStringString.key', index=0, 2749 | number=1, type=9, cpp_type=9, label=3, 2750 | has_default_value=False, default_value=[], 2751 | message_type=None, enum_type=None, containing_type=None, 2752 | is_extension=False, extension_scope=None, 2753 | options=None, file=DESCRIPTOR), 2754 | _descriptor.FieldDescriptor( 2755 | name='value', full_name='edu.stanford.nlp.pipeline.MapStringString.value', index=1, 2756 | number=2, type=9, cpp_type=9, label=3, 2757 | has_default_value=False, default_value=[], 2758 | message_type=None, enum_type=None, containing_type=None, 2759 | is_extension=False, extension_scope=None, 2760 | options=None, file=DESCRIPTOR), 2761 | ], 2762 | extensions=[ 2763 | ], 2764 | nested_types=[], 2765 | enum_types=[ 2766 | ], 2767 | options=None, 2768 | is_extendable=False, 2769 | syntax='proto2', 2770 | extension_ranges=[], 2771 | oneofs=[ 2772 | ], 2773 | serialized_start=8976, 2774 | serialized_end=9021, 2775 | ) 2776 | 2777 | 2778 | _MAPINTSTRING = _descriptor.Descriptor( 2779 | name='MapIntString', 2780 | full_name='edu.stanford.nlp.pipeline.MapIntString', 2781 | filename=None, 2782 | file=DESCRIPTOR, 2783 | containing_type=None, 2784 | fields=[ 2785 | _descriptor.FieldDescriptor( 2786 | name='key', full_name='edu.stanford.nlp.pipeline.MapIntString.key', index=0, 2787 | number=1, type=13, cpp_type=3, label=3, 2788 | has_default_value=False, default_value=[], 2789 | message_type=None, enum_type=None, containing_type=None, 2790 | is_extension=False, extension_scope=None, 2791 | options=None, file=DESCRIPTOR), 2792 | _descriptor.FieldDescriptor( 2793 | name='value', full_name='edu.stanford.nlp.pipeline.MapIntString.value', index=1, 2794 | number=2, type=9, cpp_type=9, label=3, 2795 | has_default_value=False, default_value=[], 2796 | message_type=None, enum_type=None, containing_type=None, 2797 | is_extension=False, extension_scope=None, 2798 | options=None, file=DESCRIPTOR), 2799 | ], 2800 | extensions=[ 2801 | ], 2802 | nested_types=[], 2803 | enum_types=[ 2804 | ], 2805 | options=None, 2806 | is_extendable=False, 2807 | syntax='proto2', 2808 | extension_ranges=[], 2809 | oneofs=[ 2810 | ], 2811 | serialized_start=9023, 2812 | serialized_end=9065, 2813 | ) 2814 | 2815 | 2816 | _SECTION = _descriptor.Descriptor( 2817 | name='Section', 2818 | full_name='edu.stanford.nlp.pipeline.Section', 2819 | filename=None, 2820 | file=DESCRIPTOR, 2821 | containing_type=None, 2822 | fields=[ 2823 | _descriptor.FieldDescriptor( 2824 | name='charBegin', full_name='edu.stanford.nlp.pipeline.Section.charBegin', index=0, 2825 | number=1, type=13, cpp_type=3, label=2, 2826 | has_default_value=False, default_value=0, 2827 | message_type=None, enum_type=None, containing_type=None, 2828 | is_extension=False, extension_scope=None, 2829 | options=None, file=DESCRIPTOR), 2830 | _descriptor.FieldDescriptor( 2831 | name='charEnd', full_name='edu.stanford.nlp.pipeline.Section.charEnd', index=1, 2832 | number=2, type=13, cpp_type=3, label=2, 2833 | has_default_value=False, default_value=0, 2834 | message_type=None, enum_type=None, containing_type=None, 2835 | is_extension=False, extension_scope=None, 2836 | options=None, file=DESCRIPTOR), 2837 | _descriptor.FieldDescriptor( 2838 | name='author', full_name='edu.stanford.nlp.pipeline.Section.author', index=2, 2839 | number=3, type=9, cpp_type=9, label=1, 2840 | has_default_value=False, default_value=_b("").decode('utf-8'), 2841 | message_type=None, enum_type=None, containing_type=None, 2842 | is_extension=False, extension_scope=None, 2843 | options=None, file=DESCRIPTOR), 2844 | _descriptor.FieldDescriptor( 2845 | name='sentenceIndexes', full_name='edu.stanford.nlp.pipeline.Section.sentenceIndexes', index=3, 2846 | number=4, type=13, cpp_type=3, label=3, 2847 | has_default_value=False, default_value=[], 2848 | message_type=None, enum_type=None, containing_type=None, 2849 | is_extension=False, extension_scope=None, 2850 | options=None, file=DESCRIPTOR), 2851 | _descriptor.FieldDescriptor( 2852 | name='datetime', full_name='edu.stanford.nlp.pipeline.Section.datetime', index=4, 2853 | number=5, type=9, cpp_type=9, label=1, 2854 | has_default_value=False, default_value=_b("").decode('utf-8'), 2855 | message_type=None, enum_type=None, containing_type=None, 2856 | is_extension=False, extension_scope=None, 2857 | options=None, file=DESCRIPTOR), 2858 | _descriptor.FieldDescriptor( 2859 | name='quotes', full_name='edu.stanford.nlp.pipeline.Section.quotes', index=5, 2860 | number=6, type=11, cpp_type=10, label=3, 2861 | has_default_value=False, default_value=[], 2862 | message_type=None, enum_type=None, containing_type=None, 2863 | is_extension=False, extension_scope=None, 2864 | options=None, file=DESCRIPTOR), 2865 | _descriptor.FieldDescriptor( 2866 | name='authorCharBegin', full_name='edu.stanford.nlp.pipeline.Section.authorCharBegin', index=6, 2867 | number=7, type=13, cpp_type=3, label=1, 2868 | has_default_value=False, default_value=0, 2869 | message_type=None, enum_type=None, containing_type=None, 2870 | is_extension=False, extension_scope=None, 2871 | options=None, file=DESCRIPTOR), 2872 | _descriptor.FieldDescriptor( 2873 | name='authorCharEnd', full_name='edu.stanford.nlp.pipeline.Section.authorCharEnd', index=7, 2874 | number=8, type=13, cpp_type=3, label=1, 2875 | has_default_value=False, default_value=0, 2876 | message_type=None, enum_type=None, containing_type=None, 2877 | is_extension=False, extension_scope=None, 2878 | options=None, file=DESCRIPTOR), 2879 | _descriptor.FieldDescriptor( 2880 | name='xmlTag', full_name='edu.stanford.nlp.pipeline.Section.xmlTag', index=8, 2881 | number=9, type=11, cpp_type=10, label=2, 2882 | has_default_value=False, default_value=None, 2883 | message_type=None, enum_type=None, containing_type=None, 2884 | is_extension=False, extension_scope=None, 2885 | options=None, file=DESCRIPTOR), 2886 | ], 2887 | extensions=[ 2888 | ], 2889 | nested_types=[], 2890 | enum_types=[ 2891 | ], 2892 | options=None, 2893 | is_extendable=False, 2894 | syntax='proto2', 2895 | extension_ranges=[], 2896 | oneofs=[ 2897 | ], 2898 | serialized_start=9068, 2899 | serialized_end=9320, 2900 | ) 2901 | 2902 | _DOCUMENT.fields_by_name['sentence'].message_type = _SENTENCE 2903 | _DOCUMENT.fields_by_name['corefChain'].message_type = _COREFCHAIN 2904 | _DOCUMENT.fields_by_name['sentencelessToken'].message_type = _TOKEN 2905 | _DOCUMENT.fields_by_name['character'].message_type = _TOKEN 2906 | _DOCUMENT.fields_by_name['quote'].message_type = _QUOTE 2907 | _DOCUMENT.fields_by_name['mentions'].message_type = _NERMENTION 2908 | _DOCUMENT.fields_by_name['sections'].message_type = _SECTION 2909 | _DOCUMENT.fields_by_name['mentionsForCoref'].message_type = _MENTION 2910 | _SENTENCE.fields_by_name['token'].message_type = _TOKEN 2911 | _SENTENCE.fields_by_name['parseTree'].message_type = _PARSETREE 2912 | _SENTENCE.fields_by_name['binarizedParseTree'].message_type = _PARSETREE 2913 | _SENTENCE.fields_by_name['annotatedParseTree'].message_type = _PARSETREE 2914 | _SENTENCE.fields_by_name['kBestParseTrees'].message_type = _PARSETREE 2915 | _SENTENCE.fields_by_name['basicDependencies'].message_type = _DEPENDENCYGRAPH 2916 | _SENTENCE.fields_by_name['collapsedDependencies'].message_type = _DEPENDENCYGRAPH 2917 | _SENTENCE.fields_by_name['collapsedCCProcessedDependencies'].message_type = _DEPENDENCYGRAPH 2918 | _SENTENCE.fields_by_name['alternativeDependencies'].message_type = _DEPENDENCYGRAPH 2919 | _SENTENCE.fields_by_name['openieTriple'].message_type = _RELATIONTRIPLE 2920 | _SENTENCE.fields_by_name['kbpTriple'].message_type = _RELATIONTRIPLE 2921 | _SENTENCE.fields_by_name['entailedSentence'].message_type = _SENTENCEFRAGMENT 2922 | _SENTENCE.fields_by_name['entailedClause'].message_type = _SENTENCEFRAGMENT 2923 | _SENTENCE.fields_by_name['enhancedDependencies'].message_type = _DEPENDENCYGRAPH 2924 | _SENTENCE.fields_by_name['enhancedPlusPlusDependencies'].message_type = _DEPENDENCYGRAPH 2925 | _SENTENCE.fields_by_name['character'].message_type = _TOKEN 2926 | _SENTENCE.fields_by_name['entity'].message_type = _ENTITY 2927 | _SENTENCE.fields_by_name['relation'].message_type = _RELATION 2928 | _SENTENCE.fields_by_name['mentions'].message_type = _NERMENTION 2929 | _SENTENCE.fields_by_name['mentionsForCoref'].message_type = _MENTION 2930 | _TOKEN.fields_by_name['timexValue'].message_type = _TIMEX 2931 | _TOKEN.fields_by_name['operator'].message_type = _OPERATOR 2932 | _TOKEN.fields_by_name['polarity'].message_type = _POLARITY 2933 | _TOKEN.fields_by_name['span'].message_type = _SPAN 2934 | _TOKEN.fields_by_name['conllUFeatures'].message_type = _MAPSTRINGSTRING 2935 | _TOKEN.fields_by_name['conllUTokenSpan'].message_type = _SPAN 2936 | _TOKEN.fields_by_name['conllUSecondaryDeps'].message_type = _MAPSTRINGSTRING 2937 | _QUOTE.fields_by_name['attributionDependencyGraph'].message_type = _DEPENDENCYGRAPH 2938 | _PARSETREE.fields_by_name['child'].message_type = _PARSETREE 2939 | _PARSETREE.fields_by_name['sentiment'].enum_type = _SENTIMENT 2940 | _DEPENDENCYGRAPH_NODE.containing_type = _DEPENDENCYGRAPH 2941 | _DEPENDENCYGRAPH_EDGE.fields_by_name['language'].enum_type = _LANGUAGE 2942 | _DEPENDENCYGRAPH_EDGE.containing_type = _DEPENDENCYGRAPH 2943 | _DEPENDENCYGRAPH.fields_by_name['node'].message_type = _DEPENDENCYGRAPH_NODE 2944 | _DEPENDENCYGRAPH.fields_by_name['edge'].message_type = _DEPENDENCYGRAPH_EDGE 2945 | _COREFCHAIN_COREFMENTION.containing_type = _COREFCHAIN 2946 | _COREFCHAIN.fields_by_name['mention'].message_type = _COREFCHAIN_COREFMENTION 2947 | _MENTION.fields_by_name['headIndexedWord'].message_type = _INDEXEDWORD 2948 | _MENTION.fields_by_name['dependingVerb'].message_type = _INDEXEDWORD 2949 | _MENTION.fields_by_name['headWord'].message_type = _INDEXEDWORD 2950 | _MENTION.fields_by_name['speakerInfo'].message_type = _SPEAKERINFO 2951 | _MENTION.fields_by_name['sentenceWords'].message_type = _INDEXEDWORD 2952 | _MENTION.fields_by_name['originalSpan'].message_type = _INDEXEDWORD 2953 | _RELATION.fields_by_name['arg'].message_type = _ENTITY 2954 | _POLARITY.fields_by_name['projectEquivalence'].enum_type = _NATURALLOGICRELATION 2955 | _POLARITY.fields_by_name['projectForwardEntailment'].enum_type = _NATURALLOGICRELATION 2956 | _POLARITY.fields_by_name['projectReverseEntailment'].enum_type = _NATURALLOGICRELATION 2957 | _POLARITY.fields_by_name['projectNegation'].enum_type = _NATURALLOGICRELATION 2958 | _POLARITY.fields_by_name['projectAlternation'].enum_type = _NATURALLOGICRELATION 2959 | _POLARITY.fields_by_name['projectCover'].enum_type = _NATURALLOGICRELATION 2960 | _POLARITY.fields_by_name['projectIndependence'].enum_type = _NATURALLOGICRELATION 2961 | _NERMENTION.fields_by_name['timex'].message_type = _TIMEX 2962 | _RELATIONTRIPLE.fields_by_name['subjectTokens'].message_type = _TOKENLOCATION 2963 | _RELATIONTRIPLE.fields_by_name['relationTokens'].message_type = _TOKENLOCATION 2964 | _RELATIONTRIPLE.fields_by_name['objectTokens'].message_type = _TOKENLOCATION 2965 | _RELATIONTRIPLE.fields_by_name['tree'].message_type = _DEPENDENCYGRAPH 2966 | _SECTION.fields_by_name['quotes'].message_type = _QUOTE 2967 | _SECTION.fields_by_name['xmlTag'].message_type = _TOKEN 2968 | DESCRIPTOR.message_types_by_name['Document'] = _DOCUMENT 2969 | DESCRIPTOR.message_types_by_name['Sentence'] = _SENTENCE 2970 | DESCRIPTOR.message_types_by_name['Token'] = _TOKEN 2971 | DESCRIPTOR.message_types_by_name['Quote'] = _QUOTE 2972 | DESCRIPTOR.message_types_by_name['ParseTree'] = _PARSETREE 2973 | DESCRIPTOR.message_types_by_name['DependencyGraph'] = _DEPENDENCYGRAPH 2974 | DESCRIPTOR.message_types_by_name['CorefChain'] = _COREFCHAIN 2975 | DESCRIPTOR.message_types_by_name['Mention'] = _MENTION 2976 | DESCRIPTOR.message_types_by_name['IndexedWord'] = _INDEXEDWORD 2977 | DESCRIPTOR.message_types_by_name['SpeakerInfo'] = _SPEAKERINFO 2978 | DESCRIPTOR.message_types_by_name['Span'] = _SPAN 2979 | DESCRIPTOR.message_types_by_name['Timex'] = _TIMEX 2980 | DESCRIPTOR.message_types_by_name['Entity'] = _ENTITY 2981 | DESCRIPTOR.message_types_by_name['Relation'] = _RELATION 2982 | DESCRIPTOR.message_types_by_name['Operator'] = _OPERATOR 2983 | DESCRIPTOR.message_types_by_name['Polarity'] = _POLARITY 2984 | DESCRIPTOR.message_types_by_name['NERMention'] = _NERMENTION 2985 | DESCRIPTOR.message_types_by_name['SentenceFragment'] = _SENTENCEFRAGMENT 2986 | DESCRIPTOR.message_types_by_name['TokenLocation'] = _TOKENLOCATION 2987 | DESCRIPTOR.message_types_by_name['RelationTriple'] = _RELATIONTRIPLE 2988 | DESCRIPTOR.message_types_by_name['MapStringString'] = _MAPSTRINGSTRING 2989 | DESCRIPTOR.message_types_by_name['MapIntString'] = _MAPINTSTRING 2990 | DESCRIPTOR.message_types_by_name['Section'] = _SECTION 2991 | DESCRIPTOR.enum_types_by_name['Language'] = _LANGUAGE 2992 | DESCRIPTOR.enum_types_by_name['Sentiment'] = _SENTIMENT 2993 | DESCRIPTOR.enum_types_by_name['NaturalLogicRelation'] = _NATURALLOGICRELATION 2994 | _sym_db.RegisterFileDescriptor(DESCRIPTOR) 2995 | 2996 | Document = _reflection.GeneratedProtocolMessageType('Document', (_message.Message,), dict( 2997 | DESCRIPTOR = _DOCUMENT, 2998 | __module__ = 'CoreNLP_pb2' 2999 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.Document) 3000 | )) 3001 | _sym_db.RegisterMessage(Document) 3002 | 3003 | Sentence = _reflection.GeneratedProtocolMessageType('Sentence', (_message.Message,), dict( 3004 | DESCRIPTOR = _SENTENCE, 3005 | __module__ = 'CoreNLP_pb2' 3006 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.Sentence) 3007 | )) 3008 | _sym_db.RegisterMessage(Sentence) 3009 | 3010 | Token = _reflection.GeneratedProtocolMessageType('Token', (_message.Message,), dict( 3011 | DESCRIPTOR = _TOKEN, 3012 | __module__ = 'CoreNLP_pb2' 3013 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.Token) 3014 | )) 3015 | _sym_db.RegisterMessage(Token) 3016 | 3017 | Quote = _reflection.GeneratedProtocolMessageType('Quote', (_message.Message,), dict( 3018 | DESCRIPTOR = _QUOTE, 3019 | __module__ = 'CoreNLP_pb2' 3020 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.Quote) 3021 | )) 3022 | _sym_db.RegisterMessage(Quote) 3023 | 3024 | ParseTree = _reflection.GeneratedProtocolMessageType('ParseTree', (_message.Message,), dict( 3025 | DESCRIPTOR = _PARSETREE, 3026 | __module__ = 'CoreNLP_pb2' 3027 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.ParseTree) 3028 | )) 3029 | _sym_db.RegisterMessage(ParseTree) 3030 | 3031 | DependencyGraph = _reflection.GeneratedProtocolMessageType('DependencyGraph', (_message.Message,), dict( 3032 | 3033 | Node = _reflection.GeneratedProtocolMessageType('Node', (_message.Message,), dict( 3034 | DESCRIPTOR = _DEPENDENCYGRAPH_NODE, 3035 | __module__ = 'CoreNLP_pb2' 3036 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.DependencyGraph.Node) 3037 | )) 3038 | , 3039 | 3040 | Edge = _reflection.GeneratedProtocolMessageType('Edge', (_message.Message,), dict( 3041 | DESCRIPTOR = _DEPENDENCYGRAPH_EDGE, 3042 | __module__ = 'CoreNLP_pb2' 3043 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.DependencyGraph.Edge) 3044 | )) 3045 | , 3046 | DESCRIPTOR = _DEPENDENCYGRAPH, 3047 | __module__ = 'CoreNLP_pb2' 3048 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.DependencyGraph) 3049 | )) 3050 | _sym_db.RegisterMessage(DependencyGraph) 3051 | _sym_db.RegisterMessage(DependencyGraph.Node) 3052 | _sym_db.RegisterMessage(DependencyGraph.Edge) 3053 | 3054 | CorefChain = _reflection.GeneratedProtocolMessageType('CorefChain', (_message.Message,), dict( 3055 | 3056 | CorefMention = _reflection.GeneratedProtocolMessageType('CorefMention', (_message.Message,), dict( 3057 | DESCRIPTOR = _COREFCHAIN_COREFMENTION, 3058 | __module__ = 'CoreNLP_pb2' 3059 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.CorefChain.CorefMention) 3060 | )) 3061 | , 3062 | DESCRIPTOR = _COREFCHAIN, 3063 | __module__ = 'CoreNLP_pb2' 3064 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.CorefChain) 3065 | )) 3066 | _sym_db.RegisterMessage(CorefChain) 3067 | _sym_db.RegisterMessage(CorefChain.CorefMention) 3068 | 3069 | Mention = _reflection.GeneratedProtocolMessageType('Mention', (_message.Message,), dict( 3070 | DESCRIPTOR = _MENTION, 3071 | __module__ = 'CoreNLP_pb2' 3072 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.Mention) 3073 | )) 3074 | _sym_db.RegisterMessage(Mention) 3075 | 3076 | IndexedWord = _reflection.GeneratedProtocolMessageType('IndexedWord', (_message.Message,), dict( 3077 | DESCRIPTOR = _INDEXEDWORD, 3078 | __module__ = 'CoreNLP_pb2' 3079 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.IndexedWord) 3080 | )) 3081 | _sym_db.RegisterMessage(IndexedWord) 3082 | 3083 | SpeakerInfo = _reflection.GeneratedProtocolMessageType('SpeakerInfo', (_message.Message,), dict( 3084 | DESCRIPTOR = _SPEAKERINFO, 3085 | __module__ = 'CoreNLP_pb2' 3086 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.SpeakerInfo) 3087 | )) 3088 | _sym_db.RegisterMessage(SpeakerInfo) 3089 | 3090 | Span = _reflection.GeneratedProtocolMessageType('Span', (_message.Message,), dict( 3091 | DESCRIPTOR = _SPAN, 3092 | __module__ = 'CoreNLP_pb2' 3093 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.Span) 3094 | )) 3095 | _sym_db.RegisterMessage(Span) 3096 | 3097 | Timex = _reflection.GeneratedProtocolMessageType('Timex', (_message.Message,), dict( 3098 | DESCRIPTOR = _TIMEX, 3099 | __module__ = 'CoreNLP_pb2' 3100 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.Timex) 3101 | )) 3102 | _sym_db.RegisterMessage(Timex) 3103 | 3104 | Entity = _reflection.GeneratedProtocolMessageType('Entity', (_message.Message,), dict( 3105 | DESCRIPTOR = _ENTITY, 3106 | __module__ = 'CoreNLP_pb2' 3107 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.Entity) 3108 | )) 3109 | _sym_db.RegisterMessage(Entity) 3110 | 3111 | Relation = _reflection.GeneratedProtocolMessageType('Relation', (_message.Message,), dict( 3112 | DESCRIPTOR = _RELATION, 3113 | __module__ = 'CoreNLP_pb2' 3114 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.Relation) 3115 | )) 3116 | _sym_db.RegisterMessage(Relation) 3117 | 3118 | Operator = _reflection.GeneratedProtocolMessageType('Operator', (_message.Message,), dict( 3119 | DESCRIPTOR = _OPERATOR, 3120 | __module__ = 'CoreNLP_pb2' 3121 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.Operator) 3122 | )) 3123 | _sym_db.RegisterMessage(Operator) 3124 | 3125 | Polarity = _reflection.GeneratedProtocolMessageType('Polarity', (_message.Message,), dict( 3126 | DESCRIPTOR = _POLARITY, 3127 | __module__ = 'CoreNLP_pb2' 3128 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.Polarity) 3129 | )) 3130 | _sym_db.RegisterMessage(Polarity) 3131 | 3132 | NERMention = _reflection.GeneratedProtocolMessageType('NERMention', (_message.Message,), dict( 3133 | DESCRIPTOR = _NERMENTION, 3134 | __module__ = 'CoreNLP_pb2' 3135 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.NERMention) 3136 | )) 3137 | _sym_db.RegisterMessage(NERMention) 3138 | 3139 | SentenceFragment = _reflection.GeneratedProtocolMessageType('SentenceFragment', (_message.Message,), dict( 3140 | DESCRIPTOR = _SENTENCEFRAGMENT, 3141 | __module__ = 'CoreNLP_pb2' 3142 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.SentenceFragment) 3143 | )) 3144 | _sym_db.RegisterMessage(SentenceFragment) 3145 | 3146 | TokenLocation = _reflection.GeneratedProtocolMessageType('TokenLocation', (_message.Message,), dict( 3147 | DESCRIPTOR = _TOKENLOCATION, 3148 | __module__ = 'CoreNLP_pb2' 3149 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.TokenLocation) 3150 | )) 3151 | _sym_db.RegisterMessage(TokenLocation) 3152 | 3153 | RelationTriple = _reflection.GeneratedProtocolMessageType('RelationTriple', (_message.Message,), dict( 3154 | DESCRIPTOR = _RELATIONTRIPLE, 3155 | __module__ = 'CoreNLP_pb2' 3156 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.RelationTriple) 3157 | )) 3158 | _sym_db.RegisterMessage(RelationTriple) 3159 | 3160 | MapStringString = _reflection.GeneratedProtocolMessageType('MapStringString', (_message.Message,), dict( 3161 | DESCRIPTOR = _MAPSTRINGSTRING, 3162 | __module__ = 'CoreNLP_pb2' 3163 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.MapStringString) 3164 | )) 3165 | _sym_db.RegisterMessage(MapStringString) 3166 | 3167 | MapIntString = _reflection.GeneratedProtocolMessageType('MapIntString', (_message.Message,), dict( 3168 | DESCRIPTOR = _MAPINTSTRING, 3169 | __module__ = 'CoreNLP_pb2' 3170 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.MapIntString) 3171 | )) 3172 | _sym_db.RegisterMessage(MapIntString) 3173 | 3174 | Section = _reflection.GeneratedProtocolMessageType('Section', (_message.Message,), dict( 3175 | DESCRIPTOR = _SECTION, 3176 | __module__ = 'CoreNLP_pb2' 3177 | # @@protoc_insertion_point(class_scope:edu.stanford.nlp.pipeline.Section) 3178 | )) 3179 | _sym_db.RegisterMessage(Section) 3180 | 3181 | 3182 | DESCRIPTOR.has_options = True 3183 | DESCRIPTOR._options = _descriptor._ParseOptions(descriptor_pb2.FileOptions(), _b('\n\031edu.stanford.nlp.pipelineB\rCoreNLPProtos')) 3184 | _DEPENDENCYGRAPH.fields_by_name['root'].has_options = True 3185 | _DEPENDENCYGRAPH.fields_by_name['root']._options = _descriptor._ParseOptions(descriptor_pb2.FieldOptions(), _b('\020\001')) 3186 | # @@protoc_insertion_point(module_scope) 3187 | -------------------------------------------------------------------------------- /corenlp_protobuf/__init__.py: -------------------------------------------------------------------------------- 1 | from __future__ import absolute_import 2 | 3 | from io import BytesIO 4 | 5 | from google.protobuf.internal.encoder import _EncodeVarint 6 | from google.protobuf.internal.decoder import _DecodeVarint 7 | from .CoreNLP_pb2 import * 8 | 9 | def parseFromDelimitedString(obj, buf, offset=0): 10 | """ 11 | Stanford CoreNLP uses the Java "writeDelimitedTo" function, which 12 | writes the size (and offset) of the buffer before writing the object. 13 | This function handles parsing this message starting from offset 0. 14 | 15 | @returns how many bytes of @buf were consumed. 16 | """ 17 | size, pos = _DecodeVarint(buf, offset) 18 | obj.ParseFromString(buf[offset+pos:offset+pos+size]) 19 | return pos+size 20 | 21 | def writeToDelimitedString(obj, stream=None): 22 | """ 23 | Stanford CoreNLP uses the Java "writeDelimitedTo" function, which 24 | writes the size (and offset) of the buffer before writing the object. 25 | This function handles parsing this message starting from offset 0. 26 | 27 | @returns how many bytes of @buf were consumed. 28 | """ 29 | if stream is None: 30 | stream = BytesIO() 31 | 32 | _EncodeVarint(stream.write, obj.ByteSize(), True) 33 | stream.write(obj.SerializeToString()) 34 | return stream 35 | 36 | def to_text(sentence): 37 | """ 38 | Helper routine that converts a Sentence protobuf to a string from 39 | its tokens. 40 | """ 41 | text = "" 42 | for i, tok in enumerate(sentence.token): 43 | if i != 0: 44 | text += tok.before 45 | text += tok.word 46 | return text 47 | -------------------------------------------------------------------------------- /doc/CoreNLP.proto: -------------------------------------------------------------------------------- 1 | package edu.stanford.nlp.pipeline; 2 | 3 | option java_package = "edu.stanford.nlp.pipeline"; 4 | option java_outer_classname = "CoreNLPProtos"; 5 | 6 | // 7 | // From JAVANLP_HOME, you can build me with the command: 8 | // 9 | // protoc -I=projects/core/src/edu/stanford/nlp/pipeline/ --java_out=projects/core/src projects/core/src/edu/stanford/nlp/pipeline/CoreNLP.proto 10 | // 11 | 12 | // 13 | // An enumeration for the valid languages allowed in CoreNLP 14 | // 15 | enum Language { 16 | Unknown = 0; 17 | Any = 1; 18 | Arabic = 2; 19 | Chinese = 3; 20 | English = 4; 21 | German = 5; 22 | French = 6; 23 | Hebrew = 7; 24 | Spanish = 8; 25 | UniversalEnglish = 9; 26 | UniversalChinese = 10; 27 | } 28 | 29 | // 30 | // A document; that is, the equivalent of an Annotation. 31 | // 32 | message Document { 33 | required string text = 1; 34 | repeated Sentence sentence = 2; 35 | repeated CorefChain corefChain = 3; 36 | optional string docID = 4; 37 | optional string docDate = 7; 38 | optional uint64 calendar = 8; 39 | 40 | /** 41 | * A peculiar field, for the corner case when a Document is 42 | * serialized without any sentences. Otherwise 43 | */ 44 | repeated Token sentencelessToken = 5; 45 | repeated Token character = 10; 46 | 47 | repeated Quote quote = 6; 48 | /** 49 | * This field is for entity mentions across the document. 50 | */ 51 | repeated NERMention mentions = 9; 52 | optional bool hasEntityMentionsAnnotation = 13; // used to differentiate between null and empty list 53 | 54 | /** 55 | * xml information 56 | */ 57 | optional bool xmlDoc = 11; 58 | repeated Section sections = 12; 59 | 60 | /** coref mentions for entire document **/ 61 | repeated Mention mentionsForCoref = 14; 62 | optional bool hasCorefMentionAnnotation = 15; 63 | optional bool hasCorefAnnotation = 16; 64 | repeated uint32 corefMentionToEntityMentionMappings = 17; 65 | repeated uint32 entityMentionToCorefMentionMappings = 18; 66 | 67 | extensions 100 to 255; 68 | } 69 | 70 | // 71 | // The serialized version of a CoreMap representing a sentence. 72 | // 73 | message Sentence { 74 | repeated Token token = 1; 75 | required uint32 tokenOffsetBegin = 2; 76 | required uint32 tokenOffsetEnd = 3; 77 | optional uint32 sentenceIndex = 4; 78 | optional uint32 characterOffsetBegin = 5; 79 | optional uint32 characterOffsetEnd = 6; 80 | optional ParseTree parseTree = 7; 81 | optional ParseTree binarizedParseTree = 31; 82 | optional ParseTree annotatedParseTree = 32; 83 | optional string sentiment = 33; 84 | repeated ParseTree kBestParseTrees = 34; 85 | optional DependencyGraph basicDependencies = 8; 86 | optional DependencyGraph collapsedDependencies = 9; 87 | optional DependencyGraph collapsedCCProcessedDependencies = 10; 88 | optional DependencyGraph alternativeDependencies = 13; 89 | repeated RelationTriple openieTriple = 14; // The OpenIE triples in the sentence 90 | repeated RelationTriple kbpTriple = 16; // The KBP triples in this sentence 91 | repeated SentenceFragment entailedSentence = 15; // The entailed sentences, by natural logic 92 | repeated SentenceFragment entailedClause = 35; // The entailed clauses, by natural logic 93 | optional DependencyGraph enhancedDependencies = 17; 94 | optional DependencyGraph enhancedPlusPlusDependencies = 18; 95 | repeated Token character = 19; 96 | 97 | optional uint32 paragraph = 11; 98 | 99 | optional string text = 12; // Only needed if we're only saving the sentence. 100 | 101 | optional uint32 lineNumber = 20; 102 | 103 | // Fields set by other annotators in CoreNLP 104 | optional bool hasRelationAnnotations = 51; 105 | repeated Entity entity = 52; 106 | repeated Relation relation = 53; 107 | optional bool hasNumerizedTokensAnnotation = 54; 108 | repeated NERMention mentions = 55; 109 | repeated Mention mentionsForCoref = 56; 110 | optional bool hasCorefMentionsAnnotation = 57; 111 | 112 | optional string sentenceID = 58; // Useful when storing sentences (e.g. ForEach) 113 | optional string sectionDate = 59; // date of section 114 | optional uint32 sectionIndex = 60; // section index for this sentence's section 115 | optional string sectionName = 61; // name of section 116 | optional string sectionAuthor = 62; // author of section 117 | optional string docID = 63; // doc id 118 | optional bool sectionQuoted = 64; // is this sentence in an xml quote in a post 119 | 120 | optional bool hasEntityMentionsAnnotation = 65; // check if there are entity mentions 121 | optional bool hasKBPTriplesAnnotation = 68; // check if there are KBP triples 122 | optional bool hasOpenieTriplesAnnotation = 69; // check if there are OpenIE triples 123 | 124 | // quote stuff 125 | optional uint32 chapterIndex = 66; 126 | optional uint32 paragraphIndex = 67; 127 | 128 | extensions 100 to 255; 129 | } 130 | 131 | // 132 | // The serialized version of a Token (a CoreLabel). 133 | // 134 | message Token { 135 | // Fields set by the default annotators [new CoreNLP(new Properties())] 136 | optional string word = 1; // the word's gloss (post-tokenization) 137 | optional string pos = 2; // The word's part of speech tag 138 | optional string value = 3; // The word's 'value', (e.g., parse tree node) 139 | optional string category = 4; // The word's 'category' (e.g., parse tree node) 140 | optional string before = 5; // The whitespace/xml before the token 141 | optional string after = 6; // The whitespace/xml after the token 142 | optional string originalText = 7; // The original text for this token 143 | optional string ner = 8; // The word's NER tag 144 | optional string coarseNER = 62; // The word's coarse NER tag 145 | optional string fineGrainedNER = 63; // The word's fine-grained NER tag 146 | optional string normalizedNER = 9; // The word's normalized NER tag 147 | optional string lemma = 10; // The word's lemma 148 | optional uint32 beginChar = 11; // The character offset begin, in the document 149 | optional uint32 endChar = 12; // The character offset end, in the document 150 | optional uint32 utterance = 13; // The utterance tag used in dcoref 151 | optional string speaker = 14; // The speaker speaking this word 152 | optional uint32 beginIndex = 15; // The begin index of, e.g., a span 153 | optional uint32 endIndex = 16; // The begin index of, e.g., a span 154 | optional uint32 tokenBeginIndex = 17; // The begin index of the token 155 | optional uint32 tokenEndIndex = 18; // The end index of the token 156 | optional Timex timexValue = 19; // The time this word refers to 157 | optional bool hasXmlContext = 21; // Used by clean xml annotator 158 | repeated string xmlContext = 22; // Used by clean xml annotator 159 | optional uint32 corefClusterID = 23; // The [primary] cluster id for this token 160 | optional string answer = 24; // A temporary annotation which is occasionally left in 161 | // optional string projectedCategory = 25; // The syntactic category of the maximal constituent headed by the word. Not used anywhere, so deleted. 162 | optional uint32 headWordIndex = 26; // The index of the head word of this word. 163 | optional Operator operator = 27; // If this is an operator, which one is it and what is its scope (as per Natural Logic)? 164 | optional Polarity polarity = 28; // The polarity of this word, according to Natural Logic 165 | optional string polarity_dir = 39; // The polarity of this word, either "up", "down", or "flat" 166 | optional Span span = 29; // The span of a leaf node of a tree 167 | optional string sentiment = 30; // The final sentiment of the sentence 168 | optional int32 quotationIndex = 31; // The index of the quotation this token refers to 169 | optional MapStringString conllUFeatures = 32; 170 | optional string coarseTag = 33; // The coarse POS tag (used to store the UPOS tag) 171 | optional Span conllUTokenSpan = 34; 172 | optional string conllUMisc = 35; 173 | optional MapStringString conllUSecondaryDeps = 36; 174 | optional string wikipediaEntity = 37; 175 | optional bool isNewline = 38; 176 | 177 | 178 | // Fields set by other annotators in CoreNLP 179 | optional string gender = 51; // gender annotation (machine reading) 180 | optional string trueCase = 52; // true case type of token 181 | optional string trueCaseText = 53; // true case gloss of token 182 | 183 | // Chinese character info 184 | optional string chineseChar = 54; 185 | optional string chineseSeg = 55; 186 | optional string chineseXMLChar = 60; 187 | 188 | // Section info 189 | optional string sectionName = 56; 190 | optional string sectionAuthor = 57; 191 | optional string sectionDate = 58; 192 | optional string sectionEndLabel = 59; 193 | 194 | // French tokens have parents 195 | optional string parent = 61; 196 | 197 | // mention index info 198 | repeated uint32 corefMentionIndex = 64; 199 | optional uint32 entityMentionIndex = 65; 200 | 201 | // Fields in the CoreLabel java class that are moved elsewhere 202 | // string text @see Document#text + character offsets 203 | // uint32 sentenceIndex @see Sentence#sentenceIndex 204 | // string docID @see Document#docID 205 | // uint32 index @see implicit in Sentence 206 | // uint32 paragraph @see Sentence#paragraph 207 | 208 | extensions 100 to 255; 209 | } 210 | 211 | // 212 | // An enumeration of valid sentiment values for the sentiment classifier. 213 | // 214 | enum Sentiment { 215 | STRONG_NEGATIVE = 0; 216 | WEAK_NEGATIVE = 1; 217 | NEUTRAL = 2; 218 | WEAK_POSITIVE = 3; 219 | STRONG_POSITIVE = 4; 220 | } 221 | 222 | // 223 | // A quotation marker in text 224 | // 225 | message Quote { 226 | optional string text = 1; 227 | optional uint32 begin = 2; 228 | optional uint32 end = 3; 229 | optional uint32 sentenceBegin = 5; 230 | optional uint32 sentenceEnd = 6; 231 | optional uint32 tokenBegin = 7; 232 | optional uint32 tokenEnd = 8; 233 | optional string docid = 9; 234 | optional uint32 index = 10; 235 | optional string author = 11; 236 | optional string mention = 12; 237 | optional uint32 mentionBegin = 13; 238 | optional uint32 mentionEnd = 14; 239 | optional string mentionType = 15; 240 | optional string mentionSieve = 16; 241 | optional string speaker = 17; 242 | optional string speakerSieve = 18; 243 | optional string canonicalMention = 19; 244 | optional uint32 canonicalMentionBegin = 20; 245 | optional uint32 canonicalMentionEnd = 21; 246 | optional DependencyGraph attributionDependencyGraph = 22; 247 | } 248 | 249 | // 250 | // A syntactic parse tree, with scores. 251 | // 252 | message ParseTree { 253 | repeated ParseTree child = 1; 254 | optional string value = 2; 255 | optional uint32 yieldBeginIndex = 3; 256 | optional uint32 yieldEndIndex = 4; 257 | optional double score = 5; 258 | optional Sentiment sentiment = 6; 259 | } 260 | 261 | // 262 | // A dependency graph representation. 263 | // 264 | message DependencyGraph { 265 | message Node { 266 | required uint32 sentenceIndex = 1; 267 | required uint32 index = 2; 268 | optional uint32 copyAnnotation = 3; 269 | } 270 | 271 | message Edge { 272 | required uint32 source = 1; 273 | required uint32 target = 2; 274 | optional string dep = 3; 275 | optional bool isExtra = 4; 276 | optional uint32 sourceCopy = 5; 277 | optional uint32 targetCopy = 6; 278 | optional Language language = 7 [default=Unknown]; 279 | } 280 | 281 | repeated Node node = 1; 282 | repeated Edge edge = 2; 283 | repeated uint32 root = 3 [packed=true]; 284 | } 285 | 286 | // 287 | // A coreference chain. 288 | // These fields are not *really* optional. CoreNLP will crash without them. 289 | // 290 | message CorefChain { 291 | message CorefMention { 292 | optional int32 mentionID = 1; 293 | optional string mentionType = 2; 294 | optional string number = 3; 295 | optional string gender = 4; 296 | optional string animacy = 5; 297 | optional uint32 beginIndex = 6; 298 | optional uint32 endIndex = 7; 299 | optional uint32 headIndex = 9; 300 | optional uint32 sentenceIndex = 10; 301 | optional uint32 position = 11; // the second element of position 302 | } 303 | 304 | required int32 chainID = 1; 305 | repeated CorefMention mention = 2; 306 | required uint32 representative = 3; 307 | } 308 | 309 | // 310 | // a mention 311 | // 312 | 313 | message Mention { 314 | optional int32 mentionID = 1; 315 | optional string mentionType = 2; 316 | optional string number = 3; 317 | optional string gender = 4; 318 | optional string animacy = 5; 319 | optional string person = 6; 320 | optional uint32 startIndex = 7; 321 | optional uint32 endIndex = 9; 322 | optional uint32 headIndex = 10; 323 | optional string headString = 11; 324 | optional string nerString = 12; 325 | optional uint32 originalRef = 13; 326 | optional int32 goldCorefClusterID = 14; 327 | optional int32 corefClusterID = 15; 328 | optional uint32 mentionNum = 16; 329 | optional uint32 sentNum = 17; 330 | optional uint32 utter = 18; 331 | optional uint32 paragraph = 19; 332 | optional bool isSubject = 20; 333 | optional bool isDirectObject = 21; 334 | optional bool isIndirectObject = 22; 335 | optional bool isPrepositionObject = 23; 336 | optional bool hasTwin = 24; 337 | optional bool generic = 25; 338 | optional bool isSingleton = 26; 339 | optional bool hasBasicDependency = 27; 340 | optional bool hasEnhancedDepenedncy = 28; 341 | optional bool hasContextParseTree = 29; 342 | optional IndexedWord headIndexedWord = 30; 343 | optional IndexedWord dependingVerb = 31; 344 | optional IndexedWord headWord = 32; 345 | optional SpeakerInfo speakerInfo = 33; 346 | 347 | repeated IndexedWord sentenceWords = 50; 348 | repeated IndexedWord originalSpan = 51; 349 | repeated string dependents = 52; 350 | repeated string preprocessedTerms = 53; 351 | repeated int32 appositions = 54; 352 | repeated int32 predicateNominatives = 55; 353 | repeated int32 relativePronouns = 56; 354 | repeated int32 listMembers = 57; 355 | repeated int32 belongToLists = 58; 356 | 357 | } 358 | 359 | // 360 | // store the position (sentence, token index) of a CoreLabel 361 | // 362 | 363 | message IndexedWord { 364 | optional uint32 sentenceNum = 1; 365 | optional uint32 tokenIndex = 2; 366 | optional uint32 docID = 3; 367 | optional uint32 copyCount = 4; 368 | } 369 | 370 | // 371 | // speaker info, this is used for Mentions 372 | // 373 | 374 | message SpeakerInfo { 375 | optional string speakerName = 1; 376 | repeated int32 mentions = 2; 377 | } 378 | 379 | // 380 | // A Span of text 381 | // 382 | message Span { 383 | required uint32 begin = 1; 384 | required uint32 end = 2; 385 | } 386 | 387 | // 388 | // A Timex object, representing a temporal expression (TIMe EXpression) 389 | // These fields are not *really* optional. CoreNLP will crash without them. 390 | // 391 | message Timex { 392 | optional string value = 1; 393 | optional string altValue = 2; 394 | optional string text = 3; 395 | optional string type = 4; 396 | optional string tid = 5; 397 | optional uint32 beginPoint = 6; 398 | optional uint32 endPoint = 7; 399 | } 400 | 401 | // 402 | // A representation of an entity in a relation. 403 | // This corresponds to the EntityMention, and more broadly the 404 | // ExtractionObject classes. 405 | // 406 | message Entity { 407 | optional uint32 headStart = 6; 408 | optional uint32 headEnd = 7; 409 | optional string mentionType = 8; 410 | optional string normalizedName = 9; 411 | optional uint32 headTokenIndex = 10; 412 | optional string corefID = 11; 413 | // inherited from ExtractionObject 414 | optional string objectID = 1; 415 | optional uint32 extentStart = 2; 416 | optional uint32 extentEnd = 3; 417 | optional string type = 4; 418 | optional string subtype = 5; 419 | // Implicit 420 | // uint32 sentence @see implicit in sentence 421 | } 422 | 423 | // 424 | // A representation of a relation, mirroring RelationMention 425 | // 426 | message Relation { 427 | repeated string argName = 6; 428 | repeated Entity arg = 7; 429 | optional string signature = 8; 430 | // inherited from ExtractionObject 431 | optional string objectID = 1; 432 | optional uint32 extentStart = 2; 433 | optional uint32 extentEnd = 3; 434 | optional string type = 4; 435 | optional string subtype = 5; 436 | // Implicit 437 | // uint32 sentence @see implicit in sentence 438 | } 439 | 440 | // 441 | // A Natural Logic operator 442 | // 443 | message Operator { 444 | required string name = 1; 445 | required int32 quantifierSpanBegin = 2; 446 | required int32 quantifierSpanEnd = 3; 447 | required int32 subjectSpanBegin = 4; 448 | required int32 subjectSpanEnd = 5; 449 | required int32 objectSpanBegin = 6; 450 | required int32 objectSpanEnd = 7; 451 | } 452 | 453 | // 454 | // The seven informative Natural Logic relations 455 | // 456 | enum NaturalLogicRelation { 457 | EQUIVALENCE = 0; 458 | FORWARD_ENTAILMENT = 1; 459 | REVERSE_ENTAILMENT = 2; 460 | NEGATION = 3; 461 | ALTERNATION = 4; 462 | COVER = 5; 463 | INDEPENDENCE = 6; 464 | } 465 | 466 | // 467 | // The polarity of a word, according to Natural Logic 468 | // 469 | message Polarity { 470 | required NaturalLogicRelation projectEquivalence = 1; 471 | required NaturalLogicRelation projectForwardEntailment = 2; 472 | required NaturalLogicRelation projectReverseEntailment = 3; 473 | required NaturalLogicRelation projectNegation = 4; 474 | required NaturalLogicRelation projectAlternation = 5; 475 | required NaturalLogicRelation projectCover = 6; 476 | required NaturalLogicRelation projectIndependence = 7; 477 | } 478 | 479 | // 480 | // An NER mention in the text 481 | // 482 | message NERMention { 483 | optional uint32 sentenceIndex = 1; 484 | required uint32 tokenStartInSentenceInclusive = 2; 485 | required uint32 tokenEndInSentenceExclusive = 3; 486 | required string ner = 4; 487 | optional string normalizedNER = 5; 488 | optional string entityType = 6; 489 | optional Timex timex = 7; 490 | optional string wikipediaEntity = 8; 491 | optional string gender = 9; 492 | optional uint32 entityMentionIndex = 10; 493 | optional uint32 canonicalEntityMentionIndex = 11; 494 | optional string entityMentionText = 12; 495 | } 496 | 497 | // 498 | // An entailed sentence fragment. 499 | // Created by the openie annotator. 500 | // 501 | message SentenceFragment { 502 | repeated uint32 tokenIndex = 1; 503 | optional uint32 root = 2; 504 | optional bool assumedTruth = 3; 505 | optional double score = 4; 506 | } 507 | 508 | 509 | // 510 | // The index of a token in a document, including the sentence 511 | // index and the offset. 512 | // 513 | message TokenLocation { 514 | optional uint32 sentenceIndex = 1; 515 | optional uint32 tokenIndex = 2; 516 | 517 | } 518 | 519 | 520 | // 521 | // An OpenIE relation triple. 522 | // Created by the openie annotator. 523 | // 524 | message RelationTriple { 525 | optional string subject = 1; // The surface form of the subject 526 | optional string relation = 2; // The surface form of the relation (required) 527 | optional string object = 3; // The surface form of the object 528 | optional double confidence = 4; // The [optional] confidence of the extraction 529 | repeated TokenLocation subjectTokens = 13; // The tokens comprising the subject of the triple 530 | repeated TokenLocation relationTokens = 14; // The tokens comprising the relation of the triple 531 | repeated TokenLocation objectTokens = 15; // The tokens comprising the object of the triple 532 | optional DependencyGraph tree = 8; // The dependency graph fragment for this triple 533 | optional bool istmod = 9; // If true, this expresses an implicit tmod relation 534 | optional bool prefixBe = 10; // If true, this relation string is missing a 'be' prefix 535 | optional bool suffixBe = 11; // If true, this relation string is missing a 'be' suffix 536 | optional bool suffixOf = 12; // If true, this relation string is missing a 'of' prefix 537 | } 538 | 539 | 540 | // 541 | // A map from strings to strings. 542 | // Used, minimally, in the CoNLLU featurizer 543 | // 544 | message MapStringString { 545 | repeated string key = 1; 546 | repeated string value = 2; 547 | } 548 | 549 | // 550 | // A map from integers to strings. 551 | // Used, minimally, in the CoNLLU featurizer 552 | // 553 | message MapIntString { 554 | repeated uint32 key = 1; 555 | repeated string value = 2; 556 | } 557 | 558 | // 559 | // Store section info 560 | // 561 | 562 | message Section { 563 | required uint32 charBegin = 1; 564 | required uint32 charEnd = 2; 565 | optional string author = 3; 566 | repeated uint32 sentenceIndexes = 4; 567 | optional string datetime = 5; 568 | repeated Quote quotes = 6; 569 | optional uint32 authorCharBegin = 7; 570 | optional uint32 authorCharEnd = 8; 571 | required Token xmlTag = 9; 572 | } 573 | 574 | -------------------------------------------------------------------------------- /setup.cfg: -------------------------------------------------------------------------------- 1 | [bdist_wheel] 2 | # This flag says that the code is written to work on both Python 2 and Python 3 | # 3. If at all possible, it is good practice to do this. If you cannot, you 4 | # will need to generate wheels for each Python version that you support. 5 | universal=1 6 | -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- 1 | """A setuptools based setup module. 2 | 3 | See: 4 | https://packaging.python.org/en/latest/distributing.html 5 | https://github.com/pypa/sampleproject 6 | """ 7 | 8 | from os import path 9 | # Always prefer setuptools over distutils 10 | from setuptools import setup, find_packages 11 | # To use a consistent encoding 12 | from codecs import open 13 | 14 | here = path.abspath(path.dirname(__file__)) 15 | 16 | # Get the long description from the README file 17 | with open(path.join(here, 'README.rst'), encoding='utf-8') as f: 18 | long_description = f.read() 19 | 20 | setup( 21 | name='corenlp-protobuf', 22 | 23 | # Versions should comply with PEP440. For a discussion on single-sourcing 24 | # the version across setup.py and the project code, see 25 | # https://packaging.python.org/en/latest/single_source_version.html 26 | version='3.9.1', 27 | 28 | description='Python bindings for Stanford CoreNLP protobufs', 29 | long_description=long_description, 30 | 31 | # The project's main homepage. 32 | url='https://github.com/stanfordnlp/python-corenlp-protobuf', 33 | 34 | # Author details 35 | author='Stanford NLP Group', 36 | author_email='chaganty@cs.stanford.edu', 37 | 38 | # Choose your license 39 | license='MIT', 40 | 41 | # See https://pypi.python.org/pypi?%3Aaction=list_classifiers 42 | classifiers=[ 43 | # How mature is this project? Common values are 44 | # 3 - Alpha 45 | # 4 - Beta 46 | # 5 - Production/Stable 47 | 'Development Status :: 5 - Production/Stable', 48 | 49 | # Indicate who your project is intended for 50 | 'Intended Audience :: Developers', 51 | 'Topic :: Software Development :: Object Brokering', 52 | 53 | # Pick your license as you wish (should match "license" above) 54 | 'License :: OSI Approved :: MIT License', 55 | 56 | # Specify the Python versions you support here. In particular, ensure 57 | # that you indicate whether you support Python 2, Python 3 or both. 58 | 'Programming Language :: Python :: 2', 59 | 'Programming Language :: Python :: 2.7', 60 | 'Programming Language :: Python :: 3', 61 | 'Programming Language :: Python :: 3.3', 62 | 'Programming Language :: Python :: 3.4', 63 | 'Programming Language :: Python :: 3.5', 64 | ], 65 | 66 | # What does your project relate to? 67 | keywords='protobuf corenlp natural-language-processing nlp', 68 | 69 | # You can just specify the packages manually here if your project is 70 | # simple. Or you can use find_packages(). 71 | packages=find_packages(exclude=['contrib', 'docs', 'tests']), 72 | 73 | # Alternatively, if you want to distribute just a my_module.py, uncomment 74 | # this: 75 | #py_modules=["corenlp_protobuf"], 76 | 77 | # List run-time dependencies here. These will be installed by pip when 78 | # your project is installed. For an analysis of "install_requires" vs pip's 79 | # requirements files see: 80 | # https://packaging.python.org/en/latest/requirements.html 81 | install_requires=['protobuf'], 82 | 83 | # List additional groups of dependencies here (e.g. development 84 | # dependencies). You can install these using the following syntax, 85 | # for example: 86 | # $ pip install -e .[dev,test] 87 | extras_require={ 88 | 'dev': ['check-manifest'], 89 | 'test': ['coverage'], 90 | }, 91 | 92 | # If there are data files included in your packages that need to be 93 | # installed, specify them here. If using Python 2.6 or less, then these 94 | # have to be included in MANIFEST.in as well. 95 | package_data={ 96 | }, 97 | 98 | # Although 'package_data' is the preferred approach, in some case you may 99 | # need to place data files outside of your packages. See: 100 | # http://docs.python.org/3.4/distutils/setupscript.html#installing-additional-files # noqa 101 | # In this case, 'data_file' will be installed into '/my_data' 102 | data_files=[], 103 | 104 | # To provide executable scripts, use entry points in preference to the 105 | # "scripts" keyword. Entry points provide cross-platform support and allow 106 | # pip to create the appropriate form of executable for the target platform. 107 | entry_points={ 108 | }, 109 | ) 110 | -------------------------------------------------------------------------------- /tests/__init__.py: -------------------------------------------------------------------------------- 1 | # the inclusion of the tests module is not meant to offer best practices for 2 | # testing in general, but rather to support the `find_packages` example in 3 | # setup.py that excludes installing the "tests" package 4 | -------------------------------------------------------------------------------- /tests/data/test.dat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stanfordnlp/python-corenlp-protobuf/508284aa16afaedba57e0e18dd82ebb6ec63101a/tests/data/test.dat -------------------------------------------------------------------------------- /tests/test_read.py: -------------------------------------------------------------------------------- 1 | """ 2 | Tests to read a stored protobuf. 3 | Also serves as an example of how to parse sentences, tokens, pos, lemma, 4 | ner, dependencies and mentions. 5 | 6 | The test corresponds to annotations for the following sentence: 7 | Chris wrote a simple sentence that he parsed with Stanford CoreNLP. 8 | """ 9 | 10 | import os 11 | from pytest import fixture 12 | from corenlp_protobuf import Document, Sentence, Token, DependencyGraph,\ 13 | CorefChain 14 | from corenlp_protobuf import parseFromDelimitedString, writeToDelimitedString, to_text 15 | 16 | 17 | # Thext that was annotated 18 | TEXT = "Chris wrote a simple sentence that he parsed with Stanford CoreNLP.\n" 19 | 20 | 21 | @fixture 22 | def doc_pb(): 23 | test_dir = os.path.dirname(os.path.abspath(__file__)) 24 | test_data = os.path.join(test_dir, 'data', 'test.dat') 25 | with open(test_data, 'rb') as f: 26 | buf = f.read() 27 | doc = Document() 28 | parseFromDelimitedString(doc, buf) 29 | return doc 30 | 31 | def test_parse_protobuf(doc_pb): 32 | assert doc_pb.ByteSize() == 4239 33 | 34 | def test_write_protobuf(doc_pb): 35 | stream = writeToDelimitedString(doc_pb) 36 | buf = stream.getvalue() 37 | stream.close() 38 | 39 | doc_pb_ = Document() 40 | parseFromDelimitedString(doc_pb_, buf) 41 | assert doc_pb == doc_pb_ 42 | 43 | def test_document_text(doc_pb): 44 | assert doc_pb.text == TEXT 45 | 46 | 47 | def test_sentences(doc_pb): 48 | assert len(doc_pb.sentence) == 1 49 | 50 | sentence = doc_pb.sentence[0] 51 | assert isinstance(sentence, Sentence) 52 | # check sentence length 53 | assert sentence.characterOffsetEnd - sentence.characterOffsetBegin == 67 54 | # Note that the sentence text should actually be recovered from the tokens. 55 | assert sentence.text == '' 56 | assert to_text(sentence) == TEXT[:-1] 57 | 58 | 59 | def test_tokens(doc_pb): 60 | sentence = doc_pb.sentence[0] 61 | tokens = sentence.token 62 | assert len(tokens) == 12 63 | assert isinstance(tokens[0], Token) 64 | 65 | # Word 66 | words = "Chris wrote a simple sentence that he parsed with Stanford CoreNLP .".split() 67 | words_ = [t.word for t in tokens] 68 | assert words_ == words 69 | 70 | # Lemma 71 | lemmas = "Chris write a simple sentence that he parse with Stanford CoreNLP .".split() 72 | lemmas_ = [t.lemma for t in tokens] 73 | assert lemmas_ == lemmas 74 | 75 | # POS 76 | pos = "NNP VBD DT JJ NN IN PRP VBD IN NNP NNP .".split() 77 | pos_ = [t.pos for t in tokens] 78 | assert pos_ == pos 79 | 80 | # NER 81 | ner = "PERSON O O O O O O O O ORGANIZATION O O".split() 82 | ner_ = [t.ner for t in tokens] 83 | assert ner_ == ner 84 | 85 | # character offsets 86 | begin = [int(i) for i in "0 6 12 14 21 30 35 38 45 50 59 66".split()] 87 | end = [int(i) for i in "5 11 13 20 29 34 37 44 49 58 66 67".split()] 88 | begin_ = [t.beginChar for t in tokens] 89 | end_ = [t.endChar for t in tokens] 90 | assert begin_ == begin 91 | assert end_ == end 92 | 93 | 94 | def test_dependency_parse(doc_pb): 95 | """ 96 | Extract the dependency parse from the annotation. 97 | """ 98 | sentence = doc_pb.sentence[0] 99 | 100 | # You can choose from the following types of dependencies. 101 | # In general, you'll want enhancedPlusPlus 102 | assert sentence.basicDependencies.ByteSize() > 0 103 | assert sentence.enhancedDependencies.ByteSize() > 0 104 | assert sentence.enhancedPlusPlusDependencies.ByteSize() > 0 105 | 106 | tree = sentence.enhancedPlusPlusDependencies 107 | isinstance(tree, DependencyGraph) 108 | # Indices are 1-indexd with 0 being the "pseudo root" 109 | assert tree.root # 'wrote' is the root. == [2] 110 | # There are as many nodes as there are tokens. 111 | assert len(tree.node) == len(sentence.token) 112 | 113 | # Enhanced++ depdencies often contain additional edges and are 114 | # not trees -- here, 'parsed' would also have an edge to 115 | # 'sentence' 116 | assert len(tree.edge) == 12 117 | 118 | # This edge goes from "wrote" to "Chirs" 119 | edge = tree.edge[0] 120 | assert edge.source == 2 121 | assert edge.target == 1 122 | assert edge.dep == "nsubj" 123 | 124 | 125 | def test_coref_chain(doc_pb): 126 | """ 127 | Extract the corefence chains from the annotation. 128 | """ 129 | # Coreference chains span sentences and are stored in the 130 | # document. 131 | chains = doc_pb.corefChain 132 | 133 | # In this document there is 1 chain with Chris and he. 134 | assert len(chains) == 1 135 | chain = chains[0] 136 | assert isinstance(chain, CorefChain) 137 | assert chain.mention[0].beginIndex == 0 # 'Chris' 138 | assert chain.mention[0].endIndex == 1 139 | assert chain.mention[0].gender == "MALE" 140 | 141 | assert chain.mention[1].beginIndex == 6 # 'he' 142 | assert chain.mention[1].endIndex == 7 143 | assert chain.mention[1].gender == "MALE" 144 | 145 | assert chain.representative == 0 # Head of the chain is 'Chris' 146 | -------------------------------------------------------------------------------- /tox.ini: -------------------------------------------------------------------------------- 1 | # this file is *not* meant to cover or endorse the use of tox or pytest or 2 | # testing in general, 3 | # 4 | # It's meant to show the use of: 5 | # 6 | # - check-manifest 7 | # confirm items checked into vcs are in your sdist 8 | # - python setup.py check (using the readme_renderer extension) 9 | # confirms your long_description will render correctly on pypi 10 | # 11 | # and also to help confirm pull requests to this project. 12 | 13 | [tox] 14 | envlist = py{27,33,35} 15 | 16 | [testenv] 17 | basepython = 18 | py27: python2.7 19 | py33: python3.3 20 | py35: python3.5 21 | deps = 22 | check-manifest 23 | readme_renderer 24 | pytest 25 | protobuf 26 | commands = 27 | check-manifest --ignore tox.ini,tests* 28 | python setup.py check -m -r -s 29 | py.test tests 30 | [flake8] 31 | exclude = .tox,*.egg,build,data 32 | select = E,W,F 33 | --------------------------------------------------------------------------------