from ucrel_api.ucrel_token import UCREL_Token

# Ten example tokens covering the two sentences of the sample text.
# NOTE(review): only the first token passes `pos_tag`/`usas_tag` by keyword.
# The rendered output and JSON further down show the positional arguments of
# the remaining tokens being stored as lemma and POS tag (e.g. 'how' is shown
# as "Lemma: RRQ  POS tag: Z5" with a null usas_tag) -- confirm whether
# keyword arguments were intended for every token.
DOC_TOKENS = [UCREL_Token('hello', pos_tag='UH', usas_tag='Z4'), 
              UCREL_Token('how', 'RRQ', 'Z5'), 
              UCREL_Token('are', 'VBR', 'A3+'), UCREL_Token('you', 'PPY', 'Z8mf'),
              UCREL_Token('.', '.', None), UCREL_Token('I', 'PPIS1', 'Z8mf'),
              UCREL_Token('am', 'VBM', 'A3+'), UCREL_Token('great', 'JJ', 'A5.1+'),
              UCREL_Token('thanks', 'NN2', 'S1.2.4+'), UCREL_Token('.', '.', None)]

# Build the example document from the raw text, the token list, and one
# index pair per sentence; the printed sentences below show that (0,5) covers
# tokens 0-4 and (5,10) covers tokens 5-9.
example_doc = UCREL_Doc(text='hello how are you. I am great thanks.',
                        tokens=DOC_TOKENS, sentence_indexes=[(0,5), (5,10)])

# Displaying the document shows its repr: the sentence count followed by the
# first three tokens.
example_doc

UCREL Doc (2 sentences):
First 3 tokens:
UCREL Token: hello	POS tag: UH	USAS tag: Z4
UCREL Token: how	Lemma: RRQ	POS tag: Z5
UCREL Token: are	Lemma: VBR	POS tag: A3+

# Walk the document sentence by sentence and print every token of each one
# under a "Sentence N:" heading.
for index, sentence in enumerate(example_doc.sentences):
    print(f'Sentence {index}:')
    for token in sentence:
        print(f'{token}')
    if index == 0:
        # Blank lines after the first sentence to separate it from the second.
        print('\n')

Sentence 0:
UCREL Token: hello	POS tag: UH	USAS tag: Z4
UCREL Token: how	Lemma: RRQ	POS tag: Z5
UCREL Token: are	Lemma: VBR	POS tag: A3+
UCREL Token: you	Lemma: PPY	POS tag: Z8mf
UCREL Token: .	Lemma: .


Sentence 1:
UCREL Token: I	Lemma: PPIS1	POS tag: Z8mf
UCREL Token: am	Lemma: VBM	POS tag: A3+
UCREL Token: great	Lemma: JJ	POS tag: A5.1+
UCREL Token: thanks	Lemma: NN2	POS tag: S1.2.4+
UCREL Token: .	Lemma: .

# Iterating over the document itself yields its tokens in order, running
# straight across the sentence boundary (see the ten numbered lines below).
for index, token in enumerate(example_doc):
    print(f'{index} {token}')

0 UCREL Token: hello	POS tag: UH	USAS tag: Z4
1 UCREL Token: how	Lemma: RRQ	POS tag: Z5
2 UCREL Token: are	Lemma: VBR	POS tag: A3+
3 UCREL Token: you	Lemma: PPY	POS tag: Z8mf
4 UCREL Token: .	Lemma: .
5 UCREL Token: I	Lemma: PPIS1	POS tag: Z8mf
6 UCREL Token: am	Lemma: VBM	POS tag: A3+
7 UCREL Token: great	Lemma: JJ	POS tag: A5.1+
8 UCREL Token: thanks	Lemma: NN2	POS tag: S1.2.4+
9 UCREL Token: .	Lemma: .

# Indexing returns a single token; a negative index counts from the end, so
# -2 is the second-to-last token ('thanks').
example_doc[-2]

UCREL Token: thanks	Lemma: NN2	POS tag: S1.2.4+

# len() reports the number of tokens in the document (10 here), not the
# number of sentences.
len(example_doc)

10

# A document built from the same text, tokens and sentence indexes compares
# equal to example_doc.
assert example_doc == UCREL_Doc(text='hello how are you. I am great thanks.',
                                tokens=DOC_TOKENS, 
                                sentence_indexes=[(0,5), (5,10)])

# Omitting sentence_indexes produces a document that compares unequal to
# example_doc, even though the text and tokens are the same.
example_without_sent_indexes = UCREL_Doc(text='hello how are you. I am great thanks.',
                                         tokens=DOC_TOKENS)
assert example_doc != example_without_sent_indexes

# Compare a plain dict holding the same fields against the document. The
# output below shows the except branch running, i.e. the comparison raises
# NotImplementedError rather than evaluating to False.
try:
    {'text': 'hello how are you. I am great thanks.', 
     'tokens': DOC_TOKENS, 'sentence_indexes': [(0,5), (5,10)]} == example_doc
except NotImplementedError:
    print('UCREL_Doc instances can only be compared '
          'with other UCREL_Doc instances:')

UCREL_Doc instances can only be compared with other UCREL_Doc instances:

# Serialise the document to a JSON string containing the text, every token's
# fields, and the sentence indexes.
example_doc.to_json()

'{"text": "hello how are you. I am great thanks.", "tokens": [{"text": "hello", "lemma": null, "pos_tag": "UH", "usas_tag": "Z4", "mwe_tag": null}, {"text": "how", "lemma": "RRQ", "pos_tag": "Z5", "usas_tag": null, "mwe_tag": null}, {"text": "are", "lemma": "VBR", "pos_tag": "A3+", "usas_tag": null, "mwe_tag": null}, {"text": "you", "lemma": "PPY", "pos_tag": "Z8mf", "usas_tag": null, "mwe_tag": null}, {"text": ".", "lemma": ".", "pos_tag": null, "usas_tag": null, "mwe_tag": null}, {"text": "I", "lemma": "PPIS1", "pos_tag": "Z8mf", "usas_tag": null, "mwe_tag": null}, {"text": "am", "lemma": "VBM", "pos_tag": "A3+", "usas_tag": null, "mwe_tag": null}, {"text": "great", "lemma": "JJ", "pos_tag": "A5.1+", "usas_tag": null, "mwe_tag": null}, {"text": "thanks", "lemma": "NN2", "pos_tag": "S1.2.4+", "usas_tag": null, "mwe_tag": null}, {"text": ".", "lemma": ".", "pos_tag": null, "usas_tag": null, "mwe_tag": null}], "sentence_indexes": [[0, 5], [5, 10]]}'

Static Methods

# Round trip: serialise the document to JSON, then rebuild a document from
# that string with from_json and display it.
example_doc_json_string = example_doc.to_json()
another_example_doc = UCREL_Doc.from_json(example_doc_json_string)
another_example_doc

UCREL Doc (2 sentences):
First 3 tokens:
UCREL Token: hello	POS tag: UH	USAS tag: Z4
UCREL Token: how	Lemma: RRQ	POS tag: Z5
UCREL Token: are	Lemma: VBR	POS tag: A3+

# The document rebuilt from JSON compares equal to the original.
example_doc == another_example_doc

True

UCREL Doc

`class` `UCREL_Doc`[source]

`UCREL_Doc.__init__`[source]

`UCREL_Doc.__repr__`[source]

`UCREL_Doc.sentences`[source]

`UCREL_Doc.__iter__`[source]

`UCREL_Doc.__getitem__`[source]

`UCREL_Doc.__len__`[source]

`UCREL_Doc.__eq__`[source]

`UCREL_Doc.to_json`[source]

Static Methods

`UCREL_Doc.from_json`[source]

UCREL Doc

class UCREL_Doc[source]

UCREL_Doc.__init__[source]

UCREL_Doc.__repr__[source]

UCREL_Doc.sentences[source]

UCREL_Doc.__iter__[source]

UCREL_Doc.__getitem__[source]

UCREL_Doc.__len__[source]

UCREL_Doc.__eq__[source]

UCREL_Doc.to_json[source]

Static Methods

UCREL_Doc.from_json[source]

`class` `UCREL_Doc`[source]

`UCREL_Doc.__init__`[source]

`UCREL_Doc.__repr__`[source]

`UCREL_Doc.sentences`[source]

`UCREL_Doc.__iter__`[source]

`UCREL_Doc.__getitem__`[source]

`UCREL_Doc.__len__`[source]

`UCREL_Doc.__eq__`[source]

`UCREL_Doc.to_json`[source]

`UCREL_Doc.from_json`[source]