update
This commit is contained in:
parent
d3442d01f7
commit
893a25d5f0
@ -1,14 +1,60 @@
|
|||||||
# load data
filename = 'ner/skner/skner.jsonl'
# Read the whole annotation file into memory as one string. The `with`
# block closes the handle as soon as the read finishes, even if it raises.
with open(filename, 'rt', encoding='utf-8') as file:
    text = file.read()
|
||||||
|
|
||||||
# count articles
# NOTE(review): these are plain substring counts over the raw file text, so
# every occurrence of the word is counted wherever it appears in the file.
countAccept = text.count('accept')
countReject = text.count('reject')
countSkip = text.count('ignore')
# Occurrences of 'tokens'; printed later as the overall total ("Spolu").
countSpans = text.count('tokens')
|
||||||
|
# count entities
# NOTE(review): substring counts over the raw text; a label such as 'PER'
# is also matched inside any longer upper-case word that contains it.
countPER, countLOC, countORG, countMISC = (
    text.count(label) for label in ('PER', 'LOC', 'ORG', 'MISC')
)
|
||||||
# ANSI escape sequences used to style the terminal output below.
underline = '\033[04m'
reset = '\033[0m'  # appended after styled text to switch styling off again
red = '\033[31m'
green = '\033[32m'
gray = '\033[37m'
|
||||||
|
|
||||||
|
# table v1 (commented out below; rendered with lib.TableIt)
|
||||||
|
#from lib import TableIt
|
||||||
|
#table1 = [
|
||||||
|
# ['Prijatých', countAccept],
|
||||||
|
# ['Zamietnutých', countReject],
|
||||||
|
# ['Preskočených', countSkip],
|
||||||
|
# ['------------', '------------'],
|
||||||
|
# ['Spolu', countSpans]
|
||||||
|
#]
|
||||||
|
#
|
||||||
|
#table = [
|
||||||
|
# ['Entita', 'Počet'],
|
||||||
|
# ['PER', countPER],
|
||||||
|
# ['LOC', countLOC],
|
||||||
|
# ['ORG', countORG],
|
||||||
|
# ['MISC', countMISC]
|
||||||
|
#]
|
||||||
|
#print('\nPočet anotovaných článkov:')
|
||||||
|
#TableIt.printTable(table1)
|
||||||
|
#print('\nPočet jednotlivých entít:')
|
||||||
|
#TableIt.printTable(table, useFieldNames=True, color=(26, 156, 171))
|
||||||
|
|
||||||
|
# table v2
# Summary of annotated articles: one coloured row per annotation outcome,
# then a separator and the overall total.
print(underline + '\nPočet anotovaných článkov:' + reset)
article_rows = (
    (green, "Prijatých", countAccept),
    (red, "Zamietnutých", countReject),
    (gray, "Preskočených", countSkip),
)
for color, label, count in article_rows:
    # Both columns are left-justified to 15 characters on every row.
    print(color + "%-15s %-15s" % (label, count) + reset)
print("%-15s" % ("---------------------"))
print("%-15s %-15s" % ("Spolu", countSpans))
|
||||||
|
|
||||||
|
# Per-entity-type counts: header row, separator, then one row per label.
print(underline + '\nPočet jednotlivých entít:' + reset)
print("%-10s %-10s" % ("Entita:", "Počet:"))
print("%-10s" % ("----------------"))
entity_rows = (
    ("PER", countPER),
    ("LOC", countLOC),
    ("ORG", countORG),
    ("MISC", countMISC),
)
for label, count in entity_rows:
    print("%-10s %-10s" % (label, count))
|
Loading…
Reference in New Issue
Block a user