forked from KEMT/zpwiki
		
	update
This commit is contained in:
		
							parent
							
								
									d3442d01f7
								
							
						
					
					
						commit
						893a25d5f0
					
				| @ -1,14 +1,60 @@ | |||||||
| # load data | # load data | ||||||
| filename = 'ner/annotations.jsonl' | 
 | ||||||
|  | filename = 'ner/skner/skner.jsonl' | ||||||
| file = open(filename, 'rt', encoding='utf-8') | file = open(filename, 'rt', encoding='utf-8') | ||||||
| text = file.read() | text = file.read() | ||||||
| 
 | 
 | ||||||
| # count entity PER | # count articles | ||||||
|  | countAccept = text.count('accept') | ||||||
|  | countReject = text.count('reject') | ||||||
|  | countSkip = text.count('ignore') | ||||||
|  | countSpans = text.count('tokens') | ||||||
|  | # count entities | ||||||
| countPER = text.count('PER') | countPER = text.count('PER') | ||||||
| countLOC = text.count('LOC') | countLOC = text.count('LOC') | ||||||
| countORG = text.count('ORG') | countORG = text.count('ORG') | ||||||
| countMISC = text.count('MISC') | countMISC = text.count('MISC') | ||||||
| print('Počet anotovaných entít typu PER:', countPER,'\n',  | 
 | ||||||
|       'Počet anotovaných entít typu LOC:', countLOC,'\n', | underline = '\033[04m' | ||||||
|       'Počet anotovaných entít typu ORG:', countORG,'\n', | reset = '\033[0m' | ||||||
|       'Počet anotovaných entít typu MISC:', countMISC,'\n') | red = '\033[31m' | ||||||
|  | green='\033[32m' | ||||||
|  | gray='\033[37m' | ||||||
|  | 
 | ||||||
|  | # table v1 | ||||||
|  | #from lib import TableIt | ||||||
|  | #table1 = [     | ||||||
|  | #    ['Prijatých', countAccept],    | ||||||
|  | #    ['Zamietnutých', countReject], | ||||||
|  | #    ['Preskočených', countSkip], | ||||||
|  | #    ['------------', '------------'], | ||||||
|  | #    ['Spolu', countSpans] | ||||||
|  | #] | ||||||
|  | # | ||||||
|  | #table = [     | ||||||
|  | #    ['Entita', 'Počet'],    | ||||||
|  | #    ['PER', countPER], | ||||||
|  | #    ['LOC', countLOC], | ||||||
|  | #    ['ORG', countORG], | ||||||
|  | #    ['MISC', countMISC] | ||||||
|  | #] | ||||||
|  | #print('\nPočet anotovaných článkov:') | ||||||
|  | #TableIt.printTable(table1) | ||||||
|  | #print('\nPočet jednotlivých entít:') | ||||||
|  | #TableIt.printTable(table, useFieldNames=True, color=(26, 156, 171)) | ||||||
|  | 
 | ||||||
|  | # table v2 | ||||||
|  | print(underline + '\nPočet anotovaných článkov:' + reset) | ||||||
|  | print(green + "%-15s %-20s" %("Prijatých", countAccept) + reset) | ||||||
|  | print(red + "%-15s %-15s" %("Zamietnutých", countReject) + reset) | ||||||
|  | print(gray + "%-15s %-15s" %("Preskočených", countSkip) + reset) | ||||||
|  | print("%-15s" %("---------------------")) | ||||||
|  | print("%-15s %-15s" %("Spolu", countSpans)) | ||||||
|  | 
 | ||||||
|  | print(underline + '\nPočet jednotlivých entít:' + reset) | ||||||
|  | print("%-10s %-10s" %("Entita:", "Počet:")) | ||||||
|  | print("%-10s" %("----------------")) | ||||||
|  | print("%-10s %-10s" %("PER", countPER)) | ||||||
|  | print("%-10s %-10s" %("LOC", countLOC)) | ||||||
|  | print("%-10s %-10s" %("ORG", countORG)) | ||||||
|  | print("%-10s %-10s" %("MISC", countMISC)) | ||||||
		Loading…
	
		Reference in New Issue
	
	Block a user