Add script to get Perspective API scores for the Civil Comments data
This commit is contained in:
		
							parent
							
								
									d0c5766bdf
								
							
						
					
					
						commit
						e17a52e236
					
				
							
								
								
									
										1
									
								
								civil_comments/all_data.csv
									
									
									
									
									
										Symbolic link
									
								
							
							
						
						
									
										1
									
								
								civil_comments/all_data.csv
									
									
									
									
									
										Symbolic link
									
								
							| @ -0,0 +1 @@ | |||||||
|  | ../.git/annex/objects/6v/fJ/SHA256E-s916052376--a85b5ba7e9a8cda38b91ea6e3957a4f2bfff17bb52f22c935595cbe47cc54d94.csv/SHA256E-s916052376--a85b5ba7e9a8cda38b91ea6e3957a4f2bfff17bb52f22c935595cbe47cc54d94.csv | ||||||
| 
 | 
							
								
								
									
										38
									
								
								civil_comments/get_perspective_scores.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										38
									
								
								civil_comments/get_perspective_scores.py
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,38 @@ | |||||||
|  | from googleapiclient import discovery | ||||||
|  | import json | ||||||
|  | import csv | ||||||
|  | from pathlib import Path | ||||||
|  | 
 | ||||||
|  | from time import sleep | ||||||
|  | 
 | ||||||
|  | from itertools import islice | ||||||
|  | 
 | ||||||
# Attributes requested from the Perspective API for every comment.
REQUESTED_ATTRIBUTES = (
    'TOXICITY',
    "SEVERE_TOXICITY",
    "IDENTITY_ATTACK",
    "INSULT",
    "PROFANITY",
    "THREAT",
)


def load_scored_ids(results_path):
    """Return the set of comment ids already stored in the results file.

    The results file holds one JSON object per line, each carrying the
    ``id`` of the comment it belongs to.  A missing file yields an empty
    set; blank lines are ignored.

    Raises:
        json.JSONDecodeError: if a non-blank line is not valid JSON.
        KeyError: if a record has no ``id`` field.
    """
    if not results_path.exists():
        return set()
    with results_path.open('r') as results:
        return {json.loads(row)['id'] for row in results if row.strip()}


def build_analyze_request(comment_text):
    """Build the request body sent to ``comments().analyze`` for one comment."""
    return {
        'comment': {'text': comment_text},
        'languages': ['en'],
        'requestedAttributes': {name: {} for name in REQUESTED_ATTRIBUTES},
    }


def main():
    """Score every not-yet-scored comment in ``all_data.csv``.

    Each API response is tagged with the comment's ``id`` and appended as
    one JSON line to ``perspective_results.json``, so an interrupted run
    can be restarted and will continue where it stopped.
    """
    # Strip surrounding whitespace so a trailing newline in the key file
    # does not become part of the key.
    with open('perspective_api_key') as key_file:
        api_key = key_file.read().strip()

    # NOTE(review): the version argument is "v1alpha" while the discovery
    # URL names v1alpha1 -- kept as in the original; confirm which is meant.
    client = discovery.build(
        "commentanalyzer",
        "v1alpha",
        developerKey=api_key,
        discoveryServiceUrl="https://commentanalyzer.googleapis.com/$discovery/rest?version=v1alpha1",
        static_discovery=False,
    )

    outfile = Path("perspective_results.json")
    already_scored = load_scored_ids(outfile)

    # Append, never truncate: the ids collected above are skipped below, so
    # wiping the file would lose their scores for good.
    # newline="" lets the csv module handle line breaks inside quoted fields.
    with open("all_data.csv", newline="") as data_file, outfile.open('a') as of:
        for line in csv.DictReader(data_file):
            if line['id'] in already_scored:
                continue

            analyze_request = build_analyze_request(line['comment_text'])
            response = client.comments().analyze(body=analyze_request).execute()
            response['id'] = line['id']
            of.write(json.dumps(response) + '\n')
            # Flush per record so finished work survives an interruption.
            of.flush()

            # Brief pause between requests (presumably to stay under the
            # API rate limit -- confirm against the project's quota).
            sleep(0.10)


if __name__ == "__main__":
    main()
							
								
								
									
										1
									
								
								civil_comments/identity_individual_annotations.csv
									
									
									
									
									
										Symbolic link
									
								
							
							
						
						
									
										1
									
								
								civil_comments/identity_individual_annotations.csv
									
									
									
									
									
										Symbolic link
									
								
							| @ -0,0 +1 @@ | |||||||
|  | ../.git/annex/objects/qP/Xw/SHA256E-s106388260--7b8e9f21c5110d32e337137f8b4fe50987ec1b59fdbfd56a4717cdc13e509ec3.csv/SHA256E-s106388260--7b8e9f21c5110d32e337137f8b4fe50987ec1b59fdbfd56a4717cdc13e509ec3.csv | ||||||
| 
 | 
							
								
								
									
										
											BIN
										
									
								
								civil_comments/perspective_api_key.gpg
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										
											BIN
										
									
								
								civil_comments/perspective_api_key.gpg
									
									
									
									
									
										Normal file
									
								
							
										
											Binary file not shown.
										
									
								
							
							
								
								
									
										1
									
								
								civil_comments/toxicity_individual_annotations.csv
									
									
									
									
									
										Symbolic link
									
								
							
							
						
						
									
										1
									
								
								civil_comments/toxicity_individual_annotations.csv
									
									
									
									
									
										Symbolic link
									
								
							| @ -0,0 +1 @@ | |||||||
|  | ../.git/annex/objects/FF/WZ/SHA256E-s417648663--c85bda15b964a24869ae11f76092bde6f4b18236dd1cbe17539526b3b5b736cf.csv/SHA256E-s417648663--c85bda15b964a24869ae11f76092bde6f4b18236dd1cbe17539526b3b5b736cf.csv | ||||||
| 
 | 
		Loading…
	
		Reference in New Issue
	
	Block a user