add stuff to get perspective scores from civil comments
This commit is contained in:
		
							parent
							
								
									d0c5766bdf
								
							
						
					
					
						commit
						e17a52e236
					
				
							
								
								
									
										1
									
								
								civil_comments/all_data.csv
									
									
									
									
									
										Symbolic link
									
								
							
							
						
						
									
										1
									
								
								civil_comments/all_data.csv
									
									
									
									
									
										Symbolic link
									
								
							| @ -0,0 +1 @@ | ||||
| ../.git/annex/objects/6v/fJ/SHA256E-s916052376--a85b5ba7e9a8cda38b91ea6e3957a4f2bfff17bb52f22c935595cbe47cc54d94.csv/SHA256E-s916052376--a85b5ba7e9a8cda38b91ea6e3957a4f2bfff17bb52f22c935595cbe47cc54d94.csv | ||||
| 
 | 
							
								
								
									
										38
									
								
								civil_comments/get_perspective_scores.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										38
									
								
								civil_comments/get_perspective_scores.py
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,38 @@ | ||||
| from googleapiclient import discovery | ||||
| import json | ||||
| import csv | ||||
| from pathlib import Path | ||||
| 
 | ||||
| from time import sleep | ||||
| 
 | ||||
| from itertools import islice | ||||
| 
 | ||||
# Resumable scorer: sends the 'comment_text' of every row in all_data.csv to
# the Perspective (commentanalyzer) API and stores one JSON response per line
# in perspective_results.json, tagged with the row's 'id'.

# Strip surrounding whitespace so a trailing newline in the key file does not
# end up inside the developer key.
with open('perspective_api_key') as key_file:
    API_KEY = key_file.read().strip()

client = discovery.build(
    "commentanalyzer",
    "v1alpha",
    developerKey=API_KEY,
    discoveryServiceUrl="https://commentanalyzer.googleapis.com/$discovery/rest?version=v1alpha1",
    static_discovery=False,
)

# Attributes requested for every comment; each maps to an empty config dict.
REQUESTED_ATTRIBUTES = (
    'TOXICITY',
    "SEVERE_TOXICITY",
    "IDENTITY_ATTACK",
    "INSULT",
    "PROFANITY",
    "THREAT",
)

outfile = Path("perspective_results.json")

# Ids that a previous run already scored, so an interrupted job can resume.
already_scored = set()
if outfile.exists():
    with outfile.open('r') as previous_results:
        already_scored = {
            json.loads(l)['id'] for l in previous_results if l.strip()
        }

# Append ('a'), never truncate ('w'): the ids collected above are skipped
# below, so wiping the file here would permanently lose their results.
# newline="" lets the csv module handle line breaks embedded in quoted
# fields itself, as the csv documentation requires.
with open("all_data.csv", newline="") as csvfile, outfile.open('a') as of:
    csvreader = csv.DictReader(csvfile)
    for line in csvreader:
        if line['id'] in already_scored:
            continue

        analyze_request = {
            'comment': {'text': line['comment_text']},
            'languages': ['en'],
            'requestedAttributes': {name: {} for name in REQUESTED_ATTRIBUTES},
        }
        response = client.comments().analyze(body=analyze_request).execute()

        # Tag the response with the source row id so later runs can skip it.
        response['id'] = line['id']
        result = json.dumps(response)
        of.write(result + '\n')
        # Flush after every record so a crash loses at most the current one.
        of.flush()

        # Pause between requests (presumably to stay under the API's rate
        # limit -- confirm against the project's quota).
        sleep(0.10)
							
								
								
									
										1
									
								
								civil_comments/identity_individual_annotations.csv
									
									
									
									
									
										Symbolic link
									
								
							
							
						
						
									
										1
									
								
								civil_comments/identity_individual_annotations.csv
									
									
									
									
									
										Symbolic link
									
								
							| @ -0,0 +1 @@ | ||||
| ../.git/annex/objects/qP/Xw/SHA256E-s106388260--7b8e9f21c5110d32e337137f8b4fe50987ec1b59fdbfd56a4717cdc13e509ec3.csv/SHA256E-s106388260--7b8e9f21c5110d32e337137f8b4fe50987ec1b59fdbfd56a4717cdc13e509ec3.csv | ||||
| 
 | 
							
								
								
									
										
											BIN
										
									
								
								civil_comments/perspective_api_key.gpg
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										
											BIN
										
									
								
								civil_comments/perspective_api_key.gpg
									
									
									
									
									
										Normal file
									
								
							
										
											Binary file not shown.
										
									
								
							
							
								
								
									
										1
									
								
								civil_comments/toxicity_individual_annotations.csv
									
									
									
									
									
										Symbolic link
									
								
							
							
						
						
									
										1
									
								
								civil_comments/toxicity_individual_annotations.csv
									
									
									
									
									
										Symbolic link
									
								
							| @ -0,0 +1 @@ | ||||
| ../.git/annex/objects/FF/WZ/SHA256E-s417648663--c85bda15b964a24869ae11f76092bde6f4b18236dd1cbe17539526b3b5b736cf.csv/SHA256E-s417648663--c85bda15b964a24869ae11f76092bde6f4b18236dd1cbe17539526b3b5b736cf.csv | ||||
| 
 | 
		Loading…
	
		Reference in New Issue
	
	Block a user