add stuff to get perspective scores from civil comments
This commit is contained in:
parent
d0c5766bdf
commit
e17a52e236
1
civil_comments/all_data.csv
Symbolic link
1
civil_comments/all_data.csv
Symbolic link
@ -0,0 +1 @@
|
|||||||
|
../.git/annex/objects/6v/fJ/SHA256E-s916052376--a85b5ba7e9a8cda38b91ea6e3957a4f2bfff17bb52f22c935595cbe47cc54d94.csv/SHA256E-s916052376--a85b5ba7e9a8cda38b91ea6e3957a4f2bfff17bb52f22c935595cbe47cc54d94.csv
|
|
38
civil_comments/get_perspective_scores.py
Normal file
38
civil_comments/get_perspective_scores.py
Normal file
@ -0,0 +1,38 @@
|
|||||||
|
from googleapiclient import discovery
|
||||||
|
import json
|
||||||
|
import csv
|
||||||
|
from pathlib import Path
|
||||||
|
|
||||||
|
from time import sleep
|
||||||
|
|
||||||
|
from itertools import islice
|
||||||
|
|
||||||
|
# Score every comment in all_data.csv with the Perspective API and append one
# JSON response per line to perspective_results.json. The script is resumable:
# ids already present in the results file are skipped on a re-run.

# Read the API key and strip surrounding whitespace so a trailing newline in
# the key file is not sent as part of the key.
with open('perspective_api_key') as key_file:
    API_KEY = key_file.read().strip()

# NOTE(review): the version argument is "v1alpha" while the discovery URL asks
# for v1alpha1; kept exactly as in the original -- confirm which is intended.
client = discovery.build(
    "commentanalyzer",
    "v1alpha",
    developerKey=API_KEY,
    discoveryServiceUrl="https://commentanalyzer.googleapis.com/$discovery/rest?version=v1alpha1",
    static_discovery=False,
)

outfile = Path("perspective_results.json")

# Collect the ids that a previous run already wrote, ignoring blank lines so a
# stray empty line does not abort the resume.
already_scored = set()
if outfile.exists():
    with outfile.open('r') as previous_results:
        already_scored = {
            json.loads(l)['id'] for l in previous_results if l.strip()
        }

# The results file is opened in append mode: opening it with 'w' would
# truncate the very results whose ids were just loaded into already_scored.
# newline="" lets the csv module handle newlines embedded in quoted fields.
with open("all_data.csv", newline="") as csv_file, outfile.open('a') as of:
    csvreader = csv.DictReader(csv_file)
    for line in csvreader:
        if line['id'] in already_scored:
            continue

        analyze_request = {
            'comment': {'text': line['comment_text']},
            'languages': ['en'],
            'requestedAttributes': {
                'TOXICITY': {},
                "SEVERE_TOXICITY": {},
                "IDENTITY_ATTACK": {},
                "INSULT": {},
                "PROFANITY": {},
                "THREAT": {},
            },
        }
        response = client.comments().analyze(body=analyze_request).execute()

        # Tag the response with the comment id so it can be joined back to
        # the CSV row and recognised as done on the next run.
        response['id'] = line['id']
        of.write(json.dumps(response) + '\n')
        # Flush after every record so completed work reaches the file even if
        # a later request raises.
        of.flush()

        # Pause between requests (presumably to stay under the API's rate
        # limit -- confirm against the project's quota). Skipped rows do not
        # trigger a request, so they are not delayed.
        sleep(0.10)
|
1
civil_comments/identity_individual_annotations.csv
Symbolic link
1
civil_comments/identity_individual_annotations.csv
Symbolic link
@ -0,0 +1 @@
|
|||||||
|
../.git/annex/objects/qP/Xw/SHA256E-s106388260--7b8e9f21c5110d32e337137f8b4fe50987ec1b59fdbfd56a4717cdc13e509ec3.csv/SHA256E-s106388260--7b8e9f21c5110d32e337137f8b4fe50987ec1b59fdbfd56a4717cdc13e509ec3.csv
|
|
BIN
civil_comments/perspective_api_key.gpg
Normal file
BIN
civil_comments/perspective_api_key.gpg
Normal file
Binary file not shown.
1
civil_comments/toxicity_individual_annotations.csv
Symbolic link
1
civil_comments/toxicity_individual_annotations.csv
Symbolic link
@ -0,0 +1 @@
|
|||||||
|
../.git/annex/objects/FF/WZ/SHA256E-s417648663--c85bda15b964a24869ae11f76092bde6f4b18236dd1cbe17539526b3b5b736cf.csv/SHA256E-s417648663--c85bda15b964a24869ae11f76092bde6f4b18236dd1cbe17539526b3b5b736cf.csv
|
|
Loading…
Reference in New Issue
Block a user