git-annex in ntq8312@kibo:/data/ntq8312/ml_measurement_error_public
This commit is contained in:
parent
5c931a7198
commit
c42b94110b
@ -11,16 +11,17 @@ API_KEY = open('perspective_api_key').read()
|
|||||||
|
|
||||||
client = discovery.build("commentanalyzer","v1alpha",developerKey=API_KEY,discoveryServiceUrl="https://commentanalyzer.googleapis.com/$discovery/rest?version=v1alpha1",static_discovery=False,)
|
client = discovery.build("commentanalyzer","v1alpha",developerKey=API_KEY,discoveryServiceUrl="https://commentanalyzer.googleapis.com/$discovery/rest?version=v1alpha1",static_discovery=False,)
|
||||||
|
|
||||||
csvreader = csv.DictReader(open("all_data.csv"))
|
csvreader = csv.DictReader(open("all_data.csv"), dialect='unix')
|
||||||
|
|
||||||
outfile = Path("perspective_results.json")
|
outfile = Path("perspective_results.json")
|
||||||
already_scored = set()
|
already_scored = set()
|
||||||
if outfile.exists():
|
if outfile.exists():
|
||||||
already_scored = set([json.loads(l)['id'] for l in open(str(outfile),'r')])
|
already_scored = set([json.loads(l)['id'] for l in open(str(outfile),'r')])
|
||||||
|
|
||||||
with open("perspective_results.json",'w') as of:
|
print(f"loaded {len(already_scored)} scored comments")
|
||||||
|
with open("perspective_results.json",'a') as of:
|
||||||
for line in csvreader:
|
for line in csvreader:
|
||||||
if line['id'] not in already_scored:
|
if line['id'] not in already_scored and len(line.get('comment_text','')) > 0:
|
||||||
analyze_request = {'comment':{'text':line['comment_text']},
|
analyze_request = {'comment':{'text':line['comment_text']},
|
||||||
'languages':['en'],
|
'languages':['en'],
|
||||||
'requestedAttributes':{'TOXICITY':{},
|
'requestedAttributes':{'TOXICITY':{},
|
||||||
|
1
civil_comments/perspective_results.json
Symbolic link
1
civil_comments/perspective_results.json
Symbolic link
@ -0,0 +1 @@
|
|||||||
|
../.git/annex/objects/ZV/z8/SHA256E-s2293825121--6cdc8f8fb64fad2e51027e2564928e8938bf5fc6ca0cd6c31cb2e67aafe0a203.json/SHA256E-s2293825121--6cdc8f8fb64fad2e51027e2564928e8938bf5fc6ca0cd6c31cb2e67aafe0a203.json
|
Loading…
Reference in New Issue
Block a user