git-annex in ntq8312@kibo:/data/ntq8312/ml_measurement_error_public
This commit is contained in:
		
							parent
							
								
									5c931a7198
								
							
						
					
					
						commit
						c42b94110b
					
				| @ -11,16 +11,17 @@ API_KEY = open('perspective_api_key').read() | ||||
| 
 | ||||
| client = discovery.build("commentanalyzer","v1alpha",developerKey=API_KEY,discoveryServiceUrl="https://commentanalyzer.googleapis.com/$discovery/rest?version=v1alpha1",static_discovery=False,) | ||||
| 
 | ||||
| csvreader = csv.DictReader(open("all_data.csv")) | ||||
| csvreader = csv.DictReader(open("all_data.csv"), dialect='unix') | ||||
| 
 | ||||
| outfile = Path("perspective_results.json") | ||||
| already_scored = set() | ||||
| if outfile.exists(): | ||||
|     already_scored = set([json.loads(l)['id'] for l in open(str(outfile),'r')]) | ||||
| 
 | ||||
| with open("perspective_results.json",'w') as of: | ||||
| print(f"loaded {len(already_scored)} scored comments") | ||||
| with open("perspective_results.json",'a') as of: | ||||
|     for line in csvreader: | ||||
|         if line['id'] not in already_scored: | ||||
|         if line['id'] not in already_scored and len(line.get('comment_text','')) > 0: | ||||
|             analyze_request = {'comment':{'text':line['comment_text']}, | ||||
|                                'languages':['en'], | ||||
|                                'requestedAttributes':{'TOXICITY':{}, | ||||
|  | ||||
							
								
								
									
										1
									
								
								civil_comments/perspective_results.json
									
									
									
									
									
										Symbolic link
									
								
							
							
						
						
									
										1
									
								
								civil_comments/perspective_results.json
									
									
									
									
									
										Symbolic link
									
								
							| @ -0,0 +1 @@ | ||||
| ../.git/annex/objects/ZV/z8/SHA256E-s2293825121--6cdc8f8fb64fad2e51027e2564928e8938bf5fc6ca0cd6c31cb2e67aafe0a203.json/SHA256E-s2293825121--6cdc8f8fb64fad2e51027e2564928e8938bf5fc6ca0cd6c31cb2e67aafe0a203.json | ||||
		Loading…
	
		Reference in New Issue
	
	Block a user