git-annex in ntq8312@kibo:/data/ntq8312/ml_measurement_error_public
This commit is contained in:
		
							parent
							
								
									5c931a7198
								
							
						
					
					
						commit
						c42b94110b
					
				| @ -11,16 +11,17 @@ API_KEY = open('perspective_api_key').read() | |||||||
| 
 | 
 | ||||||
| client = discovery.build("commentanalyzer","v1alpha",developerKey=API_KEY,discoveryServiceUrl="https://commentanalyzer.googleapis.com/$discovery/rest?version=v1alpha1",static_discovery=False,) | client = discovery.build("commentanalyzer","v1alpha",developerKey=API_KEY,discoveryServiceUrl="https://commentanalyzer.googleapis.com/$discovery/rest?version=v1alpha1",static_discovery=False,) | ||||||
| 
 | 
 | ||||||
| csvreader = csv.DictReader(open("all_data.csv")) | csvreader = csv.DictReader(open("all_data.csv"), dialect='unix') | ||||||
| 
 | 
 | ||||||
| outfile = Path("perspective_results.json") | outfile = Path("perspective_results.json") | ||||||
| already_scored = set() | already_scored = set() | ||||||
| if outfile.exists(): | if outfile.exists(): | ||||||
|     already_scored = set([json.loads(l)['id'] for l in open(str(outfile),'r')]) |     already_scored = set([json.loads(l)['id'] for l in open(str(outfile),'r')]) | ||||||
| 
 | 
 | ||||||
| with open("perspective_results.json",'w') as of: | print(f"loaded {len(already_scored)} scored comments") | ||||||
|  | with open("perspective_results.json",'a') as of: | ||||||
|     for line in csvreader: |     for line in csvreader: | ||||||
|         if line['id'] not in already_scored: |         if line['id'] not in already_scored and len(line.get('comment_text','')) > 0: | ||||||
|             analyze_request = {'comment':{'text':line['comment_text']}, |             analyze_request = {'comment':{'text':line['comment_text']}, | ||||||
|                                'languages':['en'], |                                'languages':['en'], | ||||||
|                                'requestedAttributes':{'TOXICITY':{}, |                                'requestedAttributes':{'TOXICITY':{}, | ||||||
|  | |||||||
							
								
								
									
										1
									
								
								civil_comments/perspective_results.json
									
									
									
									
									
										Symbolic link
									
								
							
							
						
						
									
										1
									
								
								civil_comments/perspective_results.json
									
									
									
									
									
										Symbolic link
									
								
							| @ -0,0 +1 @@ | |||||||
|  | ../.git/annex/objects/ZV/z8/SHA256E-s2293825121--6cdc8f8fb64fad2e51027e2564928e8938bf5fc6ca0cd6c31cb2e67aafe0a203.json/SHA256E-s2293825121--6cdc8f8fb64fad2e51027e2564928e8938bf5fc6ca0cd6c31cb2e67aafe0a203.json | ||||||
		Loading…
	
		Reference in New Issue
	
	Block a user