import csv
import json
import os
from statistics import mean, median

import nltk
import pandas as pd


def metadata_for_file(file: str):
    """Return basic word statistics for a piece of text.

    Despite its name, ``file`` is the text content itself (it is split
    directly), not a path or an open file object.

    Args:
        file: Text to analyse. Words are the whitespace-separated tokens
            produced by ``file.split()``.

    Returns:
        A ``(word_count, avg_word_length)`` tuple. ``avg_word_length`` is the
        mean number of characters per word, or ``0`` when the text contains
        no words.
    """
    word_list = file.split()
    word_count = len(word_list)

    # Guard against division by zero for empty / whitespace-only text.
    if not word_list:
        return word_count, 0

    avg_word_length = sum(map(len, word_list)) / word_count

    # TODO: paragraph count is not computed or returned yet.
    return word_count, avg_word_length