add examples using the translations data

This commit is contained in:
Nathan TeBlunthuis 2020-03-31 16:56:59 -07:00
parent c8b886364f
commit 8bb3db8b46
2 changed files with 30 additions and 0 deletions

View File

@ -0,0 +1,17 @@
## Example: read the latest keywords file straight from the server and print
## the non-alias translations of "coronavirus".
## stringsAsFactors = FALSE keeps text columns as character on every R version.
df <- read.csv("https://covid19.communitydata.science/datasets/keywords/csv/latest.csv",
               stringsAsFactors = FALSE)
## make the data more R-friendly: expose the alias flag as a logical column.
## read.csv() may already have parsed "True"/"False" into a logical vector, in
## which case comparing against the string "True" is FALSE for every row, so
## normalise through character first. %in% also maps missing values to FALSE.
df$is.alt <- toupper(as.character(df$is_alt)) %in% "TRUE"
df$is_alt <- NULL
## find all item ids whose English label is "coronavirus"
## which() drops rows where the comparison is NA (missing label or langcode)
## instead of returning NA entries
is.coronavirus.en <- tolower(df$label) == "coronavirus" & df$langcode == "en"
coronavirus.itemids <- df[which(is.coronavirus.en), "itemid"]
## there are actually 5 item ids. The one referring to the family of virus is Q57751738
virus.family.itemid <- "http://www.wikidata.org/entity/Q57751738"
coronavirus.translations <- df[which(df$itemid == virus.family.itemid), ]
## let's only look at non-aliases
print(coronavirus.translations[!coronavirus.translations$is.alt,
                               c("label", "langcode")])

View File

@ -0,0 +1,13 @@
import pandas as pd
# Example: read the latest keywords dataset and print the non-alias
# translations of "coronavirus".
# read the latest dataset
df = pd.read_csv("https://covid19.communitydata.science/datasets/keywords/csv/latest.csv")
# find the item ids whose English label is "coronavirus"
# (rows with a missing label compare as False and are excluded)
is_coronavirus_en = (df.label.str.lower() == "coronavirus") & (df.langcode == "en")
coronavirus_itemids = df.loc[is_coronavirus_en, "itemid"]
# there are actually 5 item ids. The one referring to the family of virus is Q57751738
coronavirus_translations = df.loc[df.itemid == "http://www.wikidata.org/entity/Q57751738"]
# let's only look at unique, non-aliases
# build the mask from the subset being indexed rather than from the full frame,
# so the selection does not depend on implicit index alignment;
# .eq(False) also treats a missing is_alt as "not selected"
non_aliases = coronavirus_translations.loc[
    coronavirus_translations.is_alt.eq(False), ["label", "langcode"]
]
print(non_aliases.drop_duplicates())