add examples using the translations data
This commit is contained in:
parent
c8b886364f
commit
8bb3db8b46
17
keywords/analysis/translations_example.R
Normal file
17
keywords/analysis/translations_example.R
Normal file
@ -0,0 +1,17 @@
|
|||||||
|
## Example: read the latest keywords file straight from the server and
## print the non-alias translations of "coronavirus".
df <- read.csv("https://covid19.communitydata.science/datasets/keywords/csv/latest.csv")

## make the data more R-friendly
## read.csv() may already have converted a column holding only "True"/"False"
## to logical; comparing that against the string "True" would be FALSE for
## every row. as.logical() accepts logical, character and factor input alike.
df$is.alt <- as.logical(df$is_alt)
df$is_alt <- NULL

## find all item ids whose English label is "coronavirus"
## (which() skips rows where the comparison is NA instead of returning NA entries)
is.coronavirus <- tolower(df$label) == "coronavirus" & df$langcode == "en"
coronavirus.itemids <- df[which(is.coronavirus), "itemid"]

## there are actually 5 item ids. The one referring to the family of virus is Q57751738
coronavirus.translations <- df[
  which(df$itemid == "http://www.wikidata.org/entity/Q57751738"),
]

## let's only look at non-aliases
print(coronavirus.translations[
  which(!coronavirus.translations$is.alt),
  c("label", "langcode")
])
|
13
keywords/analysis/translations_example.py
Normal file
13
keywords/analysis/translations_example.py
Normal file
@ -0,0 +1,13 @@
|
|||||||
|
import pandas as pd

# read the latest dataset
df = pd.read_csv("https://covid19.communitydata.science/datasets/keywords/csv/latest.csv")

# find the item ids whose English label is "coronavirus"
is_coronavirus = (df.label.str.lower() == "coronavirus") & (df.langcode == "en")
coronavirus_itemids = df.loc[is_coronavirus, "itemid"]

# there are actually 5 item ids. The one referring to the family of virus is Q57751738
coronavirus_translations = df.loc[df.itemid == "http://www.wikidata.org/entity/Q57751738"]

# let's only look at non-aliases
# (build the mask from the filtered frame itself rather than from the full df,
# so the selection does not depend on implicit index alignment)
is_non_alias = coronavirus_translations.is_alt == False
print(coronavirus_translations.loc[is_non_alias, ["label", "langcode"]])
|
Loading…
Reference in New Issue
Block a user