shelving some of the merge work for now
This commit is contained in:
parent
77fc3ec541
commit
f9c12bb445
17
mgaughan-rstudio-server_29576188.out
Normal file
17
mgaughan-rstudio-server_29576188.out
Normal file
@ -0,0 +1,17 @@
|
|||||||
|
1. SSH tunnel from your workstation using the following command:
|
||||||
|
|
||||||
|
ssh -N -L 8787:n3439:36873 mjilg@klone.hyak.uw.edu
|
||||||
|
|
||||||
|
and point your web browser to http://localhost:8787
|
||||||
|
|
||||||
|
2. log in to RStudio Server using the following credentials:
|
||||||
|
|
||||||
|
user: mjilg
|
||||||
|
password: qv1O0tpb3YCkMtmNIRbg
|
||||||
|
|
||||||
|
When done using RStudio Server, terminate the job by:
|
||||||
|
|
||||||
|
1. Exit the RStudio Session ("power" button in the top right corner of the RStudio window)
|
||||||
|
2. Issue the following command on the login node:
|
||||||
|
|
||||||
|
scancel -f 29576188
|
151688
p2/080425_gerrit_filled_df.csv
Normal file
151688
p2/080425_gerrit_filled_df.csv
Normal file
File diff suppressed because one or more lines are too long
26
p2/df_consolidation.R
Normal file
26
p2/df_consolidation.R
Normal file
@ -0,0 +1,26 @@
|
|||||||
|
# Load the master discussion data and the Gerrit results, then parse the
# JSON-like text in `selected_gerrit_results` into a list column.
library(tidyverse)
library(jsonlite)
library(dplyr) # already attached by tidyverse; kept so the script's loads are unchanged

main_csv <- "~/p2/071425_master_discussion_data.csv"
main_df <- read.csv(main_csv, header = TRUE)

gerrit_csv <- "~/p2/080425_gerrit_filled_df.csv"
gerrit_df <- read.csv(gerrit_csv, header = TRUE)

# Rewrite single-quoted keys and string values as double-quoted so the text
# can be handed to a JSON parser. The three passes run in this order:
#   1. 'key' followed by a colon      -> "key"
#   2. : 'value' before } ] or ,      -> : "value"
#   3. remaining 'value' list/dict items delimited by : [ , { and , } ]
# Vectorised over `x`; NA entries stay NA.
requote_as_json <- function(x) {
  x <- gsub("(?<=\\{|\\[|, )'(\\w+?)'(?=\\s*:)", '"\\1"', x, perl = TRUE)
  x <- gsub(":(\\s*)'(.*?)'(?=[}\\],])", ':\\1"\\2"', x, perl = TRUE)
  gsub("(?<=[:\\[,\\{])\\s*'([^']*)'\\s*(?=[,\\}\\]])", '"\\1"', x, perl = TRUE)
}

# Parse one JSON string. Returns NULL (with a warning for parse failures)
# instead of raising, so a single missing or malformed row does not abort the
# whole pipeline.
parse_json_or_null <- function(txt) {
  if (is.na(txt) || !nzchar(trimws(txt))) {
    return(NULL)
  }
  tryCatch(
    fromJSON(txt),
    error = function(e) {
      warning(
        "Could not parse Gerrit JSON: ", conditionMessage(e),
        call. = FALSE
      )
      NULL
    }
  )
}

gerrit_extracted_df <- gerrit_df |>
  mutate(
    jsonfixed = requote_as_json(selected_gerrit_results),
    # List column: one parsed object per row, NULL where parsing was not possible.
    expandedjsonlist = lapply(jsonfixed, parse_json_or_null)
  )

# TODO select
# gerrit status: categorical
# owner_wikimedia: BOOL
# LOCa: #
# LOCd: #
# count_reviewers: #
# url: url
|
@ -11,7 +11,7 @@ information_typology = c("EXPECTED BEHAVIOR", "MOTIVATION", "OBSERVED BUG BEHAVI
|
|||||||
"ISSUE CONTENT MANAGEMENT", "ACTION ON ISSUE", "SOCIAL CONVERSATION")
|
"ISSUE CONTENT MANAGEMENT", "ACTION ON ISSUE", "SOCIAL CONVERSATION")
|
||||||
url_extensions = c("GERRIT_URL", "URL")
|
url_extensions = c("GERRIT_URL", "URL")
|
||||||
|
|
||||||
olmo_categorization_csv <-"~/p2/quest/090425_olmo_batched_categorized.csv"
|
(olmo_categorization_csv <-"~/p2/quest/090425_olmo_batched_categorized.csv"
|
||||||
olmo_categorization_df <- read.csv(olmo_categorization_csv, header = TRUE)
|
olmo_categorization_df <- read.csv(olmo_categorization_csv, header = TRUE)
|
||||||
|
|
||||||
olmo_categorization_df <- olmo_categorization_df %>%
|
olmo_categorization_df <- olmo_categorization_df %>%
|
||||||
|
Loading…
Reference in New Issue
Block a user