1
0

updating with c3 viz for dependency depth

This commit is contained in:
Matthew Gaughan 2025-07-01 15:58:05 -07:00
parent a4d8685c13
commit 6c477f3d49
5 changed files with 59 additions and 41 deletions

View File

@ -181,3 +181,6 @@ ls
cd case3
ls
rm 062725_c3_title_cleaned.csv
ls
ls ../case2
ls ../case1

View File

@ -18,7 +18,7 @@
"metadata": {},
"outputs": [],
"source": [
"phab_path = \"/mmfs1/gscratch/comdata/users/mjilg/mw-repo-lifecycles/case3/0422_http_phab_comments.csv\"\n",
"phab_path = \"/mmfs1/gscratch/comdata/users/mjilg/mw-repo-lifecycles/case3/050825_coref-rel-final.csv\"\n",
"phab_df = pd.read_csv(phab_path)"
]
},
@ -1004,7 +1004,7 @@
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.11.11"
"version": "3.13.5"
}
},
"nbformat": 4,

Binary file not shown.

After

Width:  |  Height:  |  Size: 71 KiB

File diff suppressed because one or more lines are too long

View File

@ -0,0 +1,23 @@
# Build one combined table from the case1/case2/case3 CSV files and count how
# often "user" (any letter case) occurs in each row's `text` and
# `resolved_text` columns.
library(tidyverse)
library(stringr)  # tidyverse already attaches stringr; kept as an explicit dep

# Input locations. NOTE: despite the `_count` suffix, these hold file paths.
c1_count <- "/mmfs1/gscratch/comdata/users/mjilg/mw-repo-lifecycles/case1/0312_resolved_ve_phab_comments.csv"
c2_count <- "/mmfs1/gscratch/comdata/users/mjilg/mw-repo-lifecycles/case2/051825_coref_resolved_dep_trees.csv"
c3_count <- "/mmfs1/gscratch/comdata/users/mjilg/mw-repo-lifecycles/case3/050825_coref-rel-final.csv"

# Read each file and tag every row with the case it was loaded from.
c1_input_df <- mutate(read.csv(c1_count, header = TRUE), source = "c1")
c2_input_df <- mutate(read.csv(c2_count, header = TRUE), source = "c2")
c3_input_df <- mutate(read.csv(c3_count, header = TRUE), source = "c3")

# Stack the three labelled tables into a single data frame.
combined_df <- bind_rows(list(c1_input_df, c2_input_df, c3_input_df))

# One case-insensitive matcher, reused for both count columns.
user_pattern <- regex("user", ignore_case = TRUE)
combined_df$user_in_text <- str_count(combined_df$text, user_pattern)
combined_df$user_in_resolved_text <- str_count(
  combined_df$resolved_text,
  user_pattern
)