Refine, analyse, integrate & visualize metadata
+Refine, integrate and analyse Finna metadata
Source:vignettes/articles/refinemetadata.Rmd
@@ -66,6 +66,11 @@ Introduction
+
+Refine using refine_metadata()
+Function
+
library(finna)
sibelius_data <- search_finna("sibelius")
@@ -85,7 +90,41 @@ Introduction## 9 Sibelius Lampi… 1984 fin Kirja,… Sibeliu… Kansal… Unkno…
## 10 Sibelius Tawas… 1997 fin Kirja,… Sibeliu… Kansal… Unkno…
## # ℹ 90 more rows
+
+
+
+Integrate using integrate_metadata()
+Function
+
+finna_data <- search_finna("sibelius")
+other_data <- tibble::tibble(
+ Title = c("Sibelius Symphony No. 5", "Finlandia", "Valse Triste"),
+ Rating = c(5, 4, 3)
+)
+integrated_data <- integrate_metadata(finna_data, other_data, key = "Title")
+print(integrated_data)
+## # A tibble: 103 × 9
+## Title Author Year Language Formats Subjects Library Series Rating
+## <chr> <chr> <chr> <chr> <chr> <chr> <chr> <chr> <dbl>
+## 1 Sibelius favour… Sibel… 2001 NA Äänite… orkeste… Lapin … NA NA
+## 2 Sibelius Tappe… 1967 NA Taidet… NA Jyväsk… NA NA
+## 3 Sibelius Favén… NA NA Taidet… kaljuus… Lahden… NA NA
+## 4 Sibelius Tawas… 2003 fin Kirja,… Sibeliu… Anders… NA NA
+## 5 Sibelius Ringb… 1948 fin Kirja,… Sibeliu… Eepos-… NA NA
+## 6 SIBELIUS TÖRNE… 1945 fin Kirja,… SIBELIU… Helle-… NA NA
+## 7 Sibelius Lampi… 1995 fin Kirja,… Sibeliu… Kansal… NA NA
+## 8 Sibelius Lampi… 2005 fin Kirja,… Sibeliu… Kansal… NA NA
+## 9 Sibelius Lampi… 1984 fin Kirja,… Sibeliu… Kansal… NA NA
+## 10 Sibelius Tawas… 1997 fin Kirja,… Sibeliu… Kansal… NA NA
+## # ℹ 93 more rows
+
+
+
+Analyze using analyze_metadata()
+Function
+
+
sibelius_data <- search_finna("sibelius")
refined_data <- refine_metadata(sibelius_data)
analysis_results <- analyze_metadata(refined_data)
@@ -136,79 +175,85 @@ Introduction## 9 Barnett, Andrew 2
## 10 Gray, Cecil 2
## # ℹ 44 more rows
-
+
+
+1. Applying the visualize_year_distribution()
+Function
+
+
sibelius_data <- search_finna("sibelius")
refined_data <- refine_metadata(sibelius_data)
analysis_results <- analyze_metadata(refined_data)
visualize_year_distribution(analysis_results$year_distribution)
-
+
+
-1. Applying the visualize_top_20_titles()
+2. Applying the visualize_top_20_titles()
Function
This function will visualize the top 20 titles from your dataset.
-
+
# Assuming you have a tibble with Finna metadata called `refined_data`
top_20_titles_plot <- visualize_top_20_titles(refined_data)
# To display the plot
print(top_20_titles_plot)
-
+
-2. Applying the visualize_format_distribution()
+3. Applying the visualize_format_distribution()
Function
This function visualizes the distribution of the records by
format.
-
+
# Plot the format distribution
format_distribution_plot <- visualize_format_distribution(refined_data)
# To display the plot
print(format_distribution_plot)
-
+
-3. Applying the
+4. Applying the
visualize_library_distribution()
Function
This function shows the distribution of the records by library.
-
+
# Plot the library distribution
library_distribution_plot <- visualize_library_distribution(refined_data)
# To display the plot
print(library_distribution_plot)
-
+
-4. Applying the visualize_author_distribution()
+5. Applying the visualize_author_distribution()
Function
This function visualizes the distribution of the records by
author.
-
+
# Plot the author distribution
author_distribution_plot <- visualize_author_distribution(refined_data)
# To display the plot
print(author_distribution_plot)
-
+
-5. Applying the
+6. Applying the
visualize_subject_distribution()
Function
This function visualizes the distribution of the records by
subject.
-
+
# Plot the subject distribution
subject_distribution_plot <- visualize_subject_distribution(refined_data)
# To display the plot
print(subject_distribution_plot)
-
+
refine_metadata()
+Function
+
library(finna)
sibelius_data <- search_finna("sibelius")
@@ -85,7 +90,41 @@ Introduction## 9 Sibelius Lampi… 1984 fin Kirja,… Sibeliu… Kansal… Unkno…
## 10 Sibelius Tawas… 1997 fin Kirja,… Sibeliu… Kansal… Unkno…
## # ℹ 90 more rows
+
+Integrate using integrate_metadata()
+Function
+
+finna_data <- search_finna("sibelius")
+other_data <- tibble::tibble(
+ Title = c("Sibelius Symphony No. 5", "Finlandia", "Valse Triste"),
+ Rating = c(5, 4, 3)
+)
+integrated_data <- integrate_metadata(finna_data, other_data, key = "Title")
+print(integrated_data)
## # A tibble: 103 × 9
+## Title Author Year Language Formats Subjects Library Series Rating
+## <chr> <chr> <chr> <chr> <chr> <chr> <chr> <chr> <dbl>
+## 1 Sibelius favour… Sibel… 2001 NA Äänite… orkeste… Lapin … NA NA
+## 2 Sibelius Tappe… 1967 NA Taidet… NA Jyväsk… NA NA
+## 3 Sibelius Favén… NA NA Taidet… kaljuus… Lahden… NA NA
+## 4 Sibelius Tawas… 2003 fin Kirja,… Sibeliu… Anders… NA NA
+## 5 Sibelius Ringb… 1948 fin Kirja,… Sibeliu… Eepos-… NA NA
+## 6 SIBELIUS TÖRNE… 1945 fin Kirja,… SIBELIU… Helle-… NA NA
+## 7 Sibelius Lampi… 1995 fin Kirja,… Sibeliu… Kansal… NA NA
+## 8 Sibelius Lampi… 2005 fin Kirja,… Sibeliu… Kansal… NA NA
+## 9 Sibelius Lampi… 1984 fin Kirja,… Sibeliu… Kansal… NA NA
+## 10 Sibelius Tawas… 1997 fin Kirja,… Sibeliu… Kansal… NA NA
+## # ℹ 93 more rows
+
+Analyze using analyze_metadata()
+Function
+
+
sibelius_data <- search_finna("sibelius")
refined_data <- refine_metadata(sibelius_data)
analysis_results <- analyze_metadata(refined_data)
@@ -136,79 +175,85 @@ Introduction## 9 Barnett, Andrew 2
## 10 Gray, Cecil 2
## # ℹ 44 more rows
-+
1. Applying the visualize_year_distribution()
+Function
+
+
sibelius_data <- search_finna("sibelius")
refined_data <- refine_metadata(sibelius_data)
analysis_results <- analyze_metadata(refined_data)
visualize_year_distribution(analysis_results$year_distribution)
1. Applying the visualize_top_20_titles()
+2. Applying the visualize_top_20_titles()
Function
This function will visualize the top 20 titles from your dataset.
-
+
# Assuming you have a tibble with Finna metadata called `refined_data`
top_20_titles_plot <- visualize_top_20_titles(refined_data)
# To display the plot
print(top_20_titles_plot)
-
+
-2. Applying the visualize_format_distribution()
+3. Applying the visualize_format_distribution()
Function
This function visualizes the distribution of the records by
format.
-
+
# Plot the format distribution
format_distribution_plot <- visualize_format_distribution(refined_data)
# To display the plot
print(format_distribution_plot)
-
+
-3. Applying the
+4. Applying the
visualize_library_distribution()
Function
This function shows the distribution of the records by library.
-
+
# Plot the library distribution
library_distribution_plot <- visualize_library_distribution(refined_data)
# To display the plot
print(library_distribution_plot)
-
+
-4. Applying the visualize_author_distribution()
+5. Applying the visualize_author_distribution()
Function
This function visualizes the distribution of the records by
author.
-
+
# Plot the author distribution
author_distribution_plot <- visualize_author_distribution(refined_data)
# To display the plot
print(author_distribution_plot)
-
+
-5. Applying the
+6. Applying the
visualize_subject_distribution()
Function
This function visualizes the distribution of the records by
subject.
-
+
# Plot the subject distribution
subject_distribution_plot <- visualize_subject_distribution(refined_data)
# To display the plot
print(subject_distribution_plot)
-
+
visualize_top_20_titles()
Function
+- +# Assuming you have a tibble with Finna metadata called `refined_data` top_20_titles_plot <- visualize_top_20_titles(refined_data) # To display the plot print(top_20_titles_plot)
2. Applying the visualize_format_distribution()
+3. Applying the visualize_format_distribution()
Function
This function visualizes the distribution of the records by
format.
-
+
# Plot the format distribution
format_distribution_plot <- visualize_format_distribution(refined_data)
# To display the plot
print(format_distribution_plot)
-
+
-3. Applying the
+4. Applying the
visualize_library_distribution()
Function
This function shows the distribution of the records by library.
-
+
# Plot the library distribution
library_distribution_plot <- visualize_library_distribution(refined_data)
# To display the plot
print(library_distribution_plot)
-
+
-4. Applying the visualize_author_distribution()
+5. Applying the visualize_author_distribution()
Function
This function visualizes the distribution of the records by
author.
-
+
# Plot the author distribution
author_distribution_plot <- visualize_author_distribution(refined_data)
# To display the plot
print(author_distribution_plot)
-
+
-5. Applying the
+6. Applying the
visualize_subject_distribution()
Function
This function visualizes the distribution of the records by
subject.
-
+
# Plot the subject distribution
subject_distribution_plot <- visualize_subject_distribution(refined_data)
# To display the plot
print(subject_distribution_plot)
-
+
visualize_format_distribution()
Function
+- +# Plot the format distribution format_distribution_plot <- visualize_format_distribution(refined_data) # To display the plot print(format_distribution_plot)
3. Applying the
+4. Applying the
visualize_library_distribution()
Function
This function shows the distribution of the records by library.
-
+
# Plot the library distribution
library_distribution_plot <- visualize_library_distribution(refined_data)
# To display the plot
print(library_distribution_plot)
-
+
-4. Applying the visualize_author_distribution()
+5. Applying the visualize_author_distribution()
Function
This function visualizes the distribution of the records by
author.
-
+
# Plot the author distribution
author_distribution_plot <- visualize_author_distribution(refined_data)
# To display the plot
print(author_distribution_plot)
-
+
-5. Applying the
+6. Applying the
visualize_subject_distribution()
Function
This function visualizes the distribution of the records by
subject.
-
+
# Plot the subject distribution
subject_distribution_plot <- visualize_subject_distribution(refined_data)
# To display the plot
print(subject_distribution_plot)
-
+
visualize_library_distribution()
Function
+- +# Plot the library distribution library_distribution_plot <- visualize_library_distribution(refined_data) # To display the plot print(library_distribution_plot)
4. Applying the visualize_author_distribution()
+5. Applying the visualize_author_distribution()
Function
This function visualizes the distribution of the records by
author.
-
+
# Plot the author distribution
author_distribution_plot <- visualize_author_distribution(refined_data)
# To display the plot
print(author_distribution_plot)
-
+
-5. Applying the
+6. Applying the
visualize_subject_distribution()
Function
This function visualizes the distribution of the records by
subject.
-
+
# Plot the subject distribution
subject_distribution_plot <- visualize_subject_distribution(refined_data)
# To display the plot
print(subject_distribution_plot)
-
+
visualize_author_distribution()
Function
+- +# Plot the author distribution author_distribution_plot <- visualize_author_distribution(refined_data) # To display the plot print(author_distribution_plot)
5. Applying the
+6. Applying the
visualize_subject_distribution()
Function
This function visualizes the distribution of the records by
subject.
-
+
# Plot the subject distribution
subject_distribution_plot <- visualize_subject_distribution(refined_data)
# To display the plot
print(subject_distribution_plot)
-
+
visualize_subject_distribution()
Function
+- +# Plot the subject distribution subject_distribution_plot <- visualize_subject_distribution(refined_data) # To display the plot print(subject_distribution_plot)