diff --git a/R/examscores.R b/R/examscores.R
new file mode 100644
index 0000000000000000000000000000000000000000..180e7f03a2d51d12522f34190718a96fa3bd9371
--- /dev/null
+++ b/R/examscores.R
@@ -0,0 +1,23 @@
+# NOTE(review): @format states 15 variables, but only 14 are itemised below -- confirm.
+#' Exam scores of students at a fictional public school
+#'
+#' This data set includes scores from three tests of students at a (fictional) public school and a variety of personal and socio-economic factors that may have interaction effects upon them.
+#' @format A data frame, 29069 observations, 15 variables
+#' \describe{
+#' \item{\code{Gender}}{Gender of a student (string)}
+#' \item{\code{EthnicGroup}}{Origin of a student (string)}
+#' \item{\code{ParentEduc}}{Parents' education (string)}
+#' \item{\code{LunchType}}{Type of lunch (string)}
+#' \item{\code{TestPrep}}{Preparation for a test (string)}
+#' \item{\code{ParentMaritalStatus}}{Parental marital status (string)}
+#' \item{\code{PracticeSport}}{Practice sports (string)}
+#' \item{\code{IsFirstChild}}{Firstborn (boolean)}
+#' \item{\code{NrSiblings}}{Number of siblings (integer)}
+#' \item{\code{TransportMeans}}{Means of transport to school (string)}
+#' \item{\code{WklyStudyHours}}{Number of study hours per week (integer)}
+#' \item{\code{MathScore}}{Score in math (integer)}
+#' \item{\code{ReadingScore}}{Score in reading (integer)}
+#' \item{\code{WritingScore}}{Score in writing (integer)}
+#' }
+
+"examscores"
diff --git a/README.md b/README.md
index 91c168778e0a212c18880019007e46bbec1b8956..6ccfc1afcbc858aeb52102e7001f07c5f311410b 100644
--- a/README.md
+++ b/README.md
@@ -12,6 +12,8 @@ Package for the exam of the course "Data Science for Socioeconomists" at the dep
 
 -   *census_2015* with aggregated census data of american households regarding their income and sociodemographic characteristics.
 
+-   *examscores* contains educational data on the students of a fictional school: scores from three tests plus personal and socio-economic factors
+
 -   *examscores2* is an updated version of *examscores*. It includes information about educational data and models a fictional school and its students
 
 -   *income_data* includes information about people's age and their income - it models a fictional population
@@ -23,16 +25,12 @@ Either:\
 #library(remotes)\
 remotes::install_gitlab("BAQ6370/sozoekdsexam", host="gitlab.rrz.uni-hamburg.de", force = TRUE)
 
-library(sozoekdsexam)
-
 or:
 
 #install.packages("devtools")\
 #library(devtools)\
 devtools::install_git("[https://gitlab.rrz.uni-hamburg.de/baq6370/sozoekdsexam.git](https://gitlab.rrz.uni-hamburg.de/bay1977/sozoeko1.git)", force = TRUE)
 
-library(sozoekdsexam)
-
 ## Support
 
 If you find a bug please contact: [lisamarie.wegner\@uni-hamburg.de](lisamarie.wegner@uni-hamburg.de)
diff --git a/data-raw/examscores.RData b/data-raw/examscores.RData
new file mode 100644
index 0000000000000000000000000000000000000000..4bbfafde52c0358efea61af7207d0d754582a67f
Binary files /dev/null and b/data-raw/examscores.RData differ
diff --git a/data-raw/examscores_load.R b/data-raw/examscores_load.R
new file mode 100644
index 0000000000000000000000000000000000000000..014f5edfaa212ffb082d1f335f467080098ab1df
--- /dev/null
+++ b/data-raw/examscores_load.R
@@ -0,0 +1,11 @@
+## Code to prepare the `examscores` dataset (saved as data/examscores.rda).
+## Run from the package root so the relative path below resolves.
+library(devtools)
+library(roxygen2)
+library(dplyr)
+
+# NOTE(review): `newdata` was never created in this script. It presumably lives
+# in data-raw/examscores.RData -- TODO confirm the object name stored there.
+if (!exists("newdata")) load("data-raw/examscores.RData")
+examscores <- newdata %>% select(-high_mathscore)
+usethis::use_data(examscores, overwrite = TRUE)
diff --git a/data/examscores.rda b/data/examscores.rda
new file mode 100644
index 0000000000000000000000000000000000000000..4ed9233ec699dbdce9dd3c8cf7339e8aff5af5e9
Binary files /dev/null and b/data/examscores.rda differ
diff --git a/man/examscores.Rd b/man/examscores.Rd
new file mode 100644
index 0000000000000000000000000000000000000000..b73e92a14ecb013a871993431b6caa842f7cc790
--- /dev/null
+++ b/man/examscores.Rd
@@ -0,0 +1,32 @@
+% Generated by roxygen2: do not edit by hand
+% Please edit documentation in R/examscores.R
+\docType{data}
+\name{examscores}
+\alias{examscores}
+\title{Exam scores of students at a fictional public school}
+\format{
+A data frame, 29069 observations, 15 variables
+\describe{
+\item{\code{Gender}}{Gender of a student (string)}
+\item{\code{EthnicGroup}}{Origin of a student (string)}
+\item{\code{ParentEduc}}{Parents' education (string)}
+\item{\code{LunchType}}{Type of lunch (string)}
+\item{\code{TestPrep}}{Preparation for a test (string)}
+\item{\code{ParentMaritalStatus}}{Parental marital status (string)}
+\item{\code{PracticeSport}}{Practice sports (string)}
+\item{\code{IsFirstChild}}{Firstborn (boolean)}
+\item{\code{NrSiblings}}{Number of siblings (integer)}
+\item{\code{TransportMeans}}{Means of transport to school (string)}
+\item{\code{WklyStudyHours}}{Number of study hours per week (integer)}
+\item{\code{MathScore}}{Score in math (integer)}
+\item{\code{ReadingScore}}{Score in reading (integer)}
+\item{\code{WritingScore}}{Score in writing (integer)}
+}
+}
+\usage{
+examscores
+}
+\description{
+This data set includes scores from three tests of students at a (fictional) public school and a variety of personal and socio-economic factors that may have interaction effects upon them.
+}
+\keyword{datasets}