
AwardsSharePlayers table
AwardsSharePlayers.Rd
Award voting for player awards
Usage
data(AwardsSharePlayers)
Format
A data frame with 7523 observations on the following 7 variables.
awardID: Name of award votes were received for
yearID: Year
lgID: League; a factor with levels AL ML NL
playerID: Player ID code
pointsWon: Number of points received
pointsMax: Maximum number of points possible
votesFirst: Number of first place votes
Source
Lahman, S. (2025) Lahman's Baseball Database, 1871-2024, 2025 version, https://sabr.org/lahman-database/
Examples
# Vote tallies for post-season player awards
# library() stops immediately if dplyr is not installed; require() would only
# return FALSE and let the examples fail later at the first %>% call.
library(dplyr)
# Which awards are represented in this data frame?
unique(AwardsSharePlayers$awardID)
#> [1] "Rookie of the Year" "Most Valuable Player" "Cy Young Award"
# Sort the votes for the Cy Young award in decreasing order.
# Until 1967, a single award went to the best pitcher across both leagues.
# The awardID value must match the data exactly: the label is
# "Cy Young Award" (see unique(AwardsSharePlayers$awardID)); the shorter
# "Cy Young" matches no rows and silently yields empty results.
cyvotes <- AwardsSharePlayers %>%
  filter(awardID == "Cy Young Award") %>%
  group_by(yearID, lgID) %>%
  arrange(desc(pointsWon))

# 2012 votes
subset(cyvotes, yearID == 2012)

# top three votegetters each year by league
# (cyvotes is already sorted by pointsWon, so head() picks the top of each group)
cya_top3 <- cyvotes %>%
  group_by(yearID, lgID) %>%
  do(head(., 3))
head(cya_top3, 12)

# unanimous Cy Young winners
subset(cyvotes, pointsWon == pointsMax)

## CYA was a major league award until 1967
# Find top five pitchers with most top 3 vote tallies in CYA
# head(with(cya_top3, rev(sort(table(playerID)))), 5)

# Pre-1967
cya_top3 %>%
  filter(yearID <= 1966) %>%
  group_by(playerID) %>%
  summarise(yrs_top3 = n()) %>%
  arrange(desc(yrs_top3)) %>%
  head(., 2)

# 1967+ (both leagues)
cya_top3 %>%
  filter(yearID > 1966) %>%
  group_by(playerID) %>%
  summarise(yrs_top3 = n()) %>%
  arrange(desc(yrs_top3)) %>%
  head(., 5)

# 1967+ (by league)
# .groups = "drop" returns an ungrouped result and avoids the
# "summarise() has grouped output" message for the two-key grouping.
cya_top3 %>%
  filter(yearID > 1966) %>%
  group_by(playerID, lgID) %>%
  summarise(yrs_top3 = n(), .groups = "drop") %>%
  arrange(desc(yrs_top3)) %>%
  head(., 5)
# Ditto for MVP awards
# Top 3 votegetters for MVP award by year and league
# The awardID label in the data is "Most Valuable Player" (see
# unique(AwardsSharePlayers$awardID)); filtering on "MVP" matches no rows.
MVP_top3 <- AwardsSharePlayers %>%
  filter(awardID == "Most Valuable Player") %>%
  group_by(yearID, lgID) %>%
  arrange(desc(pointsWon)) %>%
  do(head(., 3))
tail(MVP_top3)

## Select players with >= 7 top 3 finishes
MVP_top3 %>%
  group_by(playerID) %>%
  summarise(n_top3 = n()) %>%
  arrange(desc(n_top3)) %>%
  filter(n_top3 > 6)