
AwardsSharePlayers table
AwardsSharePlayers.RdAward voting for managers awards
Usage
data(AwardsSharePlayers)Format
A data frame with 7523 observations on the following 7 variables.
- awardID
- name of award votes were received for 
- yearID
- Year 
- lgID
- League; a factor with levels - AL- ML- NL
- playerID
- Player ID code 
- pointsWon
- Number of points received 
- pointsMax
- Maximum number of points possible 
- votesFirst
- Number of first place votes 
Source
Lahman, S. (2025) Lahman's Baseball Database, 1871-2024, 2025 version, https://sabr.org/lahman-database/
Examples
# Vote tallies for post-season player awards
require("dplyr")
# Which awards are represented in this data frame?
unique(AwardsSharePlayers$awardID)
#> [1] "Rookie of the Year"   "Most Valuable Player" "Cy Young Award"      
# Sort the votes for the Cy Young award in decreasing order.
# Until 1967, the award went to the best pitcher
# in both leagues.
cyvotes <- AwardsSharePlayers %>%
              filter(awardID == "Cy Young") %>%
              group_by(yearID, lgID) %>%
              arrange(desc(pointsWon))
# 2012 votes
subset(cyvotes, yearID == 2012)
#> # A tibble: 0 × 7
#> # Groups:   yearID, lgID [0]
#> # ℹ 7 variables: awardID <chr>, yearID <int>, lgID <fct>, playerID <chr>,
#> #   pointsWon <int>, pointsMax <int>, votesFirst <int>
# top three votegetters each year by league
cya_top3 <- cyvotes %>%
              group_by(yearID, lgID) %>%
              do(head(., 3))
head(cya_top3, 12)
#> # A tibble: 0 × 7
#> # Groups:   yearID, lgID [0]
#> # ℹ 7 variables: awardID <chr>, yearID <int>, lgID <fct>, playerID <chr>,
#> #   pointsWon <int>, pointsMax <int>, votesFirst <int>
# unanimous Cy Young winners
subset(cyvotes, pointsWon == pointsMax)
#> # A tibble: 0 × 7
#> # Groups:   yearID, lgID [0]
#> # ℹ 7 variables: awardID <chr>, yearID <int>, lgID <fct>, playerID <chr>,
#> #   pointsWon <int>, pointsMax <int>, votesFirst <int>
## CYA was a major league award until 1967
# Find top five pitchers with most top 3 vote tallies in CYA
# head(with(cya_top3, rev(sort(table(playerID)))), 5)
# Pre-1967
cya_top3 %>% 
  filter(yearID <= 1966) %>%
  group_by(playerID) %>%
  summarise(yrs_top3 = n()) %>%
  arrange(desc(yrs_top3)) %>%
  head(., 2)
#> # A tibble: 0 × 2
#> # ℹ 2 variables: playerID <chr>, yrs_top3 <int>
# 1967+ (both leagues)
cya_top3 %>% 
  filter(yearID > 1966) %>%
  group_by(playerID) %>%
  summarise(yrs_top3 = n()) %>%
  arrange(desc(yrs_top3)) %>%
  head(., 5)
#> # A tibble: 0 × 2
#> # ℹ 2 variables: playerID <chr>, yrs_top3 <int>
# 1967+ (by league)
cya_top3 %>% 
  filter(yearID > 1966) %>%
  group_by(playerID, lgID) %>%
  summarise(yrs_top3 = n()) %>%
  arrange(desc(yrs_top3)) %>%
  head(., 5)
#> `summarise()` has grouped output by 'playerID'. You can override using the
#> `.groups` argument.
#> # A tibble: 0 × 3
#> # Groups:   playerID [0]
#> # ℹ 3 variables: playerID <chr>, lgID <fct>, yrs_top3 <int>
# Ditto for MVP awards
# Top 3 votegetters for MVP award by year and league
MVP_top3 <- AwardsSharePlayers %>% 
              filter(awardID == "MVP") %>%
              group_by(yearID, lgID) %>% 
              arrange(desc(pointsWon)) %>%
              do(head(., 3))
tail(MVP_top3)
#> # A tibble: 0 × 7
#> # Groups:   yearID, lgID [0]
#> # ℹ 7 variables: awardID <chr>, yearID <int>, lgID <fct>, playerID <chr>,
#> #   pointsWon <int>, pointsMax <int>, votesFirst <int>
## Select players with >= 7 top 3 finishes
MVP_top3 %>% 
  group_by(playerID) %>%
  summarise(n_top3 = n()) %>%
  arrange(desc(n_top3)) %>%
  filter(n_top3 > 6)
#> # A tibble: 0 × 2
#> # ℹ 2 variables: playerID <chr>, n_top3 <int>