import pandas as pd
# Print the installed pandas version.
print(pd.__version__)
1.0.3
# IPython/Jupyter-only help syntax: shows the documentation of pd.read_csv.
# (In plain Python the equivalent is help(pd.read_csv).)
?pd.read_csv
# Load the tab-separated players file into a DataFrame and preview the
# first rows.
df = pd.read_csv("./NBAPlayers.txt",sep = '\t')
df.head()
| Player | height | weight | collage | born | birth_city | birth_state |
|---|
| 0 | Curly Armstrong | 180.0 | 77.0 | Indiana University | 1918.0 | NaN | NaN |
|---|
| 1 | Cliff Barker | 188.0 | 83.0 | University of Kentucky | 1921.0 | Yorktown | Indiana |
|---|
| 2 | Leo Barnhorst | 193.0 | 86.0 | University of Notre Dame | 1924.0 | NaN | NaN |
|---|
| 3 | Ed Bartels | 196.0 | 88.0 | North Carolina State University | 1925.0 | NaN | NaN |
|---|
| 4 | Ralph Beard | 178.0 | 79.0 | University of Kentucky | 1927.0 | Hardinsburg | Kentucky |
|---|
# Select the 'Player' column by label with bracket indexing (gives a Series).
df['Player']
0 Curly Armstrong
1 Cliff Barker
2 Leo Barnhorst
3 Ed Bartels
4 Ralph Beard
...
3917 Troy Williams
3918 Kyle Wiltjer
3919 Stephen Zimmerman
3920 Paul Zipser
3921 Ivica Zubac
Name: Player, Length: 3922, dtype: object
# Same column selected by integer position: all rows, column 0.
df.iloc[:,0]
0 Curly Armstrong
1 Cliff Barker
2 Leo Barnhorst
3 Ed Bartels
4 Ralph Beard
...
3917 Troy Williams
3918 Kyle Wiltjer
3919 Stephen Zimmerman
3920 Paul Zipser
3921 Ivica Zubac
Name: Player, Length: 3922, dtype: object
# Same column selected by label through .loc: all rows, column 'Player'.
df.loc[:,'Player']
0 Curly Armstrong
1 Cliff Barker
2 Leo Barnhorst
3 Ed Bartels
4 Ralph Beard
...
3917 Troy Williams
3918 Kyle Wiltjer
3919 Stephen Zimmerman
3920 Paul Zipser
3921 Ivica Zubac
Name: Player, Length: 3922, dtype: object
# Build a Series from a dict: the dict keys become the index labels.
a = dict(name="xiaoming", age=18, sex="male")
pd.Series(a)
name xiaoming
age 18
sex male
dtype: object
# Enumerating a dict walks its keys, yielding (position, key) pairs.
list(enumerate(a))
[(0, 'name'), (1, 'age'), (2, 'sex')]
# A Series built from a list of values with explicit single-letter labels.
b = list(range(1, 7))
s1 = pd.Series(b, index=["a", "b", "c", "d", "e", "f"])
s1
a 1
b 2
c 3
d 4
e 5
f 6
dtype: int64
# .values exposes the Series data as a NumPy array (index labels are dropped).
s1.values
array([1, 2, 3, 4, 5, 6], dtype=int64)
# Count how many times each distinct value occurs in the Series.
s1.value_counts()
6 1
5 1
4 1
3 1
2 1
1 1
dtype: int64
# Two ways to construct a DataFrame.
# 1) From a nested list: each inner list becomes one row.
b = [
    [1, 2, 3, 4],
    ["a", "b", "c", "d"],
]
pd.DataFrame(b)
pd.DataFrame(b, index=["E", "F"], columns=["A", "B", "C", "D"])
# 2) From a dict of scalars: an explicit index is supplied and the scalar
#    values are repeated for every index label.
a = dict(name="xiaoming", age=18, sex="male")
pd.DataFrame(a, index=["A", "B"])
| name | age | sex |
|---|
| A | xiaoming | 18 | male |
|---|
| B | xiaoming | 18 | male |
|---|
# Preview the players table again (column names are still the originals).
df.head()
| Player | height | weight | collage | born | birth_city | birth_state |
|---|
| 0 | Curly Armstrong | 180.0 | 77.0 | Indiana University | 1918.0 | NaN | NaN |
|---|
| 1 | Cliff Barker | 188.0 | 83.0 | University of Kentucky | 1921.0 | Yorktown | Indiana |
|---|
| 2 | Leo Barnhorst | 193.0 | 86.0 | University of Notre Dame | 1924.0 | NaN | NaN |
|---|
| 3 | Ed Bartels | 196.0 | 88.0 | North Carolina State University | 1925.0 | NaN | NaN |
|---|
| 4 | Ralph Beard | 178.0 | 79.0 | University of Kentucky | 1927.0 | Hardinsburg | Kentucky |
|---|
# Rename three columns; inplace=True modifies df itself instead of returning
# a renamed copy.  Then preview the result.
df.rename(columns={'height':'Height','collage':'Collage','birth_city':'Birth_city'},inplace=True)
df.head()
| Player | Height | weight | Collage | born | Birth_city | birth_state |
|---|
| 0 | Curly Armstrong | 180.0 | 77.0 | Indiana University | 1918.0 | NaN | NaN |
|---|
| 1 | Cliff Barker | 188.0 | 83.0 | University of Kentucky | 1921.0 | Yorktown | Indiana |
|---|
| 2 | Leo Barnhorst | 193.0 | 86.0 | University of Notre Dame | 1924.0 | NaN | NaN |
|---|
| 3 | Ed Bartels | 196.0 | 88.0 | North Carolina State University | 1925.0 | NaN | NaN |
|---|
| 4 | Ralph Beard | 178.0 | 79.0 | University of Kentucky | 1927.0 | Hardinsburg | Kentucky |
|---|
# Sort by 'Collage' first and by 'Height' within equal colleges.  Rows with a
# missing 'Collage' end up last (see output).  The result is only displayed,
# not assigned.
df.sort_values(by =['Collage','Height'])
| Player | Height | weight | Collage | born | Birth_city | birth_state |
|---|
| 803 | Brian Heaney | 188.0 | 81.0 | Acadia University | 1946.0 | NaN | NaN |
|---|
| 3468 | Mickell Gladness | 211.0 | 99.0 | Alabama A&M University | 1986.0 | Birmingham | Alabama |
|---|
| 1501 | Kevin Loder | 198.0 | 92.0 | Alabama State University | 1959.0 | Cassopolis | Michigan |
|---|
| 1368 | Major Jones | 206.0 | 102.0 | Albany State University | 1953.0 | McGhee | Arkansas |
|---|
| 1613 | Charles Jones | 206.0 | 97.0 | Albany State University | 1957.0 | McGehee | Arkansas |
|---|
| ... | ... | ... | ... | ... | ... | ... | ... |
|---|
| 3018 | Peter John | 226.0 | 117.0 | NaN | 1985.0 | NaN | NaN |
|---|
| 2249 | P.J. Brown | 229.0 | 106.0 | NaN | 1972.0 | NaN | NaN |
|---|
| 2878 | Yao Ming* | 229.0 | 140.0 | NaN | 1980.0 | Shanghai | China |
|---|
| 2297 | Gheorghe Muresan | 231.0 | 137.0 | NaN | 1971.0 | Triteni | Romania |
|---|
| 223 | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
|---|
3922 rows × 7 columns
# Nested-dict form of replace: in column 'Player' only, substitute
# 'Curly Armstrong' with 'xiaozhao'.  The result is only displayed, not
# assigned.
df.replace({'Player':{'Curly Armstrong':'xiaozhao'}})
| Player | Height | weight | Collage | born | Birth_city | birth_state |
|---|
| 0 | xiaozhao | 180.0 | 77.0 | Indiana University | 1918.0 | NaN | NaN |
|---|
| 1 | Cliff Barker | 188.0 | 83.0 | University of Kentucky | 1921.0 | Yorktown | Indiana |
|---|
| 2 | Leo Barnhorst | 193.0 | 86.0 | University of Notre Dame | 1924.0 | NaN | NaN |
|---|
| 3 | Ed Bartels | 196.0 | 88.0 | North Carolina State University | 1925.0 | NaN | NaN |
|---|
| 4 | Ralph Beard | 178.0 | 79.0 | University of Kentucky | 1927.0 | Hardinsburg | Kentucky |
|---|
| ... | ... | ... | ... | ... | ... | ... | ... |
|---|
| 3917 | Troy Williams | 198.0 | 97.0 | South Carolina State University | 1969.0 | Columbia | South Carolina |
|---|
| 3918 | Kyle Wiltjer | 208.0 | 108.0 | Gonzaga University | 1992.0 | Portland | Oregon |
|---|
| 3919 | Stephen Zimmerman | 213.0 | 108.0 | University of Nevada, Las Vegas | 1996.0 | Hendersonville | Tennessee |
|---|
| 3920 | Paul Zipser | 203.0 | 97.0 | NaN | 1994.0 | Heidelberg | Germany |
|---|
| 3921 | Ivica Zubac | 216.0 | 120.0 | NaN | 1997.0 | Mostar | Bosnia and Herzegovina |
|---|
3922 rows × 7 columns
# Column-wise minimum of the numeric columns.  numeric_only=True makes the
# restriction explicit: the text columns contain missing values and cannot be
# compared, and newer pandas versions raise instead of silently skipping them.
df.min(numeric_only=True)
Height 160.0
weight 60.0
born 1913.0
dtype: float64
import numpy as np
# Frequency of each birth year, most common first.  Uses the Series method
# (as done for s1 earlier in this file) rather than the deprecated top-level
# pd.value_counts function.
df['born'].value_counts()
1970.0 84
1964.0 77
1955.0 76
1968.0 74
1984.0 73
..
1917.0 6
1918.0 5
1915.0 2
1914.0 1
1913.0 1
Name: born, Length: 84, dtype: int64
# Column-wise totals (axis=0 adds down the rows).  numeric_only=True limits
# the sum to the numeric columns explicitly; text columns with missing values
# cannot be summed, and newer pandas versions raise instead of skipping them.
df.sum(axis=0, numeric_only=True)
Height 779122.0
weight 371645.0
born 7694491.0
dtype: float64
# A 3x6 integer matrix used to illustrate the `axis` argument of sum().
a = np.array(
    [
        [1, 2, 3, 4, 5, 56],
        [3, 4, 5, 1, 7, 3],
        [29, 3, 1, 6, 2, 0],
    ]
)
# With no axis given, every element is added into a single scalar.
a.sum()
135
# axis=1 adds across the columns, giving one total per row (3 values).
a.sum(axis=1)
array([71, 23, 41])
# axis=0 adds down the rows, giving one total per column (6 values).
a.sum(axis=0)
array([33, 9, 9, 11, 14, 59])
# Boolean Series that is True where 'Player' is missing.
pd.isnull(df['Player'])
0 False
1 False
2 False
3 False
4 False
...
3917 False
3918 False
3919 False
3920 False
3921 False
Name: Player, Length: 3922, dtype: bool
# Drop every row (axis=0) that has at least one missing value (how='any').
# The result is a new frame; df is not modified.
# `thresh` is deliberately not passed: pandas >= 1.5 raises a TypeError when
# both `how` and `thresh` are supplied, even as thresh=None.  The remaining
# arguments of the original call were plain defaults.
df.dropna(axis=0, how='any')
| Player | Height | weight | Collage | born | Birth_city | birth_state |
|---|
| 1 | Cliff Barker | 188.0 | 83.0 | University of Kentucky | 1921.0 | Yorktown | Indiana |
|---|
| 4 | Ralph Beard | 178.0 | 79.0 | University of Kentucky | 1927.0 | Hardinsburg | Kentucky |
|---|
| 6 | Charlie Black | 196.0 | 90.0 | University of Kansas | 1921.0 | Arco | Idaho |
|---|
| 7 | Nelson Bobb | 183.0 | 77.0 | Temple University | 1924.0 | Philadelphia | Pennsylvania |
|---|
| 8 | Jake Bornheimer | 196.0 | 90.0 | Muhlenberg College | 1927.0 | New Brunswick | New Jersey |
|---|
| ... | ... | ... | ... | ... | ... | ... | ... |
|---|
| 3915 | Okaro White | 203.0 | 92.0 | Florida State University | 1992.0 | Clearwater | Florida |
|---|
| 3916 | Isaiah Whitehead | 193.0 | 96.0 | Seton Hall University | 1995.0 | Brooklyn | New York |
|---|
| 3917 | Troy Williams | 198.0 | 97.0 | South Carolina State University | 1969.0 | Columbia | South Carolina |
|---|
| 3918 | Kyle Wiltjer | 208.0 | 108.0 | Gonzaga University | 1992.0 | Portland | Oregon |
|---|
| 3919 | Stephen Zimmerman | 213.0 | 108.0 | University of Nevada, Las Vegas | 1996.0 | Hendersonville | Tennessee |
|---|
3189 rows × 7 columns
# Replace every missing value with 0 and return a new frame (df itself is not
# modified).  Only `value` is passed: the other arguments of the original
# call were defaults, and `method` / `downcast` are deprecated or removed in
# newer pandas releases, so naming them makes the call fail there.
df.fillna(value=0)
| Player | Height | weight | Collage | born | Birth_city | birth_state |
|---|
| 0 | Curly Armstrong | 180.0 | 77.0 | Indiana University | 1918.0 | 0 | 0 |
|---|
| 1 | Cliff Barker | 188.0 | 83.0 | University of Kentucky | 1921.0 | Yorktown | Indiana |
|---|
| 2 | Leo Barnhorst | 193.0 | 86.0 | University of Notre Dame | 1924.0 | 0 | 0 |
|---|
| 3 | Ed Bartels | 196.0 | 88.0 | North Carolina State University | 1925.0 | 0 | 0 |
|---|
| 4 | Ralph Beard | 178.0 | 79.0 | University of Kentucky | 1927.0 | Hardinsburg | Kentucky |
|---|
| ... | ... | ... | ... | ... | ... | ... | ... |
|---|
| 3917 | Troy Williams | 198.0 | 97.0 | South Carolina State University | 1969.0 | Columbia | South Carolina |
|---|
| 3918 | Kyle Wiltjer | 208.0 | 108.0 | Gonzaga University | 1992.0 | Portland | Oregon |
|---|
| 3919 | Stephen Zimmerman | 213.0 | 108.0 | University of Nevada, Las Vegas | 1996.0 | Hendersonville | Tennessee |
|---|
| 3920 | Paul Zipser | 203.0 | 97.0 | 0 | 1994.0 | Heidelberg | Germany |
|---|
| 3921 | Ivica Zubac | 216.0 | 120.0 | 0 | 1997.0 | Mostar | Bosnia and Herzegovina |
|---|
3922 rows × 7 columns
# Sample strings; several entries carry leading or trailing spaces.
s = pd.Series(
    ["A", "B", "C", "Aaba ", " Baca", "CABA ", "dog", "cat"]
)
# Vectorised whitespace trimming through the .str accessor.
s.str.strip()
0 A
1 B
2 C
3 Aaba
4 Baca
5 CABA
6 dog
7 cat
dtype: object
# Upper-case every element; s itself is left unchanged.
s.str.upper()
0 A
1 B
2 C
3 AABA
4 BACA
5 CABA
6 DOG
7 CAT
dtype: object
# Boolean-mask selection: keep the entries whose trimmed text ends with a
# lowercase "a" (the test is case-sensitive, so 'CABA ' is excluded).  The
# mask is applied to s, so the selected values are the original, untrimmed
# strings.
s[s.str.strip().str.endswith("a")]
3 Aaba
4 Baca
dtype: object
# Row filter with a boolean mask: keep players whose Height is at least 180.
df.loc[df['Height']>=180]
| Player | Height | weight | Collage | born | Birth_city | birth_state |
|---|
| 0 | Curly Armstrong | 180.0 | 77.0 | Indiana University | 1918.0 | NaN | NaN |
|---|
| 1 | Cliff Barker | 188.0 | 83.0 | University of Kentucky | 1921.0 | Yorktown | Indiana |
|---|
| 2 | Leo Barnhorst | 193.0 | 86.0 | University of Notre Dame | 1924.0 | NaN | NaN |
|---|
| 3 | Ed Bartels | 196.0 | 88.0 | North Carolina State University | 1925.0 | NaN | NaN |
|---|
| 5 | Gene Berce | 180.0 | 79.0 | Marquette University | 1926.0 | NaN | NaN |
|---|
| ... | ... | ... | ... | ... | ... | ... | ... |
|---|
| 3917 | Troy Williams | 198.0 | 97.0 | South Carolina State University | 1969.0 | Columbia | South Carolina |
|---|
| 3918 | Kyle Wiltjer | 208.0 | 108.0 | Gonzaga University | 1992.0 | Portland | Oregon |
|---|
| 3919 | Stephen Zimmerman | 213.0 | 108.0 | University of Nevada, Las Vegas | 1996.0 | Hendersonville | Tennessee |
|---|
| 3920 | Paul Zipser | 203.0 | 97.0 | NaN | 1994.0 | Heidelberg | Germany |
|---|
| 3921 | Ivica Zubac | 216.0 | 120.0 | NaN | 1997.0 | Mostar | Bosnia and Herzegovina |
|---|
3869 rows × 7 columns
# All rows, restricted to three columns given as a list of labels.
df.loc[:,['Player','Collage','Birth_city']]
| Player | Collage | Birth_city |
|---|
| 0 | Curly Armstrong | Indiana University | NaN |
|---|
| 1 | Cliff Barker | University of Kentucky | Yorktown |
|---|
| 2 | Leo Barnhorst | University of Notre Dame | NaN |
|---|
| 3 | Ed Bartels | North Carolina State University | NaN |
|---|
| 4 | Ralph Beard | University of Kentucky | Hardinsburg |
|---|
| ... | ... | ... | ... |
|---|
| 3917 | Troy Williams | South Carolina State University | Columbia |
|---|
| 3918 | Kyle Wiltjer | Gonzaga University | Portland |
|---|
| 3919 | Stephen Zimmerman | University of Nevada, Las Vegas | Hendersonville |
|---|
| 3920 | Paul Zipser | NaN | Heidelberg |
|---|
| 3921 | Ivica Zubac | NaN | Mostar |
|---|
3922 rows × 3 columns
# Combine two row conditions with the element-wise & operator.  Each
# comparison is parenthesised because & binds more tightly than >=.
df.loc[(df['Height']>=180) & (df['weight']>=80)]
| Player | Height | weight | Collage | born | Birth_city | birth_state |
|---|
| 1 | Cliff Barker | 188.0 | 83.0 | University of Kentucky | 1921.0 | Yorktown | Indiana |
|---|
| 2 | Leo Barnhorst | 193.0 | 86.0 | University of Notre Dame | 1924.0 | NaN | NaN |
|---|
| 3 | Ed Bartels | 196.0 | 88.0 | North Carolina State University | 1925.0 | NaN | NaN |
|---|
| 6 | Charlie Black | 196.0 | 90.0 | University of Kansas | 1921.0 | Arco | Idaho |
|---|
| 8 | Jake Bornheimer | 196.0 | 90.0 | Muhlenberg College | 1927.0 | New Brunswick | New Jersey |
|---|
| ... | ... | ... | ... | ... | ... | ... | ... |
|---|
| 3917 | Troy Williams | 198.0 | 97.0 | South Carolina State University | 1969.0 | Columbia | South Carolina |
|---|
| 3918 | Kyle Wiltjer | 208.0 | 108.0 | Gonzaga University | 1992.0 | Portland | Oregon |
|---|
| 3919 | Stephen Zimmerman | 213.0 | 108.0 | University of Nevada, Las Vegas | 1996.0 | Hendersonville | Tennessee |
|---|
| 3920 | Paul Zipser | 203.0 | 97.0 | NaN | 1994.0 | Heidelberg | Germany |
|---|
| 3921 | Ivica Zubac | 216.0 | 120.0 | NaN | 1997.0 | Mostar | Bosnia and Herzegovina |
|---|
3543 rows × 7 columns
# Rebind df to the movie dataset (comma-separated, default settings) and
# preview it.  From here on df no longer refers to the players table.
df = pd.read_csv("movie.csv")
df.head()
| color | director_name | num_critic_for_reviews | duration | director_facebook_likes | actor_3_facebook_likes | actor_2_name | actor_1_facebook_likes | gross | genres | ... | num_user_for_reviews | language | country | content_rating | budget | title_year | actor_2_facebook_likes | imdb_score | aspect_ratio | movie_facebook_likes |
|---|
| 0 | Color | James Cameron | 723.0 | 178.0 | 0.0 | 855.0 | Joel David Moore | 1000.0 | 760505847.0 | Action|Adventure|Fantasy|Sci-Fi | ... | 3054.0 | English | USA | PG-13 | 237000000.0 | 2009.0 | 936.0 | 7.9 | 1.78 | 33000 |
|---|
| 1 | Color | Gore Verbinski | 302.0 | 169.0 | 563.0 | 1000.0 | Orlando Bloom | 40000.0 | 309404152.0 | Action|Adventure|Fantasy | ... | 1238.0 | English | USA | PG-13 | 300000000.0 | 2007.0 | 5000.0 | 7.1 | 2.35 | 0 |
|---|
| 2 | Color | Sam Mendes | 602.0 | 148.0 | 0.0 | 161.0 | Rory Kinnear | 11000.0 | 200074175.0 | Action|Adventure|Thriller | ... | 994.0 | English | UK | PG-13 | 245000000.0 | 2015.0 | 393.0 | 6.8 | 2.35 | 85000 |
|---|
| 3 | Color | Christopher Nolan | 813.0 | 164.0 | 22000.0 | 23000.0 | Christian Bale | 27000.0 | 448130642.0 | Action|Thriller | ... | 2701.0 | English | USA | PG-13 | 250000000.0 | 2012.0 | 23000.0 | 8.5 | 2.35 | 164000 |
|---|
| 4 | NaN | Doug Walker | NaN | NaN | 131.0 | NaN | Rob Walker | 131.0 | NaN | Documentary | ... | NaN | NaN | NaN | NaN | NaN | NaN | 12.0 | 7.1 | NaN | 0 |
|---|
5 rows × 28 columns
# Preview the movie table again (same output as the previous cell).
df.head()
| color | director_name | num_critic_for_reviews | duration | director_facebook_likes | actor_3_facebook_likes | actor_2_name | actor_1_facebook_likes | gross | genres | ... | num_user_for_reviews | language | country | content_rating | budget | title_year | actor_2_facebook_likes | imdb_score | aspect_ratio | movie_facebook_likes |
|---|
| 0 | Color | James Cameron | 723.0 | 178.0 | 0.0 | 855.0 | Joel David Moore | 1000.0 | 760505847.0 | Action|Adventure|Fantasy|Sci-Fi | ... | 3054.0 | English | USA | PG-13 | 237000000.0 | 2009.0 | 936.0 | 7.9 | 1.78 | 33000 |
|---|
| 1 | Color | Gore Verbinski | 302.0 | 169.0 | 563.0 | 1000.0 | Orlando Bloom | 40000.0 | 309404152.0 | Action|Adventure|Fantasy | ... | 1238.0 | English | USA | PG-13 | 300000000.0 | 2007.0 | 5000.0 | 7.1 | 2.35 | 0 |
|---|
| 2 | Color | Sam Mendes | 602.0 | 148.0 | 0.0 | 161.0 | Rory Kinnear | 11000.0 | 200074175.0 | Action|Adventure|Thriller | ... | 994.0 | English | UK | PG-13 | 245000000.0 | 2015.0 | 393.0 | 6.8 | 2.35 | 85000 |
|---|
| 3 | Color | Christopher Nolan | 813.0 | 164.0 | 22000.0 | 23000.0 | Christian Bale | 27000.0 | 448130642.0 | Action|Thriller | ... | 2701.0 | English | USA | PG-13 | 250000000.0 | 2012.0 | 23000.0 | 8.5 | 2.35 | 164000 |
|---|
| 4 | NaN | Doug Walker | NaN | NaN | 131.0 | NaN | Rob Walker | 131.0 | NaN | Documentary | ... | NaN | NaN | NaN | NaN | NaN | NaN | 12.0 | 7.1 | NaN | 0 |
|---|
5 rows × 28 columns
# Reload the players file, so df holds the players table with its original
# (un-renamed) column names again.
df = pd.read_csv("./NBAPlayers.txt",sep = '\t')
df.head()
| Player | height | weight | collage | born | birth_city | birth_state |
|---|
| 0 | Curly Armstrong | 180.0 | 77.0 | Indiana University | 1918.0 | NaN | NaN |
|---|
| 1 | Cliff Barker | 188.0 | 83.0 | University of Kentucky | 1921.0 | Yorktown | Indiana |
|---|
| 2 | Leo Barnhorst | 193.0 | 86.0 | University of Notre Dame | 1924.0 | NaN | NaN |
|---|
| 3 | Ed Bartels | 196.0 | 88.0 | North Carolina State University | 1925.0 | NaN | NaN |
|---|
| 4 | Ralph Beard | 178.0 | 79.0 | University of Kentucky | 1927.0 | Hardinsburg | Kentucky |
|---|
# Build a three-level row index: append=True keeps the existing integer index
# as the first level and adds birth_city and birth_state after it;
# drop=False also keeps both as ordinary columns.
new_df = df.set_index(keys=['birth_city','birth_state'],append=True,drop = False)
new_df.head()
| | | Player | height | weight | collage | born | birth_city | birth_state |
|---|
| birth_city | birth_state | | | | | | | |
|---|
| 0 | NaN | NaN | Curly Armstrong | 180.0 | 77.0 | Indiana University | 1918.0 | NaN | NaN |
|---|
| 1 | Yorktown | Indiana | Cliff Barker | 188.0 | 83.0 | University of Kentucky | 1921.0 | Yorktown | Indiana |
|---|
| 2 | NaN | NaN | Leo Barnhorst | 193.0 | 86.0 | University of Notre Dame | 1924.0 | NaN | NaN |
|---|
| 3 | NaN | NaN | Ed Bartels | 196.0 | 88.0 | North Carolina State University | 1925.0 | NaN | NaN |
|---|
| 4 | Hardinsburg | Kentucky | Ralph Beard | 178.0 | 79.0 | University of Kentucky | 1927.0 | Hardinsburg | Kentucky |
|---|
# Sort the three-level index in place, placing missing index values last,
# then display the frame.
new_df.sort_index(na_position="last",inplace=True)
new_df
| | | Player | height | weight | collage | born | birth_city | birth_state |
|---|
| birth_city | birth_state | | | | | | | |
|---|
| 0 | NaN | NaN | Curly Armstrong | 180.0 | 77.0 | Indiana University | 1918.0 | NaN | NaN |
|---|
| 1 | Yorktown | Indiana | Cliff Barker | 188.0 | 83.0 | University of Kentucky | 1921.0 | Yorktown | Indiana |
|---|
| 2 | NaN | NaN | Leo Barnhorst | 193.0 | 86.0 | University of Notre Dame | 1924.0 | NaN | NaN |
|---|
| 3 | NaN | NaN | Ed Bartels | 196.0 | 88.0 | North Carolina State University | 1925.0 | NaN | NaN |
|---|
| 4 | Hardinsburg | Kentucky | Ralph Beard | 178.0 | 79.0 | University of Kentucky | 1927.0 | Hardinsburg | Kentucky |
|---|
| ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
|---|
| 3917 | Columbia | South Carolina | Troy Williams | 198.0 | 97.0 | South Carolina State University | 1969.0 | Columbia | South Carolina |
|---|
| 3918 | Portland | Oregon | Kyle Wiltjer | 208.0 | 108.0 | Gonzaga University | 1992.0 | Portland | Oregon |
|---|
| 3919 | Hendersonville | Tennessee | Stephen Zimmerman | 213.0 | 108.0 | University of Nevada, Las Vegas | 1996.0 | Hendersonville | Tennessee |
|---|
| 3920 | Heidelberg | Germany | Paul Zipser | 203.0 | 97.0 | NaN | 1994.0 | Heidelberg | Germany |
|---|
| 3921 | Mostar | Bosnia and Herzegovina | Ivica Zubac | 216.0 | 120.0 | NaN | 1997.0 | Mostar | Bosnia and Herzegovina |
|---|
3922 rows × 7 columns
# MultiIndex selection with a tuple of per-level selectors:
#   level 0 (row number)  -> slice(None): anything
#   level 1 (birth_city)  -> one of the three listed cities
#   level 2 (birth_state) -> slice(None): anything
# The trailing ':' keeps all columns.
new_df.loc[(slice(None),['Akron','Ahvaz','Albany'],slice(None)),:]
| | | Player | height | weight | collage | born | birth_city | birth_state |
|---|
| birth_city | birth_state | | | | | | | |
|---|
| 71 | Albany | Texas | Chick Halbert | 206.0 | 102.0 | West Texas A&M University | 1919.0 | Albany | Texas |
|---|
| 539 | Akron | Ohio | Jimmy Darrow | 178.0 | 77.0 | Bowling Green State University | 1937.0 | Akron | Ohio |
|---|
| 609 | Akron | Ohio | Gus Johnson* | 198.0 | 104.0 | University of Idaho | 1938.0 | Akron | Ohio |
|---|
| 620 | Akron | Ohio | Nate Thurmond* | 211.0 | 102.0 | Bowling Green State University | 1941.0 | Akron | Ohio |
|---|
| 1028 | Albany | Georgia | Ben Clyde | 201.0 | 89.0 | Florida State University | 1951.0 | Albany | Georgia |
|---|
| 1927 | Akron | Ohio | Jerome Lane | 198.0 | 104.0 | University of Pittsburgh | 1966.0 | Akron | Ohio |
|---|
| 2374 | Albany | Georgia | Dontonio Wingfield | 203.0 | 116.0 | University of Cincinnati | 1974.0 | Albany | Georgia |
|---|
| 2756 | Albany | Georgia | Lavor Postell | 196.0 | 97.0 | St. John's University | 1978.0 | Albany | Georgia |
|---|
| 2882 | Akron | Ohio | Chris Owens | 201.0 | 111.0 | University of Texas at Austin | 1979.0 | Akron | Ohio |
|---|
| 2944 | Akron | Ohio | LeBron James | 203.0 | 113.0 | NaN | 1984.0 | Akron | Ohio |
|---|
| 2985 | Albany | New York | Lionel Chalmers | 183.0 | 81.0 | Xavier University | 1980.0 | Albany | New York |
|---|
| 3163 | Albany | Georgia | Alexander Johnson | 206.0 | 108.0 | Florida State University | 1983.0 | Albany | Georgia |
|---|
| 3287 | Ahvaz | Islamic Republic of Iran | Hamed Haddadi | 218.0 | 115.0 | NaN | 1985.0 | Ahvaz | Islamic Republic of Iran |
|---|
| 3343 | Akron | Ohio | Stephen Curry | 190.0 | 86.0 | Davidson College | 1988.0 | Akron | Ohio |
|---|
# pd.IndexSlice builds MultiIndex slicers for .loc.  It is bound here, at its
# first use, so that the file runs top to bottom without a NameError.
idx = pd.IndexSlice
# Rows whose first index level lies in 0..500 (label slice, end inclusive:
# 501 rows), any value on the next level; all columns.
new_df.loc[idx[0:500, :], :]
| | | Player | height | weight | collage | born | birth_city | birth_state |
|---|
| birth_city | birth_state | | | | | | | |
|---|
| 0 | NaN | NaN | Curly Armstrong | 180.0 | 77.0 | Indiana University | 1918.0 | NaN | NaN |
|---|
| 1 | Yorktown | Indiana | Cliff Barker | 188.0 | 83.0 | University of Kentucky | 1921.0 | Yorktown | Indiana |
|---|
| 2 | NaN | NaN | Leo Barnhorst | 193.0 | 86.0 | University of Notre Dame | 1924.0 | NaN | NaN |
|---|
| 3 | NaN | NaN | Ed Bartels | 196.0 | 88.0 | North Carolina State University | 1925.0 | NaN | NaN |
|---|
| 4 | Hardinsburg | Kentucky | Ralph Beard | 178.0 | 79.0 | University of Kentucky | 1927.0 | Hardinsburg | Kentucky |
|---|
| ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
|---|
| 496 | Dayton | Ohio | Johnny Green | 196.0 | 90.0 | Michigan State University | 1933.0 | Dayton | Ohio |
|---|
| 497 | Duryea | Pennsylvania | Gene Guarilia | 196.0 | 99.0 | George Washington University | 1937.0 | Duryea | Pennsylvania |
|---|
| 498 | Chicago | Illinois | Tom Hawkins | 196.0 | 95.0 | University of Notre Dame | 1936.0 | Chicago | Illinois |
|---|
| 499 | Middleton | Tennessee | Bailey Howell* | 201.0 | 95.0 | Mississippi State University | 1937.0 | Middleton | Tennessee |
|---|
| 500 | NaN | NaN | Maury King | 188.0 | 88.0 | University of Kansas | 1935.0 | NaN | NaN |
|---|
501 rows × 7 columns
# Keep all rows of df but only the three listed columns, then display them.
new_df_1 = df.loc[:,['birth_city',"birth_state",'collage']]
new_df_1
| birth_city | birth_state | collage |
|---|
| 0 | NaN | NaN | Indiana University |
|---|
| 1 | Yorktown | Indiana | University of Kentucky |
|---|
| 2 | NaN | NaN | University of Notre Dame |
|---|
| 3 | NaN | NaN | North Carolina State University |
|---|
| 4 | Hardinsburg | Kentucky | University of Kentucky |
|---|
| ... | ... | ... | ... |
|---|
| 3917 | Columbia | South Carolina | South Carolina State University |
|---|
| 3918 | Portland | Oregon | Gonzaga University |
|---|
| 3919 | Hendersonville | Tennessee | University of Nevada, Las Vegas |
|---|
| 3920 | Heidelberg | Germany | NaN |
|---|
| 3921 | Mostar | Bosnia and Herzegovina | NaN |
|---|
3922 rows × 3 columns
# Same three-level index as new_df, built again from df under the name df_1.
df_1 = df.set_index(keys=['birth_city','birth_state'],append=True,drop = False)
# Rows 0..200 (first level) whose birth_city is Yorktown or Hardinsburg; the
# third level is left unspecified.  All columns.
df_1.loc[idx[0:200,["Yorktown","Hardinsburg"]],:]
| | | Player | height | weight | collage | born | birth_city | birth_state |
|---|
| birth_city | birth_state | | | | | | | |
|---|
| 1 | Yorktown | Indiana | Cliff Barker | 188.0 | 83.0 | University of Kentucky | 1921.0 | Yorktown | Indiana |
|---|
| 4 | Hardinsburg | Kentucky | Ralph Beard | 178.0 | 79.0 | University of Kentucky | 1927.0 | Hardinsburg | Kentucky |
|---|
| 154 | Yorktown | Indiana | Jack Parkinson | 183.0 | 78.0 | University of Kentucky | 1924.0 | Yorktown | Indiana |
|---|
# Store the same selection (rows 0..200 born in Yorktown or Hardinsburg) as
# df_2 and display it.
df_2 = df_1.loc[idx[0:200,["Yorktown","Hardinsburg"]],:]
df_2
| | | Player | height | weight | collage | born | birth_city | birth_state |
|---|
| birth_city | birth_state | | | | | | | |
|---|
| 1 | Yorktown | Indiana | Cliff Barker | 188.0 | 83.0 | University of Kentucky | 1921.0 | Yorktown | Indiana |
|---|
| 4 | Hardinsburg | Kentucky | Ralph Beard | 178.0 | 79.0 | University of Kentucky | 1927.0 | Hardinsburg | Kentucky |
|---|
| 154 | Yorktown | Indiana | Jack Parkinson | 183.0 | 78.0 | University of Kentucky | 1924.0 | Yorktown | Indiana |
|---|
# Keep only the Player and collage columns of the small selection.
df_3 = df_2.loc[:,['Player','collage']]
# Rebuild df_1 with the same set_index call used earlier in this file.
df_1 = df.set_index(keys=['birth_city','birth_state'],append=True,drop = False)
# The empty list given for the third level (birth_state) matches no label,
# so the selection is empty, as the recorded output shows.
new_df.loc[idx[0:500,['Yorktown'],[]],:]
| | | Player | height | weight | collage | born | birth_city | birth_state |
|---|
| birth_city | birth_state | | | | | | | |
|---|
# NOTE(review): this expression is identical to the previous cell, which
# produced an empty frame, yet the output recorded below contains rows.  The
# output was presumably produced by a different version of this cell (e.g.
# with slice(None) instead of [] for the third level) - confirm and re-run.
new_df.loc[idx[0:500,['Yorktown'],[]],:]
| | | Player | height | weight | collage | born | birth_city | birth_state |
|---|
| birth_city | birth_state | | | | | | | |
|---|
| 1 | Yorktown | Indiana | Cliff Barker | 188.0 | 83.0 | University of Kentucky | 1921.0 | Yorktown | Indiana |
|---|
| 154 | Yorktown | Indiana | Jack Parkinson | 183.0 | 78.0 | University of Kentucky | 1924.0 | Yorktown | Indiana |
|---|
# Short alias for building MultiIndex slicers.
idx = pd.IndexSlice
# Rows: first level 0..20, birth_city 'Brooklyn', birth_state 'Ohio' or
# 'New York'.  Columns: label slice from the first column up to and
# including 'Player' (idx["Player"] simply evaluates to "Player").
new_df.loc[idx[0:20,['Brooklyn'],['Ohio','New York']],:idx["Player"]]
| | | Player |
|---|
| birth_city | birth_state | |
|---|
| 11 | Brooklyn | New York | Harry Boykoff |
|---|
| 14 | Brooklyn | New York | Carl Braun |
|---|
# Rows 0..200 (first level) whose birth_city is 'Hardinsburg'; all columns.
new_df.loc[idx[0:200,['Hardinsburg']],:]
| | | Player | height | weight | collage | born | birth_city | birth_state |
|---|
| birth_city | birth_state | | | | | | | |
|---|
| 4 | Hardinsburg | Kentucky | Ralph Beard | 178.0 | 79.0 | University of Kentucky | 1927.0 | Hardinsburg | Kentucky |
|---|
# First 21 rows by position (rows 0 through 20), matching the recorded output.
# The stray argument-less `np.concatenate()` call that followed was removed:
# concatenate requires a sequence of arrays, so the call raises a TypeError
# and, being the last line of the cell, kept this slice from being displayed.
df[0:21]
| Player | height | weight | collage | born | birth_city | birth_state |
|---|
| 0 | Curly Armstrong | 180.0 | 77.0 | Indiana University | 1918.0 | NaN | NaN |
|---|
| 1 | Cliff Barker | 188.0 | 83.0 | University of Kentucky | 1921.0 | Yorktown | Indiana |
|---|
| 2 | Leo Barnhorst | 193.0 | 86.0 | University of Notre Dame | 1924.0 | NaN | NaN |
|---|
| 3 | Ed Bartels | 196.0 | 88.0 | North Carolina State University | 1925.0 | NaN | NaN |
|---|
| 4 | Ralph Beard | 178.0 | 79.0 | University of Kentucky | 1927.0 | Hardinsburg | Kentucky |
|---|
| 5 | Gene Berce | 180.0 | 79.0 | Marquette University | 1926.0 | NaN | NaN |
|---|
| 6 | Charlie Black | 196.0 | 90.0 | University of Kansas | 1921.0 | Arco | Idaho |
|---|
| 7 | Nelson Bobb | 183.0 | 77.0 | Temple University | 1924.0 | Philadelphia | Pennsylvania |
|---|
| 8 | Jake Bornheimer | 196.0 | 90.0 | Muhlenberg College | 1927.0 | New Brunswick | New Jersey |
|---|
| 9 | Vince Boryla | 196.0 | 95.0 | University of Denver | 1927.0 | East Chicago | Indiana |
|---|
| 10 | Don Boven | 193.0 | 95.0 | Western Michigan University | 1925.0 | Kalamazoo | Michigan |
|---|
| 11 | Harry Boykoff | 208.0 | 102.0 | St. John's University | 1922.0 | Brooklyn | New York |
|---|
| 12 | Joe Bradley | 190.0 | 79.0 | Oklahoma State University | 1928.0 | Washington | Oklahoma |
|---|
| 13 | Bob Brannum | 196.0 | 97.0 | Michigan State University | 1925.0 | NaN | NaN |
|---|
| 14 | Carl Braun | 196.0 | 81.0 | Colgate University | 1927.0 | Brooklyn | New York |
|---|
| 15 | Frankie Brian | 185.0 | 81.0 | Louisiana State University | 1923.0 | Zachary | Louisiana |
|---|
| 16 | Price Brookfield | 193.0 | 83.0 | West Texas A&M University | 1920.0 | Floydada | Texas |
|---|
| 17 | Bob Brown | 193.0 | 92.0 | Miami University | 1923.0 | Versailles | Ohio |
|---|
| 18 | Jim Browne | 208.0 | 106.0 | NaN | 1930.0 | Midlothian | Illinois |
|---|
| 19 | Walt Budko | 196.0 | 99.0 | Columbia University | 1925.0 | Kearney | New Jersey |
|---|
| 20 | Jack Burmaster | 190.0 | 86.0 | University of Illinois at Urbana-Champaign | 1926.0 | NaN | NaN |
|---|
# header=None tells the parser the file has no header row: the real header
# line is read as data (row 0), columns are numbered 0..6, and the frame has
# one more row than before (3923).
pd.read_csv("./NBAPlayers.txt",sep='\t',header=None)
| 0 | 1 | 2 | 3 | 4 | 5 | 6 |
|---|
| 0 | Player | height | weight | collage | born | birth_city | birth_state |
|---|
| 1 | Curly Armstrong | 180 | 77 | Indiana University | 1918 | NaN | NaN |
|---|
| 2 | Cliff Barker | 188 | 83 | University of Kentucky | 1921 | Yorktown | Indiana |
|---|
| 3 | Leo Barnhorst | 193 | 86 | University of Notre Dame | 1924 | NaN | NaN |
|---|
| 4 | Ed Bartels | 196 | 88 | North Carolina State University | 1925 | NaN | NaN |
|---|
| ... | ... | ... | ... | ... | ... | ... | ... |
|---|
| 3918 | Troy Williams | 198 | 97 | South Carolina State University | 1969 | Columbia | South Carolina |
|---|
| 3919 | Kyle Wiltjer | 208 | 108 | Gonzaga University | 1992 | Portland | Oregon |
|---|
| 3920 | Stephen Zimmerman | 213 | 108 | University of Nevada, Las Vegas | 1996 | Hendersonville | Tennessee |
|---|
| 3921 | Paul Zipser | 203 | 97 | NaN | 1994 | Heidelberg | Germany |
|---|
| 3922 | Ivica Zubac | 216 | 120 | NaN | 1997 | Mostar | Bosnia and Herzegovina |
|---|
3923 rows × 7 columns
# Small 4x4 demo frame for set_index / reset_index: column X holds the
# strings X0..X3.
df = pd.DataFrame(
    {col: [f"{col}{i}" for i in range(4)] for col in "ABCD"}
)
# Move column 'A' into the index.  drop=True removes it from the columns; the
# other options of the original call were the defaults (append=False,
# inplace=False, verify_integrity=False).
drop_t = df.set_index("A", drop=True)
drop_t
| B | C | D |
|---|
| A | | | |
|---|
| A0 | B0 | C0 | D0 |
|---|
| A1 | B1 | C1 | D1 |
|---|
| A2 | B2 | C2 | D2 |
|---|
| A3 | B3 | C3 | D3 |
|---|
# Same operation with drop=False: 'A' becomes the index and also stays as a
# regular column.  The remaining options of the original call were defaults.
no_drop_t = df.set_index("A", drop=False)
no_drop_t
| A | B | C | D |
|---|
| A | | | | |
|---|
| A0 | A0 | B0 | C0 | D0 |
|---|
| A1 | A1 | B1 | C1 | D1 |
|---|
| A2 | A2 | B2 | C2 | D2 |
|---|
| A3 | A3 | B3 | C3 | D3 |
|---|
# Undo set_index: reset_index restores a 0..n-1 integer index, and with
# drop=False the old index ('A') is put back as a column.
reset_drop_t = drop_t.reset_index(drop=False)
reset_drop_t
| A | B | C | D |
|---|
| 0 | A0 | B0 | C0 | D0 |
|---|
| 1 | A1 | B1 | C1 | D1 |
|---|
| 2 | A2 | B2 | C2 | D2 |
|---|
| 3 | A3 | B3 | C3 | D3 |
|---|
# reset_index on a frame that already has the default integer index: the old
# index is added as a new column named 'index'.
# NOTE(review): at this point in the file df is the 4-row A-D demo frame, but
# the recorded output below shows the players table - presumably the cell was
# run while df still held the players data; confirm and re-run.
df_1 = df.reset_index(drop=False)
df_1
| index | Player | height | weight | collage | born | birth_city | birth_state |
|---|
| 0 | 0 | Curly Armstrong | 180.0 | 77.0 | Indiana University | 1918.0 | NaN | NaN |
|---|
| 1 | 1 | Cliff Barker | 188.0 | 83.0 | University of Kentucky | 1921.0 | Yorktown | Indiana |
|---|
| 2 | 2 | Leo Barnhorst | 193.0 | 86.0 | University of Notre Dame | 1924.0 | NaN | NaN |
|---|
| 3 | 3 | Ed Bartels | 196.0 | 88.0 | North Carolina State University | 1925.0 | NaN | NaN |
|---|
| 4 | 4 | Ralph Beard | 178.0 | 79.0 | University of Kentucky | 1927.0 | Hardinsburg | Kentucky |
|---|
| ... | ... | ... | ... | ... | ... | ... | ... | ... |
|---|
| 3917 | 3917 | Troy Williams | 198.0 | 97.0 | South Carolina State University | 1969.0 | Columbia | South Carolina |
|---|
| 3918 | 3918 | Kyle Wiltjer | 208.0 | 108.0 | Gonzaga University | 1992.0 | Portland | Oregon |
|---|
| 3919 | 3919 | Stephen Zimmerman | 213.0 | 108.0 | University of Nevada, Las Vegas | 1996.0 | Hendersonville | Tennessee |
|---|
| 3920 | 3920 | Paul Zipser | 203.0 | 97.0 | NaN | 1994.0 | Heidelberg | Germany |
|---|
| 3921 | 3921 | Ivica Zubac | 216.0 | 120.0 | NaN | 1997.0 | Mostar | Bosnia and Herzegovina |
|---|
3922 rows × 8 columns