Copied!
                      
                        
                        
                      
                    
                  
                
                
                  %matplotlib inline

                
                %matplotlib inline


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  %matplotlib inline

                
                %matplotlib inline


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  import os

                  import pandas as pd

                
                import pandas as pd


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  import pandas as pd

                
                import pandas as pd


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  data_dir = os.path.expanduser("~/data/names/names")

                
                
                  data_dir = os.path.expanduser("~/data/names/names")


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  data_dir = os.path.expanduser("~/data/names/names")

                
                
                  data_dir = os.path.expanduser("~/data/names/names")


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  files = os.listdir(data_dir)

                
                files = os.listdir(data_dir)


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  files = os.listdir(data_dir)

                
                files = os.listdir(data_dir)


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  data = pd.DataFrame(columns=["year", "name", "sex", "occurrences"])

                
                
                  data = pd.DataFrame(columns=["year", "name", "sex", "occurrences"])


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  data = pd.DataFrame(columns=["year", "name", "sex", "occurrences"])

                
                
                  data = pd.DataFrame(columns=["year", "name", "sex", "occurrences"])


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  # Load each yearly ".txt" file into its own frame and combine them once.
# ``DataFrame.append`` was deprecated in pandas 1.4 and removed in 2.0; calling
# it inside the loop also re-copied every accumulated row on each iteration.
frames = []
for fname in files:
    if not fname.endswith(".txt"):
        continue
    fpath = os.path.join(data_dir, fname)
    df = pd.read_csv(fpath, header=None, names=["name", "sex", "occurrences"])
    # Characters 3..6 of the file name are parsed as the year
    # (assumes names shaped like "yobYYYY.txt" -- TODO confirm).
    df["year"] = int(fname[3:7])
    frames.append(df)
if frames:
    # Keep the column order declared on the (initially empty) ``data`` frame.
    data = pd.concat(frames)[list(data.columns)]

                
                
                  # Load each yearly ".txt" file into its own frame and combine them once.
                  # ``DataFrame.append`` was deprecated in pandas 1.4 and removed in 2.0;
                  # calling it inside the loop also re-copied every accumulated row.
                  frames = []
                  for fname in files:
                      if not fname.endswith(".txt"):
                          continue
                      fpath = os.path.join(data_dir, fname)
                      df = pd.read_csv(fpath, header=None, names=["name", "sex", "occurrences"])
                      # Characters 3..6 of the file name are parsed as the year
                      # (assumes names shaped like "yobYYYY.txt" -- TODO confirm).
                      df["year"] = int(fname[3:7])
                      frames.append(df)
                  if frames:
                      # Keep the column order declared on the (initially empty) ``data`` frame.
                      data = pd.concat(frames)[list(data.columns)]


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  # Load each yearly ".txt" file into its own frame and combine them once.
# ``DataFrame.append`` was deprecated in pandas 1.4 and removed in 2.0; calling
# it inside the loop also re-copied every accumulated row on each iteration.
frames = []
for fname in files:
    if not fname.endswith(".txt"):
        continue
    fpath = os.path.join(data_dir, fname)
    df = pd.read_csv(fpath, header=None, names=["name", "sex", "occurrences"])
    # Characters 3..6 of the file name are parsed as the year
    # (assumes names shaped like "yobYYYY.txt" -- TODO confirm).
    df["year"] = int(fname[3:7])
    frames.append(df)
if frames:
    # Keep the column order declared on the (initially empty) ``data`` frame.
    data = pd.concat(frames)[list(data.columns)]

                
                
                  # Load each yearly ".txt" file into its own frame and combine them once.
                  # ``DataFrame.append`` was deprecated in pandas 1.4 and removed in 2.0;
                  # calling it inside the loop also re-copied every accumulated row.
                  frames = []
                  for fname in files:
                      if not fname.endswith(".txt"):
                          continue
                      fpath = os.path.join(data_dir, fname)
                      df = pd.read_csv(fpath, header=None, names=["name", "sex", "occurrences"])
                      # Characters 3..6 of the file name are parsed as the year
                      # (assumes names shaped like "yobYYYY.txt" -- TODO confirm).
                      df["year"] = int(fname[3:7])
                      frames.append(df)
                  if frames:
                      # Keep the column order declared on the (initially empty) ``data`` frame.
                      data = pd.concat(frames)[list(data.columns)]


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  data.year = data.year.astype(int)

                
                data.year = data.year.astype(int)


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  data.year = data.year.astype(int)

                
                data.year = data.year.astype(int)


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  data.head()

                
                data.head()


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  data.head()

                
                data.head()

(1825433, 4)

(1825433, 4)


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  data.dtypes

                
                data.dtypes

name            object
occurrences    float64
sex             object
year             int64
dtype: object


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  data.dtypes

                
                data.dtypes

name            object
occurrences    float64
sex             object
year             int64
dtype: object


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  beyonce = data[data["name"] == "Beyonce"][["year", "occurrences"]]

                
                
                  beyonce = data[data["name"] == "Beyonce"][["year", "occurrences"]]


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  beyonce = data[data["name"] == "Beyonce"][["year", "occurrences"]]

                
                
                  beyonce = data[data["name"] == "Beyonce"][["year", "occurrences"]]


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  from bokeh.charts import ColumnDataSource, Bar, output_notebook, show

                
                
                  from bokeh.charts import ColumnDataSource, Bar, output_notebook, show


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  from bokeh.charts import ColumnDataSource, Bar, output_notebook, show

                
                
                  from bokeh.charts import ColumnDataSource, Bar, output_notebook, show


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  from bokeh.models import HoverTool

                
                
                  from bokeh.models import HoverTool


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  from bokeh.models import HoverTool

                
                
                  from bokeh.models import HoverTool


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  output_notebook()

                
                output_notebook()


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  output_notebook()

                
                output_notebook()


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  # Build a bar chart from the `beyonce` frame (year on the label axis,
                  # occurrences as bar values) and display it with show().
                  # NOTE(review): `bokeh.charts` appears to have been dropped from later Bokeh
                  # releases (split out as `bkcharts`) -- confirm the Bokeh version in use.
                  p = Bar(data=beyonce, label="year", values="occurrences", title="No. Babies named Beyoncé",
        color="#0277BD", ylabel='', tools="save,reset")
show(p)

                
                
                  # Build a bar chart from the `beyonce` frame (year on the label axis,
                  # occurrences as bar values) and display it with show().
                  # The title literal is kept on one line: a plain string cannot span a line break.
                  p = Bar(data=beyonce, label="year", values="occurrences", title="No. Babies named Beyoncé",
                          color="#0277BD", ylabel='', tools="save,reset")
                  show(p)


                
                  
                    
                      Copied!
                      
                        
                        
                      
                    
                  
                
                
                  # Build a bar chart from the `beyonce` frame (year on the label axis,
                  # occurrences as bar values) and display it with show().
                  # NOTE(review): `bokeh.charts` appears to have been dropped from later Bokeh
                  # releases (split out as `bkcharts`) -- confirm the Bokeh version in use.
                  p = Bar(data=beyonce, label="year", values="occurrences", title="No. Babies named Beyoncé",
        color="#0277BD", ylabel='', tools="save,reset")
show(p)

                
                
                  # Build a bar chart from the `beyonce` frame (year on the label axis,
                  # occurrences as bar values) and display it with show().
                  # The title literal is kept on one line: a plain string cannot span a line break.
                  p = Bar(data=beyonce, label="year", values="occurrences", title="No. Babies named Beyoncé",
                          color="#0277BD", ylabel='', tools="save,reset")
                  show(p)

	name	occurrences	sex	year
0	Mary	7065	F	1880
1	Anna	2604	F	1880
2	Emma	2003	F	1880
3	Elizabeth	1939	F	1880
4	Minnie	1746	F	1880

ReproduceIt: Name Trends

Beyonce