import pandas
import numpy

# Printing the class object itself (not an instance) displays its fully
# qualified name, i.e. the module path where the DataFrame class lives.
print(pandas.DataFrame)

<class 'pandas.core.frame.DataFrame'>

# Instantiating the class without any data gives a DataFrame that has
# neither rows nor columns; its type is the class printed above.
empty_dataframe = pandas.DataFrame(data=None)
print(type(empty_dataframe))

<class 'pandas.core.frame.DataFrame'>

# Column-oriented input: every key becomes a column label and its list
# supplies that column's values, one entry per row (five rows here).
temporary_dict = {
    "Date": [f"2023-05-0{day}" for day in range(1, 6)],
    "Latitude": [34.05, 37.77, 40.71, 34.05, 35.68],
    "Longitude": [-118.25, -122.42, -74.01, -118.25, 139.69],
    "Magnitude": [4.1, 3.8, 5.2, 4.0, 6.1],
    "Depth (km)": [2.0, 12.5, 8.0, 15.0, 20.0],
    "Region": [f"City{number}" for number in range(1, 6)],
}
df_from_lists = pandas.DataFrame(data=temporary_dict)
print(df_from_lists)

         Date  Latitude  Longitude  Magnitude  Depth (km) Region
0  2023-05-01     34.05    -118.25        4.1         2.0  City1
1  2023-05-02     37.77    -122.42        3.8        12.5  City2
2  2023-05-03     40.71     -74.01        5.2         8.0  City3
3  2023-05-04     34.05    -118.25        4.0        15.0  City4
4  2023-05-05     35.68     139.69        6.1        20.0  City5

#your code here

# Row-oriented input: each dictionary describes a single row, with the
# column labels as its keys.
dict_1 = {
    "Date": "2023-05-01",
    "Latitude": 34.05,
    "Longitude": -118.25,
    "Magnitude": 4.5,
    "Depth (km)": 10.0,
    "Region": "City1",
}

dict_2 = {
    "Date": "2023-05-02",
    "Latitude": 37.77,
    "Longitude": -122.42,
    "Magnitude": 3.8,
    "Depth (km)": 12.5,
    "Region": "City2",
}

# The position of each dictionary in the list is the position of its row.
temporary_list = [dict_1, dict_2]

df_from_dicts = pandas.DataFrame(data=temporary_list)

print(df_from_dicts)

         Date  Latitude  Longitude  Magnitude  Depth (km) Region
0  2023-05-01     34.05    -118.25        4.5        10.0  City1
1  2023-05-02     37.77    -122.42        3.8        12.5  City2

#your code here

# The integers 0 through 11 arranged as 3 rows by 4 columns.
data_2d = numpy.arange(12).reshape((3, 4))

# Three row labels and four column labels: one per row / column of the array.
df_from_array = pandas.DataFrame(
    data=data_2d,
    index=[f"row{i}" for i in range(1, 4)],
    columns=[f"column{j}" for j in range(1, 5)],
)
print(df_from_array)

      column1  column2  column3  column4
row1        0        1        2        3
row2        4        5        6        7
row3        8        9       10       11

#your code here

# Load the CSV file (path is relative to the working directory) into a
# DataFrame; the file's header row supplies the column labels.
df_from_file = pandas.read_csv(filepath_or_buffer="example_spreadsheet.csv")
print(df_from_file)

     Date  Latitude  Longitude  Magnitude  Depth (km) Region
0  5/1/23     34.05    -118.25        4.5        10.0  City1
1  5/2/23     37.77    -122.42        3.8        12.5  City2
2  5/3/23     40.71     -74.01        5.2         8.0  City3
3  5/4/23     34.05    -118.25        4.0        15.0  City4
4  5/5/23     35.68     139.69        6.1        20.0  City5

#your code here

# Same column-oriented layout as before: one list of values per column label.
temporary_dict = {
    "Date": [f"2023-05-0{day}" for day in range(1, 6)],
    "Latitude": [34.05, 37.77, 40.71, 34.05, 35.68],
    "Longitude": [-118.25, -122.42, -74.01, -118.25, 139.69],
    "Magnitude": [4.5, 3.8, 5.2, 4.0, 6.1],
    "Depth (km)": [10.0, 12.5, 8.0, 15.0, 20.0],
    "Region": [f"City{number}" for number in range(1, 6)],
}
df_from_lists = pandas.DataFrame(data=temporary_dict)
# Save the DataFrame as a CSV file in the working directory. With these
# default settings the row index is written too, as a first column whose
# header is empty.
df_from_lists.to_csv(path_or_buf="example_spreadsheet_2.csv")

#your code here

# The dictionary still holds all six columns of data.
temporary_dict = {
    "Date": [f"2023-05-0{day}" for day in range(1, 6)],
    "Latitude": [34.05, 37.77, 40.71, 34.05, 35.68],
    "Longitude": [-118.25, -122.42, -74.01, -118.25, 139.69],
    "Magnitude": [4.5, 3.8, 5.2, 4.0, 6.1],
    "Depth (km)": [10.0, 12.5, 8.0, 15.0, 20.0],
    "Region": [f"City{number}" for number in range(1, 6)],
}

# columns= names the dictionary keys to keep, in the order they should
# appear; the keys that are not listed are left out of the DataFrame.
df_from_lists = pandas.DataFrame(
    data=temporary_dict,
    columns=["Date", "Magnitude", "Region"],
)

print(df_from_lists)

         Date  Magnitude Region
0  2023-05-01        4.5  City1
1  2023-05-02        3.8  City2
2  2023-05-03        5.2  City3
3  2023-05-04        4.0  City4
4  2023-05-05        6.1  City5

#your code here

# The integers 0 through 11 arranged as 3 rows by 4 columns.
data_2d = numpy.arange(12).reshape((3, 4))

df_from_array = pandas.DataFrame(
    data=data_2d,
    index=[f"row{i}" for i in range(1, 4)],
    columns=[f"column{j}" for j in range(1, 5)],
)
# Write the DataFrame to disk; the row labels are stored as a leading
# column that has no header.
df_from_array.to_csv(path_or_buf="example_7.csv")

# Plain read: the stored row labels come back as an ordinary column called
# "Unnamed: 0", and the rows get a fresh 0, 1, 2 index.
df_from_csv = pandas.read_csv(filepath_or_buffer="example_7.csv")
print(df_from_csv)

# Fix 1 - set_index method: promote that column to be the index after
# loading. The index keeps the name "Unnamed: 0".
df_from_csv = df_from_csv.set_index(keys="Unnamed: 0")
print(df_from_csv)

# Fix 2 - keyword argument method: tell read_csv to use the first column
# (position 0) as the index while loading, which restores the original layout.
df_from_csv = pandas.read_csv(filepath_or_buffer="example_7.csv", index_col=0)
print(df_from_csv)

  Unnamed: 0  column1  column2  column3  column4
0       row1        0        1        2        3
1       row2        4        5        6        7
2       row3        8        9       10       11
            column1  column2  column3  column4
Unnamed: 0                                    
row1              0        1        2        3
row2              4        5        6        7
row3              8        9       10       11
      column1  column2  column3  column4
row1        0        1        2        3
row2        4        5        6        7
row3        8        9       10       11

# One timestamp per day for the 30 days from 1 to 30 September 2022.
dates = pandas.date_range(start='2022-09-01', end='2022-09-30')
# Two separately drawn sets of 30 random prices: a uniform draw from
# [0, 1) is scaled by 10, shifted up by 10, then rounded to 2 decimals.
price1 = (numpy.random.rand(30) * 10 + 10).round(decimals=2)
price2 = (numpy.random.rand(30) * 10 + 10).round(decimals=2)
#your code here

Intermediate Python

"DataFrame Building"

Pandas Module

Pandas DataFrame Class

DataFrames are like Spreadsheets

Building DataFrames from Data

Example 0

DataFrame by Columns

Example 1

Exercise 1

DataFrame by Rows

Example 2

Exercise 2

DataFrame from a 2D Array

Example 3

Exercise 3

DataFrame from a File

Example 4

Exercise 4

DataFrame to a File

Example 5

Exercise 5

Fixing DataFrame Columns

Example 6

Exercise 6

Fixing DataFrame Index

Example 7

Exercise 7

	column1	column2
row1	`data`	`data`
row2	`data`	`data`