# Path to the soybean dataset, kept in one place so it is easy to change
soybean_file = 'soybean_data.csv'

# Opens the file using the path defined above; the with-statement closes
# the file automatically once the indented block finishes
with open(soybean_file) as file:

    # Reads every line of the file into a list. Each entry still ends with
    # its newline character.
    line_list = file.readlines()

# Prints the header of the file (print adds its own newline after the one
# already in the line, so a blank line follows)
print(line_list[0])
# Prints the first entry of the file
print(line_list[1])

Parameters,Random ,Plant Height (PH),Number of Pods (NP),Biological Weight (BW),Sugars (Su),Relative Water Content in Leaves (RWCL),ChlorophyllA663,Chlorophyllb649,Protein Percentage (PPE),Weight of 300 Seeds (W3S),Leaf Area Index (LAI),Seed Yield per Unit Area (SYUA),Number of Seeds per Pod (NSP),Protein Content (PCO)

C1S1G5,R1,50.5,130.3,111.0,0.433,0.732,1.4,3.1,33.2,33.6,0.08,5567.4,1.86,0.82

# The "\n" escape sequence inside a string starts a new line when printed
two_lines = "Line 1\nLine 2"
print(two_lines)

Line 1
Line 2

# Reads the file again, this time dropping the newline from each line
with open('soybean_data.csv') as file:

    # Builds the list of lines with the newline character stripped off
    line_list = [raw_line.strip('\n') for raw_line in file]

# Shows the header row of the file
print(line_list[0])
# Shows the first data row of the file
print(line_list[1])

Parameters,Random ,Plant Height (PH),Number of Pods (NP),Biological Weight (BW),Sugars (Su),Relative Water Content in Leaves (RWCL),ChlorophyllA663,Chlorophyllb649,Protein Percentage (PPE),Weight of 300 Seeds (W3S),Leaf Area Index (LAI),Seed Yield per Unit Area (SYUA),Number of Seeds per Pod (NSP),Protein Content (PCO)
C1S1G5,R1,50.5,130.3,111.0,0.433,0.732,1.4,3.1,33.2,33.6,0.08,5567.4,1.86,0.82

# islice lets us take at most a fixed number of lines from the file
from itertools import islice

# Maximum number of data rows (not counting the header) to read
MAX_ROWS = 999

# Opens the file
with open('soybean_data.csv') as file:

    # Creates a list for each column
    param_list = []
    height_list = []
    pod_list = []
    weight_list = []

    # Reads in header line so it is not parsed as data
    file.readline()

    # Iterates through at most MAX_ROWS lines. Looping over the file itself
    # stops cleanly at the end of the file, so a file with fewer rows no
    # longer produces empty lines that cannot be split into columns.
    for line in islice(file, MAX_ROWS):

        # Strips the line of the newline character
        str_line = line.strip('\n')
        # Skips blank lines (such as a trailing empty line), which hold no data
        if not str_line:
            continue
        # Splits the line by comma
        spl_line = str_line.split(',')

        # Adds information to each list. Columns 0, 2, 3 and 4 are the
        # Parameters, Plant Height, Number of Pods and Biological Weight
        # columns of the header.
        param_list.append(spl_line[0])
        height_list.append(float(spl_line[2]))
        pod_list.append(float(spl_line[3]))
        weight_list.append(float(spl_line[4]))

    # Creates a dictionary of the selected soybean data
    soybean_dict = {
        'Parameters': param_list,
        'Height': height_list,
        'Pod Number': pod_list,
        'Weight': weight_list,
    }

# Mean plant height: the total of all heights divided by how many there are
heights = soybean_dict['Height']
avg_height = sum(heights) / len(heights)
print(f"The average height of the soybean plants is {round(avg_height, 2)}.")

The average height of the soybean plants is 49.93.

# Scatter plot of soybean height (x-axis) against soybean weight (y-axis)
import matplotlib.pyplot as plt

x_heights = soybean_dict['Height']
y_weights = soybean_dict['Weight']

# Draws one red point per plant
plt.scatter(x_heights, y_weights, c='r')
# Labels the axes and gives the figure a title
plt.ylabel('Soybean Weight')
plt.xlabel('Soybean Height')
plt.title("Soybean Height vs. Soybean Weight")

Text(0.5, 1.0, 'Soybean Height vs. Soybean Weight')

# Pulls out the numeric columns and computes the mean of each one
heights = soybean_dict['Height']
pod_counts = soybean_dict['Pod Number']
weights = soybean_dict['Weight']

avg_height = sum(heights) / len(heights)
avg_pod_num = sum(pod_counts) / len(pod_counts)
avg_weight = sum(weights) / len(weights)

# Builds the report one line at a time; each line ends with a newline
report_lines = [
    "Soybean averages:\n",
    f"The average soybean height is {round(avg_height, 2)}.\n",
    f"The average soybean pod number is {round(avg_pod_num, 2)}.\n",
    f"The average soybean weight is {round(avg_weight, 2)}.\n",
]

# Opens the averages file in write mode and writes the whole report
with open('soybean_averages.txt', 'w') as file:
    file.writelines(report_lines)

# Shows the contents of the averages file with the shell's `more` command
# (the leading "!" is notebook shell-escape syntax, not Python)
!more soybean_averages.txt

Soybean averages:
The average soybean height is 49.93.
The average soybean pod number is 145.51.
The average soybean weight is 114.77.

# Imports json package
import json

# Converts the soybean dictionary to JSON text and saves it to a file
with open('soybean_data.json', 'w') as out_file:
    out_file.write(json.dumps(soybean_dict))

# Reads the JSON text back in and turns it into a Python object again
with open('soybean_data.json', 'r') as in_file:
    new_soybean_dict = json.loads(in_file.read())

# Recomputes the averages, this time from the dictionary loaded from json
loaded_heights = new_soybean_dict['Height']
loaded_pod_counts = new_soybean_dict['Pod Number']
loaded_weights = new_soybean_dict['Weight']

avg_height = sum(loaded_heights) / len(loaded_heights)
avg_pod_num = sum(loaded_pod_counts) / len(loaded_pod_counts)
avg_weight = sum(loaded_weights) / len(loaded_weights)

# Reports the type and keys of the loaded object
print(f"The opened json file is {type(new_soybean_dict)}.")
print(f"The keys of the new dictionary are {new_soybean_dict.keys()}")
# Reports the averages, rounded to two decimal places
print(f"The average soybean height is {round(avg_height, 2)}.")
print(f"The average soybean pod number is {round(avg_pod_num, 2)}.")
print(f"The average soybean weight is {round(avg_weight, 2)}.")

The opened json file is <class 'dict'>.
The keys of the new dictionary are dict_keys(['Parameters', 'Height', 'Pod Number', 'Weight'])
The average soybean height is 49.93.
The average soybean pod number is 145.51.
The average soybean weight is 114.77.

Reading and Writing Files

Introduction to Reading and Writing Files

Reading Text From Files

Writing Text to Files

Reading Data From and Writing Data to Files