import pandas as pd
import numpy as np

# Download the table from the SOGA server; the first two lines of the file
# are skipped before parsing.
potsdam_data = pd.read_csv(
    "https://userpage.fu-berlin.de/soga/data/raw-data/SaekularPotsdammonthmeantemp1893-2018.txt",
    skiprows=2,
)

# Both selections keep only the "Year" and "Jan" columns and differ solely in
# the (inclusive) range of years they cover.
_years = potsdam_data["Year"]
_january_columns = ["Year", "Jan"]

# Rows for the years 1958 through 1988.
potsdam_january_means_1958_1988 = potsdam_data.loc[_years.between(1958, 1988),
                                                   _january_columns]

# Rows for the years 1989 through 2018.
potsdam_january_means_1989_2018 = potsdam_data.loc[_years.between(1989, 2018),
                                                   _january_columns]


### your solution


from scipy import stats

# Significance level (accepted probability of a type I error).
alpha = 0.05

# One-sample, two-sided t-test: the "Jan" values of the 1989-2018 selection
# are tested against the mean "Jan" value of the 1958-1988 selection, which
# is treated as the fixed reference mean.
test_result = stats.ttest_1samp(potsdam_january_means_1989_2018["Jan"],
                                np.mean(potsdam_january_means_1958_1988["Jan"]),
                                alternative="two-sided")

# Choose the wording from the actual test outcome instead of hard-coding it:
# the data is downloaded at run time, so a fixed conclusion could contradict
# the p value that is printed alongside it.
if test_result.pvalue < alpha:
    text = ("Because the p value ({}) is lower than the error level alpha ({})\n"
            "the test result indicates a significant difference between these\n"
            "two time periods to a confidence level of {}.")
else:
    text = ("Because the p value ({}) is not lower than the error level alpha ({})\n"
            "the test result indicates no significant difference between these\n"
            "two time periods to a confidence level of {}.")

print(text.format(round(test_result.pvalue, 4), alpha, 1 - alpha))


# Yield samples of the two seeds that are compared below.
yield_seed_1 = [48, 45, 47, 43, 59, 51, 49, 55, 47, 56, 47, 54]
yield_seed_2 = [50, 48, 44, 52, 42, 42, 47, 43, 55, 45, 51, 42]

### your solution


from scipy import stats

# Significance level used for both tests below.
alpha = 0.05

# Step 1: Bartlett's test, H0 = both samples have equal variances.
test_result = stats.bartlett(yield_seed_1, yield_seed_2)
# Keep the decision: it selects both the printed wording and the t-test
# variant, so message and method cannot drift apart from the computed p-value.
equal_variances = bool(test_result.pvalue >= alpha)
if equal_variances:
    text = "Because the p-value ({}) is greater than the error level alpha ({})\nwe do not reject H0 and assume equal variances."
else:
    text = "Because the p-value ({}) is smaller than the error level alpha ({})\nwe reject H0 and assume that the variances of both samples are not equal."
print(text.format(round(test_result.pvalue, 2), alpha))

# Step 2: two-sample t-test, H0 = both seeds have the same mean yield.
# equal_var=True is the pooled-variance (Student) test, equal_var=False is
# Welch's test; the choice follows the Bartlett decision from step 1.
test_result = stats.ttest_ind(yield_seed_1, yield_seed_2, equal_var=equal_variances)
if test_result.pvalue < alpha:
    text = "Because the p-value ({}) is smaller than the error level alpha ({})\nwe reject H0 and confirm a significant difference in crop yield between the two seeds."
else:
    text = "Because the p-value ({}) is greater than the error level alpha ({})\nwe do not reject H0 and cannot confirm significant differences in crop yield between the two seeds."
print(text.format(round(test_result.pvalue, 2), alpha))


# Measurements taken from the two layers that are compared below.
layer_1 = [3.13, 2.92, 2.71, 4, 3.62, 3.87]
layer_2 = [3.03, 3.18, 2.91, 2.75, 3.14]

### your solution


from scipy import stats

# Significance level used for both tests below.
alpha = 0.05

# Step 1: Bartlett's test, H0 = both samples have equal variances.
test_result = stats.bartlett(layer_1, layer_2)
# The p-value for this data lies very close to alpha, so the decision is
# computed rather than hard-coded; it selects both the printed wording and
# the t-test variant used in step 2.
equal_variances = bool(test_result.pvalue >= alpha)
if equal_variances:
    text = "Because the p-value ({}) is greater than the error level alpha ({})\nwe do not reject H0 and assume equal variances."
else:
    text = "Because the p-value ({}) is smaller than the error level alpha ({})\nwe reject H0 and assume that the variances of both samples are not equal."
print(text.format(round(test_result.pvalue, 3), alpha))

# Step 2: two-sample t-test, H0 = both layers have the same mean.
# equal_var=False is Welch's test (no pooled variance); it is used whenever
# step 1 rejected the assumption of equal variances.
test_result = stats.ttest_ind(layer_1, layer_2, equal_var=equal_variances)
if test_result.pvalue < alpha:
    text = "Because the p-value ({}) is smaller than the error level alpha ({})\nwe reject H0 and confirm a significant difference in depositional conditions of the two layers."
else:
    text = "Because the p-value ({}) is greater than the error level alpha ({})\nwe do not reject H0 and cannot confirm significant differences in depositional conditions of the two layers."
print(text.format(round(test_result.pvalue, 3), alpha))