From the /c/coding_help community on Chambers

I have the following code: ```python import numpy as np def histHist(data, nbins): min_val = np.min(data) max_val = np.max(data) bins = np.linspace(min_val, max_val, nbins + 1) f = np.zeros(nbins) for i in range(0, nbins - 1): if i == nbins - 1: m = np.size(np.extract((data >= bins[i]) & (data <= bins[i + 1]), data)) f[i] = m / (bins[i + 1] - bins[i]) else: m = np.size(np.extract((data >= bins[i]) & (data < bins[i + 1]), data)) f[i] = m / (bins[i + 1] - bins[i]) return f, bins ``` I am trying to run the following script, which imports it: ```python from scipy.stats import norm import numpy as np import matplotlib.pyplot as plt import seaborn as sns from histHist import histHist numoons = 500 seednum = 1928348123 lowersamps = 100 numpoints = 10000 np.random.seed(seednum + 0) print("Generating moons") data = norm.rvs(size=(2, numpoints), scale=4, random_state=seednum) sns.set() sns.set_context("notebook", font_scale=1.5, rc={"lines.linewidth": 2.5, 'figure.figsize': (10, 9.5)}) sns.set_style("ticks") fig = plt.figure(1) plt.figure(figsize=(8, 6)) sns.kdeplot(data[0], data[1], gridsize=50, shade=True, shade_lowest=True, cmap='viridis', bw=.2) plt.show() fig = plt.figure(2) sns.kdeplot(data[0], data[1], gridsize=50, shade=True, shade_lowest=True, cmap='viridis', bw=.2) plt.show() fig = plt.figure(3) sns.kdeplot(data[0], data[1], gridsize=50, shade=True, shade_lowest=True, cmap='viridis', bw=.2) plt.show() for i in range(lowersamps): print("Setup example %u" % (i + 1)) oonsamp = np.random.permutation(numpoints)[:numoons].squeeze() moons2 = np.random.permutation(numpoints)[:numoons].squeeze() np.random.seed(seednum + i + 1) print("Generating background") background = norm.rvs(size=(2, numoons), loc=[5, 0], scale=[2, 5], random_state=seednum + i + 1) # Pick which points we're going to use data[1, oonsamp] -= 4 # And create our samples data_sample = data[:, oonsamp] moons = data[:, moons2] # And manually move the points background[1, :] -= 4 # Append background onto our sample data_sample = 
np.append(data_sample, background, 1) # And bins y_min = np.amin(data[1, :]) y_max = np.amax(data[1, :]) dy = (y_max - y_min) / 50 newymin = y_min + 4 newymax = y_max - 4 print("Computing bins") bins = np.linspace(newymin, newymax, 50) print("Computing Hist") p_y, bin = histHist(data[1, :], 100) p_moons, mbin = histHist(data[1, moons2], 100) p_bkg, bbin = histHist(background[1, :], 100) print("Computing Guess") p_g = np.zeros(len(bins) - 1) for j in range(2, len(bins) - 3): p_g[j] = np.sum(p_y[(mbin[1:-1] >= bins[j]) & (mbin[1:-1] <= bins[j + 1])]) - \ np.sum(p_bkg[(bbin[1:-1] >= bins[j]) & (mbin[1:-1] <= bins[j + 1])]) # Compute the Poisson error in our histogram print("Computing Errors") err = np.zeros(len(bins) - 1) for k in range(2, len(bins) - 3): before = np.extract((data[1, :] < bins[k - 2]) & (data[1, :] >= bins[k - 3]), data[1, :]) after = np.extract((data[1, :] < bins[k + 1]) & (data[1, :] >= bins[k]), data[1, :]) upper = np.extract((data[1, :] < bins[k + 3]) & (data[1, :] >= bins[k + 2]), data[1, :]) bot = np.extract((data[1, :] < bins[k - 1]) & (data[1, :] >= bins[k]), data[1, :]) err[k] = np.std([ np.size(before), np.size(after), np.size(upper), np.size(bot), ]) print("Plotting") fig = plt.figure(i + 1) plt.figure(figsize=(8, 6)) for j in range(1, len(bins) - 2): cut = np.extract((data[1, :] < bins[j + 1]) & (data[1, :] >= bins[j]), data[1, :]) plt.fill_between([bins[j], bins[j + 1]], np.size(cut) / (bins[j + 1] - bins[j]), color='red', edgecolor='black', label='Data', alpha=0.5) plt.fill_between([bins[j], bins[j + 1]], p_moons[j], color='blue', edgecolor='black', label='Star Light', alpha=0.5) plt.fill_between([bins[j], bins[j + 1]], p_bkg[j], color='green', edgecolor='black', label='Background', alpha=0.5) plt.fill_between([bins[j], bins[j + 1]], p_g[j], color='black', edgecolor='black', label='Guess', alpha=0.5) handles, labels = plt.gca().get_legend_handles_labels() plt.legend(handles=handles[1:], labels=labels[1:], loc='lower right') plt.xlabel('y 
(kpc)') plt.ylabel('Counts/kpc') plt.xlim(-40, 40) plt.title('Counts/ kpc vs. Height') plt.show() fig = plt.figure(i + 4) plt.figure(figsize=(8, 6)) for j in range(1, len(bins) - 2): cut = np.extract((data[1, :] < bins[j + 1]) & (data[1, :] >= bins[j]), data[1, :]) plt.fill_between([bins[j], bins[j + 1]], [np.size(cut) / (bins[j + 1] - bins[j]), np.size(cut) / (bins[j + 1] - bins[j])], color='red', edgecolor='black', label='Data', alpha=0.5) plt.fill_between([bins[j], bins[j + 1]], [p_moons[j] - err[j], p_moons[j] + err[j]], color='blue', edgecolor='black', label='Star Light', alpha=0.5) plt.fill_between([bins[j], bins[j + 1]], [p_g[j] - err[j], p_g[j] + err[j]], color='black', edgecolor='black', label='Guess', alpha=0.5) handles, labels = plt.gca().get_legend_handles_labels() plt.legend(handles=handles[1:], labels=labels[1:], loc='lower right') plt.xlabel('y (kpc)') plt.ylabel('Counts/kpc') plt.xlim(-40, 40) plt.title('Counts/ kpc vs. Height') plt.show() ``` I get the following error: `line 16, in histHist m = np.size(np.extract((data >= bins[i]) & (data < bins[i + 1]), data))` `TypeError: '<' not supported between instances of 'float' and 'str'` I believe the error occurs because `np.extract()` is returning strings, but I have no idea why it would return strings or how to get it to return numbers as usual. I also tried replacing the `&` with `np.logical_and()`, but it still doesn't work. What do I do?

HistHist & Bins

Comments (4) 5928 👁️