X-Git-Url: http://unremediatedgender.space/source?p=Ultimately_Untrue_Thought.git;a=blobdiff_plain;f=notes%2Fdeflation.py;fp=notes%2Fdeflation.py;h=77efe237e13e1f5799e654c01f2363ccc7d6b751;hp=0000000000000000000000000000000000000000;hb=1b6eeea9d643c0613470ef1bb12382291168ddea;hpb=e1f4985537c1a3954f765f932cd8a37fcbd45219

diff --git a/notes/deflation.py b/notes/deflation.py
new file mode 100644
index 0000000..77efe23
--- /dev/null
+++ b/notes/deflation.py
@@ -0,0 +1,61 @@
+from math import sqrt
+from statistics import mean, variance
+
+from numpy.random import normal, seed
+
+# Seed the random number generator so the figures quoted in the comments
+# below are reproducible; comment this out to run a new experiment.
+seed(1)
+
+def cohens_d(X, Y):
+    """Return Cohen's d for samples X and Y: the difference of the sample
+    means divided by the size-weighted pooled standard deviation."""
+    pooled_variance = (
+        (len(X)*variance(X) + len(Y)*variance(Y)) /
+        (len(X) + len(Y))
+    )
+    return (mean(X) - mean(Y)) / sqrt(pooled_variance)
+
+def population_with_error(μ, σ, n):
+    """Return a list of n simulated scores: a trait drawn from a normal
+    with mean μ and SD 1, plus measurement error with mean 0 and SD σ."""
+    # The trait is drawn first, then the error; seeded results depend on
+    # this order of draws.
+    return [normal(μ, 1) + normal(0, σ) for _ in range(n)]
+
+
+# trait differs by 1 standard deviation
+adjusted_f = population_with_error(1, 0, 10000)
+adjusted_m = population_with_error(0, 0, 10000)
+
+# as above, but with 0.5 standard units of measurement error
+measured_f = population_with_error(1, 0.5, 10000)
+measured_m = population_with_error(0, 0.5, 10000)
+
+smart_d = cohens_d(adjusted_f, adjusted_m)
+print(smart_d)  # 1.0193773432617055 — d≈1.0, as expected!
+
+naïve_d = cohens_d(measured_f, measured_m)
+print(naïve_d)  # 0.8953395386313235 — deflated toward 1/√1.25 ≈ 0.894
+
+
+def performance(g, σ_g, s, n):
+    """Return a list of n simulated scores: general ability drawn from a
+    normal with mean g and SD σ_g, plus special ability with mean s, SD 1."""
+    # General ability is drawn first, then special ability; seeded results
+    # depend on this order of draws.
+    return [normal(g, σ_g) + normal(s, 1) for _ in range(n)]
+
+# ♀ one standard deviation better than ♂ at the special factor
+population_f = performance(0, 1, 1, 10000)
+population_m = performance(0, 1, 0, 10000)
+
+# ... but suppose we control/match for general intelligence
+matched_f = performance(0, 0, 1, 10000)
+matched_m = performance(0, 0, 0, 10000)
+
+population_d = cohens_d(population_f, population_m)
+print(population_d)  # 0.7287587808164793
+
+matched_d = cohens_d(matched_f, matched_m)
+print(matched_d)  # 1.018362581243161