diff --git a/FIDDLE/helpers.py b/FIDDLE/helpers.py
index 22fe41e..101498d 100644
--- a/FIDDLE/helpers.py
+++ b/FIDDLE/helpers.py
@@ -153,10 +153,10 @@ def smart_qcut_dummify(x, bin_edges, use_ordinal_encoding=False):
out = pd.get_dummies(x, prefix=x.name)
else:
if use_ordinal_encoding:
- col_names = ['{}>={}'.format(z.name, bin_edge) for bin_edge in bin_edges[:-1]]
+ col_names = ['{}>{}'.format(z.name, bin_edge) for bin_edge in bin_edges[:-1]]
out = pd.DataFrame(0, z.index, col_names)
for i, bin_edge in enumerate(bin_edges[:-1]):
- out.loc[m, col_names[i]] = (z.loc[m] >= bin_edge).astype(int)
+ out.loc[m, col_names[i]] = (z.loc[m] > bin_edge).astype(int)
out = pd.concat([out, pd.get_dummies(z.where(~m, np.nan), prefix=z.name)], axis=1)
else:
z.loc[m] = pd.cut(z.loc[m].astype(float).to_numpy(), bin_edges, duplicates='drop', include_lowest=True)
@@ -179,7 +179,7 @@ def smart_dummify_impute(x):
def make_float(v):
try:
return float(v)
- except ValueError:
+ except (ValueError, TypeError):
return v
assert False
@@ -187,7 +187,7 @@ def is_numeric(v):
try:
float(v)
return True
- except ValueError:
+ except (ValueError, TypeError):
return False
assert False
diff --git a/README.md b/README.md
index 3063b42..8f6c37e 100644
--- a/README.md
+++ b/README.md
@@ -81,8 +81,8 @@ s = sparse.load_npz('{data_path}/s.npz'.format(data_path=...)).todense()
Example usage:
```bash
python -m FIDDLE.run \
- --data_path='./test/small_test/' \
- --population='./test/small_test/pop.csv' \
+ --data_path='./tests/small_test/' \
+ --population='./tests/small_test/pop.csv' \
--T=24 --dt=5 \
--theta_1=0.001 --theta_2=0.001 --theta_freq=1 \
--stats_functions 'min' 'max' 'mean'
diff --git a/tests/icd_test/Run.ipynb b/tests/icd_test/Run.ipynb
index c83b13c..1f903ba 100644
--- a/tests/icd_test/Run.ipynb
+++ b/tests/icd_test/Run.ipynb
@@ -4,15 +4,7 @@
"cell_type": "code",
"execution_count": 1,
"metadata": {},
- "outputs": [
- {
- "name": "stdout",
- "output_type": "stream",
- "text": [
- "zsh:1: no matches found: output-*/\n"
- ]
- }
- ],
+ "outputs": [],
"source": [
"!rm -rf output-*/"
]
@@ -111,11 +103,11 @@
"--------------------------------------------------------------------------------\n",
"(N × ^d) table :\t (200, 19)\n",
"number of missing entries :\t 2816 out of 3800 total\n",
- "Time elapsed: 0.025395 seconds\n",
+ "Time elapsed: 0.012328 seconds\n",
"\n",
"Output\n",
"S_all, binary features :\t (200, 21)\n",
- "Time elapsed: 0.171098 seconds\n",
+ "Time elapsed: 0.101575 seconds\n",
"\n",
"--------------------------------------------------------------------------------\n",
"3-A) Post-filter time-invariant data\n",
@@ -123,13 +115,12 @@
"Original : 21\n",
"Nearly-constant: 0\n",
"Correlated : 0\n",
- "Time elapsed: 0.178303 seconds\n",
+ "Time elapsed: 0.104368 seconds\n",
"\n",
"Output\n",
"S: shape=(200, 21), density=0.234\n",
- "Total time: 0.180898 seconds\n",
- "\n",
- "\u001b[0m"
+ "Total time: 0.106207 seconds\n",
+ "\n"
]
}
],
@@ -732,11 +723,11 @@
"--------------------------------------------------------------------------------\n",
"(N × ^d) table :\t (200, 129)\n",
"number of missing entries :\t 23337 out of 25800 total\n",
- "Time elapsed: 0.057711 seconds\n",
+ "Time elapsed: 0.034244 seconds\n",
"\n",
"Output\n",
"S_all, binary features :\t (200, 129)\n",
- "Time elapsed: 0.830818 seconds\n",
+ "Time elapsed: 0.558320 seconds\n",
"\n",
"--------------------------------------------------------------------------------\n",
"3-A) Post-filter time-invariant data\n",
@@ -744,13 +735,12 @@
"Original : 129\n",
"Nearly-constant: 0\n",
"Correlated : 2\n",
- "Time elapsed: 0.840801 seconds\n",
+ "Time elapsed: 0.564048 seconds\n",
"\n",
"Output\n",
"S: shape=(200, 127), density=0.097\n",
- "Total time: 0.844234 seconds\n",
- "\n",
- "\u001b[0m"
+ "Total time: 0.567541 seconds\n",
+ "\n"
]
}
],
@@ -1353,11 +1343,11 @@
"--------------------------------------------------------------------------------\n",
"(N × ^d) table :\t (200, 455)\n",
"number of missing entries :\t 86795 out of 91000 total\n",
- "Time elapsed: 0.112510 seconds\n",
+ "Time elapsed: 0.092419 seconds\n",
"\n",
"Output\n",
"S_all, binary features :\t (200, 455)\n",
- "Time elapsed: 2.377939 seconds\n",
+ "Time elapsed: 1.690453 seconds\n",
"\n",
"--------------------------------------------------------------------------------\n",
"3-A) Post-filter time-invariant data\n",
@@ -1365,13 +1355,12 @@
"Original : 455\n",
"Nearly-constant: 0\n",
"Correlated : 87\n",
- "Time elapsed: 2.428499 seconds\n",
+ "Time elapsed: 1.715216 seconds\n",
"\n",
"Output\n",
"S: shape=(200, 368), density=0.055\n",
- "Total time: 2.435949 seconds\n",
- "\n",
- "\u001b[0m"
+ "Total time: 1.719981 seconds\n",
+ "\n"
]
}
],
@@ -1916,7 +1905,7 @@
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
- "version": "3.8.6"
+ "version": "3.8.5"
}
},
"nbformat": 4,
diff --git a/tests/large_test/Run.ipynb b/tests/large_test/Run.ipynb
index 3033773..c36c240 100644
--- a/tests/large_test/Run.ipynb
+++ b/tests/large_test/Run.ipynb
@@ -91,11 +91,11 @@
"--------------------------------------------------------------------------------\n",
"(N × ^d) table :\t (200, 12)\n",
"number of missing entries :\t 4 out of 2400 total\n",
- "Time elapsed: 0.030966 seconds\n",
+ "Time elapsed: 0.018219 seconds\n",
"\n",
"Output\n",
"S_all, binary features :\t (200, 84)\n",
- "Time elapsed: 0.226954 seconds\n",
+ "Time elapsed: 0.202440 seconds\n",
"\n",
"--------------------------------------------------------------------------------\n",
"3-A) Post-filter time-invariant data\n",
@@ -103,11 +103,11 @@
"Original : 84\n",
"Nearly-constant: 0\n",
"Correlated : 7\n",
- "Time elapsed: 0.232384 seconds\n",
+ "Time elapsed: 0.208578 seconds\n",
"\n",
"Output\n",
"S: shape=(200, 77), density=0.145\n",
- "Total time: 0.235823 seconds\n",
+ "Total time: 0.211770 seconds\n",
"\n",
"\n",
"--------------------------------------------------------------------------------\n",
@@ -121,8 +121,8 @@
"\n",
"Transforming each example...\n",
"Batches of size 100: 2\n",
- "100%|█████████████████████████████████████████████| 2/2 [00:38<00:00, 19.13s/it]\n",
- "\u001b[0m\u001b[0m\u001b[0m\u001b[0m\n",
+ "100%|█████████████████████████████████████████████| 2/2 [00:25<00:00, 12.88s/it]\n",
+ "\n",
"Parallel processing done\n",
"DONE: Transforming each example...\n",
"(freq) number of missing entries :\t 996 out of 200×4×5=4000 total\n",
@@ -131,40 +131,39 @@
"(non-freq) number of missing entries :\t 1510389 out of 200×4×1953=1562400 total\n",
"\n",
"(N × L × ^D) table :\t (200, 4, 1983)\n",
- "Time elapsed: 39.815167 seconds\n",
+ "Time elapsed: 27.030075 seconds\n",
"Discretizing features...\n",
"\n",
"Processing 1978 non-boolean variable columns...\n",
" Computing bin edges for numeric variables...\n",
- "100%|██████████████████████████████████████| 1978/1978 [00:06<00:00, 328.38it/s]\n",
+ "100%|██████████████████████████████████████| 1978/1978 [00:04<00:00, 399.11it/s]\n",
" Discretizing variables to binary features\n",
- "100%|██████████████████████████████████████| 1978/1978 [00:09<00:00, 201.94it/s]\n",
- "\u001b[0m\u001b[0m\u001b[0m\u001b[0mFinished discretizing features\n",
+ "100%|██████████████████████████████████████| 1978/1978 [00:10<00:00, 193.81it/s]\n",
+ "Finished discretizing features\n",
"\n",
"Output\n",
- "X_all: shape=(200, 4, 3557), density=0.025\n",
- "Time elapsed: 57.075922 seconds\n",
+ "X_all: shape=(200, 4, 3582), density=0.025\n",
+ "Time elapsed: 43.360937 seconds\n",
"\n",
"--------------------------------------------------------------------------------\n",
"3-B) Post-filter time-dependent data\n",
"--------------------------------------------------------------------------------\n",
- "(200, 4, 3557) 0.02504322462749508\n",
- "Original : 3557\n",
+ "(200, 4, 3582) 0.024868439419318815\n",
+ "Original : 3582\n",
"Nearly-constant: 77\n",
- "*** time: 8.839366912841797\n",
- "Correlated : 1137\n",
- "*** time: 16.099601984024048\n",
+ "*** time: 5.742851972579956\n",
+ "Correlated : 1144\n",
+ "*** time: 10.776153087615967\n",
"\n",
"Output\n",
- "X: shape=(200, 4, 2343), density=0.034\n",
- "(200, 4, 2343) 0.03446382842509603\n",
- "Time elapsed: 73.185729 seconds\n",
+ "X: shape=(200, 4, 2361), density=0.034\n",
+ "(200, 4, 2361) 0.034196844557390936\n",
+ "Time elapsed: 54.146272 seconds\n",
"\n",
"Output\n",
- "X: shape=(200, 4, 2343), density=0.034\n",
- "Total time: 73.237736 seconds\n",
- "\n",
- "\u001b[0m"
+ "X: shape=(200, 4, 2361), density=0.034\n",
+ "Total time: 54.197789 seconds\n",
+ "\n"
]
}
],
@@ -1054,7 +1053,7 @@
" \n",
" \n",
"\n",
- "
800 rows × 3557 columns
\n",
+ "800 rows × 3582 columns
\n",
""
],
"text/plain": [
@@ -1184,7 +1183,7 @@
" [2.0, 3.0) 0 \n",
" [3.0, 4.0) 0 \n",
"\n",
- "[800 rows x 3557 columns]"
+ "[800 rows x 3582 columns]"
]
},
"metadata": {},
@@ -1220,7 +1219,7 @@
},
{
"cell_type": "code",
- "execution_count": 5,
+ "execution_count": 1,
"metadata": {},
"outputs": [],
"source": [
@@ -1229,7 +1228,7 @@
},
{
"cell_type": "code",
- "execution_count": 6,
+ "execution_count": 2,
"metadata": {},
"outputs": [
{
@@ -1293,23 +1292,23 @@
"--------------------------------------------------------------------------------\n",
"(N × ^d) table :\t (200, 12)\n",
"number of missing entries :\t 4 out of 2400 total\n",
- "Time elapsed: 0.018090 seconds\n",
+ "Time elapsed: 0.016319 seconds\n",
"\n",
"Output\n",
"S_all, binary features :\t (200, 84)\n",
- "Time elapsed: 0.180124 seconds\n",
+ "Time elapsed: 0.277533 seconds\n",
"\n",
"--------------------------------------------------------------------------------\n",
"3-A) Post-filter time-invariant data\n",
"--------------------------------------------------------------------------------\n",
"Original : 84\n",
- "Nearly-constant: 2\n",
- "Correlated : 7\n",
- "Time elapsed: 0.184865 seconds\n",
+ "Nearly-constant: 0\n",
+ "Correlated : 8\n",
+ "Time elapsed: 0.287127 seconds\n",
"\n",
"Output\n",
- "S: shape=(200, 75), density=0.176\n",
- "Total time: 0.188878 seconds\n",
+ "S: shape=(200, 76), density=0.200\n",
+ "Total time: 0.291958 seconds\n",
"\n",
"\n",
"--------------------------------------------------------------------------------\n",
@@ -1323,8 +1322,8 @@
"\n",
"Transforming each example...\n",
"Batches of size 100: 2\n",
- "100%|█████████████████████████████████████████████| 2/2 [00:35<00:00, 17.88s/it]\n",
- "\u001b[0m\u001b[0m\u001b[0m\u001b[0m\n",
+ "100%|█████████████████████████████████████████████| 2/2 [00:24<00:00, 12.47s/it]\n",
+ "\n",
"Parallel processing done\n",
"DONE: Transforming each example...\n",
"(freq) number of missing entries :\t 996 out of 200×4×5=4000 total\n",
@@ -1333,40 +1332,39 @@
"(non-freq) number of missing entries :\t 1510389 out of 200×4×1953=1562400 total\n",
"\n",
"(N × L × ^D) table :\t (200, 4, 1983)\n",
- "Time elapsed: 37.294821 seconds\n",
+ "Time elapsed: 26.302975 seconds\n",
"Discretizing features...\n",
"\n",
"Processing 1978 non-boolean variable columns...\n",
" Computing bin edges for numeric variables...\n",
- "100%|██████████████████████████████████████| 1978/1978 [00:05<00:00, 377.85it/s]\n",
+ "100%|██████████████████████████████████████| 1978/1978 [00:04<00:00, 399.19it/s]\n",
" Discretizing variables to binary features\n",
- "100%|██████████████████████████████████████| 1978/1978 [00:14<00:00, 139.24it/s]\n",
- "\u001b[0m\u001b[0m\u001b[0m\u001b[0mFinished discretizing features\n",
+ "100%|██████████████████████████████████████| 1978/1978 [00:09<00:00, 208.45it/s]\n",
+ "Finished discretizing features\n",
"\n",
"Output\n",
- "X_all: shape=(200, 4, 3587), density=0.039\n",
- "Time elapsed: 58.029910 seconds\n",
+ "X_all: shape=(200, 4, 3587), density=0.036\n",
+ "Time elapsed: 41.840676 seconds\n",
"\n",
"--------------------------------------------------------------------------------\n",
"3-B) Post-filter time-dependent data\n",
"--------------------------------------------------------------------------------\n",
- "(200, 4, 3587) 0.03878101477557848\n",
+ "(200, 4, 3587) 0.036313771954279345\n",
"Original : 3587\n",
- "Nearly-constant: 3\n",
- "*** time: 7.768070220947266\n",
- "Correlated : 1194\n",
- "*** time: 14.502072095870972\n",
+ "Nearly-constant: 0\n",
+ "*** time: 5.449969053268433\n",
+ "Correlated : 1173\n",
+ "*** time: 10.53041410446167\n",
"\n",
"Output\n",
- "X: shape=(200, 4, 2390), density=0.048\n",
- "(200, 4, 2390) 0.04819874476987448\n",
- "Time elapsed: 72.538985 seconds\n",
+ "X: shape=(200, 4, 2414), density=0.049\n",
+ "(200, 4, 2414) 0.048544946147473074\n",
+ "Time elapsed: 52.379346 seconds\n",
"\n",
"Output\n",
- "X: shape=(200, 4, 2390), density=0.048\n",
- "Total time: 72.603644 seconds\n",
- "\n",
- "\u001b[0m"
+ "X: shape=(200, 4, 2414), density=0.049\n",
+ "Total time: 52.431078 seconds\n",
+ "\n"
]
}
],
@@ -1384,7 +1382,7 @@
},
{
"cell_type": "code",
- "execution_count": 7,
+ "execution_count": 3,
"metadata": {},
"outputs": [
{
@@ -1417,7 +1415,7 @@
" ADMISSION_TYPE_value_ELECTIVE | \n",
" ADMISSION_TYPE_value_EMERGENCY | \n",
" ADMISSION_TYPE_value_URGENT | \n",
- " AGE_value>=19.737885622780315 | \n",
+ " AGE_value>19.737885622780315 | \n",
" ... | \n",
" RELIGION_value_EPISCOPALIAN | \n",
" RELIGION_value_GREEK ORTHODOX | \n",
@@ -1824,19 +1822,19 @@
"201125 0 1 \n",
"201128 0 1 \n",
"\n",
- " ADMISSION_TYPE_value_URGENT AGE_value>=19.737885622780315 ... \\\n",
- "ID ... \n",
- "200001 0 1 ... \n",
- "200010 0 1 ... \n",
- "200016 0 1 ... \n",
- "200033 0 1 ... \n",
- "200034 0 1 ... \n",
- "... ... ... ... \n",
- "201110 0 1 ... \n",
- "201113 0 1 ... \n",
- "201124 0 1 ... \n",
- "201125 0 1 ... \n",
- "201128 0 1 ... \n",
+ " ADMISSION_TYPE_value_URGENT AGE_value>19.737885622780315 ... \\\n",
+ "ID ... \n",
+ "200001 0 1 ... \n",
+ "200010 0 1 ... \n",
+ "200016 0 1 ... \n",
+ "200033 0 1 ... \n",
+ "200034 0 1 ... \n",
+ "... ... ... ... \n",
+ "201110 0 1 ... \n",
+ "201113 0 1 ... \n",
+ "201124 0 1 ... \n",
+ "201125 0 1 ... \n",
+ "201128 0 1 ... \n",
"\n",
" RELIGION_value_EPISCOPALIAN RELIGION_value_GREEK ORTHODOX \\\n",
"ID \n",
@@ -1941,22 +1939,22 @@
" RR_mask | \n",
" SpO2_mask | \n",
" SysBP_mask | \n",
- " 220048_value_1 | \n",
- " 220048: 1st AV (First degree AV Block) _value_1 | \n",
- " 220048: 3rd AV (Complete Heart Block) _value_1 | \n",
- " 220048: A Flut (Atrial Flutter) _value_1 | \n",
- " 220048: AF (Atrial Fibrillation)_value_1 | \n",
+ " 220046_value>10.0 | \n",
+ " 220046_value>120.0 | \n",
+ " 220047_value>29.0 | \n",
+ " 220047_value>50.0 | \n",
+ " 220047_value>55.0 | \n",
" ... | \n",
- " SysBP_mean>=66.0 | \n",
- " SysBP_mean>=103.4 | \n",
- " SysBP_mean>=114.43333333333334 | \n",
- " SysBP_mean>=125.0 | \n",
- " SysBP_mean>=138.0 | \n",
- " SysBP_max>=66.0 | \n",
- " SysBP_max>=105.0 | \n",
- " SysBP_max>=116.0 | \n",
- " SysBP_max>=127.0 | \n",
- " SysBP_max>=141.0 | \n",
+ " SysBP_mean>66.0 | \n",
+ " SysBP_mean>103.4 | \n",
+ " SysBP_mean>114.43333333333334 | \n",
+ " SysBP_mean>125.0 | \n",
+ " SysBP_mean>138.0 | \n",
+ " SysBP_max>66.0 | \n",
+ " SysBP_max>105.0 | \n",
+ " SysBP_max>116.0 | \n",
+ " SysBP_max>127.0 | \n",
+ " SysBP_max>141.0 | \n",
" \n",
" \n",
" ID | \n",
@@ -1995,9 +1993,9 @@
" 1 | \n",
" 1 | \n",
" 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
+ " 1 | \n",
+ " 1 | \n",
+ " 1 | \n",
" ... | \n",
" 1 | \n",
" 1 | \n",
@@ -2017,7 +2015,7 @@
" 1 | \n",
" 1 | \n",
" 1 | \n",
- " 1 | \n",
+ " 0 | \n",
" 0 | \n",
" 0 | \n",
" 0 | \n",
@@ -2041,7 +2039,7 @@
" 1 | \n",
" 1 | \n",
" 1 | \n",
- " 1 | \n",
+ " 0 | \n",
" 0 | \n",
" 0 | \n",
" 0 | \n",
@@ -2054,7 +2052,7 @@
" 0 | \n",
" 1 | \n",
" 1 | \n",
- " 1 | \n",
+ " 0 | \n",
" 0 | \n",
" 0 | \n",
"
\n",
@@ -2065,7 +2063,7 @@
" 1 | \n",
" 1 | \n",
" 1 | \n",
- " 1 | \n",
+ " 0 | \n",
" 0 | \n",
" 0 | \n",
" 0 | \n",
@@ -2090,9 +2088,9 @@
" 0 | \n",
" 0 | \n",
" 0 | \n",
+ " 1 | \n",
" 0 | \n",
- " 0 | \n",
- " 0 | \n",
+ " 1 | \n",
" 0 | \n",
" 0 | \n",
" ... | \n",
@@ -2141,10 +2139,10 @@
" 1 | \n",
" 1 | \n",
" 1 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
+ " 1 | \n",
+ " 1 | \n",
+ " 1 | \n",
+ " 1 | \n",
" ... | \n",
" 1 | \n",
" 1 | \n",
@@ -2191,7 +2189,7 @@
" 1 | \n",
" 1 | \n",
" 0 | \n",
- " 0 | \n",
+ " 1 | \n",
" 0 | \n",
" 0 | \n",
" ... | \n",
@@ -2213,7 +2211,7 @@
" 1 | \n",
" 0 | \n",
" 1 | \n",
- " 1 | \n",
+ " 0 | \n",
" 0 | \n",
" 0 | \n",
" 0 | \n",
@@ -2237,7 +2235,7 @@
" 1 | \n",
" 0 | \n",
" 1 | \n",
- " 1 | \n",
+ " 0 | \n",
" 0 | \n",
" 0 | \n",
" 0 | \n",
@@ -2274,131 +2272,89 @@
" [2.0, 3.0) 1 1 1 0 1 \n",
" [3.0, 4.0) 1 1 1 0 1 \n",
"\n",
- " 220048_value_1 \\\n",
- "ID t_range \n",
- "200001 [0.0, 1.0) 1 \n",
- " [1.0, 2.0) 1 \n",
- " [2.0, 3.0) 1 \n",
- " [3.0, 4.0) 1 \n",
- "200010 [0.0, 1.0) 0 \n",
- "... ... \n",
- "201125 [3.0, 4.0) 1 \n",
- "201128 [0.0, 1.0) 0 \n",
- " [1.0, 2.0) 1 \n",
- " [2.0, 3.0) 1 \n",
- " [3.0, 4.0) 1 \n",
- "\n",
- " 220048: 1st AV (First degree AV Block) _value_1 \\\n",
+ " 220046_value>10.0 220046_value>120.0 220047_value>29.0 \\\n",
+ "ID t_range \n",
+ "200001 [0.0, 1.0) 1 0 1 \n",
+ " [1.0, 2.0) 0 0 0 \n",
+ " [2.0, 3.0) 0 0 0 \n",
+ " [3.0, 4.0) 0 0 0 \n",
+ "200010 [0.0, 1.0) 1 0 1 \n",
+ "... ... ... ... \n",
+ "201125 [3.0, 4.0) 1 1 1 \n",
+ "201128 [0.0, 1.0) 0 0 0 \n",
+ " [1.0, 2.0) 1 0 1 \n",
+ " [2.0, 3.0) 0 0 0 \n",
+ " [3.0, 4.0) 0 0 0 \n",
+ "\n",
+ " 220047_value>50.0 220047_value>55.0 ... SysBP_mean>66.0 \\\n",
+ "ID t_range ... \n",
+ "200001 [0.0, 1.0) 1 1 ... 1 \n",
+ " [1.0, 2.0) 0 0 ... 1 \n",
+ " [2.0, 3.0) 0 0 ... 1 \n",
+ " [3.0, 4.0) 0 0 ... 1 \n",
+ "200010 [0.0, 1.0) 0 0 ... 0 \n",
+ "... ... ... ... ... \n",
+ "201125 [3.0, 4.0) 1 1 ... 1 \n",
+ "201128 [0.0, 1.0) 0 0 ... 0 \n",
+ " [1.0, 2.0) 0 0 ... 1 \n",
+ " [2.0, 3.0) 0 0 ... 1 \n",
+ " [3.0, 4.0) 0 0 ... 1 \n",
+ "\n",
+ " SysBP_mean>103.4 SysBP_mean>114.43333333333334 \\\n",
"ID t_range \n",
- "200001 [0.0, 1.0) 0 \n",
- " [1.0, 2.0) 0 \n",
- " [2.0, 3.0) 0 \n",
- " [3.0, 4.0) 0 \n",
- "200010 [0.0, 1.0) 0 \n",
- "... ... \n",
- "201125 [3.0, 4.0) 0 \n",
- "201128 [0.0, 1.0) 0 \n",
- " [1.0, 2.0) 0 \n",
- " [2.0, 3.0) 0 \n",
- " [3.0, 4.0) 0 \n",
- "\n",
- " 220048: 3rd AV (Complete Heart Block) _value_1 \\\n",
- "ID t_range \n",
- "200001 [0.0, 1.0) 0 \n",
- " [1.0, 2.0) 0 \n",
- " [2.0, 3.0) 0 \n",
- " [3.0, 4.0) 0 \n",
- "200010 [0.0, 1.0) 0 \n",
- "... ... \n",
- "201125 [3.0, 4.0) 0 \n",
- "201128 [0.0, 1.0) 0 \n",
- " [1.0, 2.0) 0 \n",
- " [2.0, 3.0) 0 \n",
- " [3.0, 4.0) 0 \n",
- "\n",
- " 220048: A Flut (Atrial Flutter) _value_1 \\\n",
- "ID t_range \n",
- "200001 [0.0, 1.0) 0 \n",
- " [1.0, 2.0) 0 \n",
- " [2.0, 3.0) 0 \n",
- " [3.0, 4.0) 0 \n",
- "200010 [0.0, 1.0) 0 \n",
- "... ... \n",
- "201125 [3.0, 4.0) 0 \n",
- "201128 [0.0, 1.0) 0 \n",
- " [1.0, 2.0) 0 \n",
- " [2.0, 3.0) 0 \n",
- " [3.0, 4.0) 0 \n",
- "\n",
- " 220048: AF (Atrial Fibrillation)_value_1 ... \\\n",
- "ID t_range ... \n",
- "200001 [0.0, 1.0) 0 ... \n",
- " [1.0, 2.0) 0 ... \n",
- " [2.0, 3.0) 0 ... \n",
- " [3.0, 4.0) 0 ... \n",
- "200010 [0.0, 1.0) 0 ... \n",
- "... ... ... \n",
- "201125 [3.0, 4.0) 0 ... \n",
- "201128 [0.0, 1.0) 0 ... \n",
- " [1.0, 2.0) 0 ... \n",
- " [2.0, 3.0) 0 ... \n",
- " [3.0, 4.0) 0 ... \n",
- "\n",
- " SysBP_mean>=66.0 SysBP_mean>=103.4 \\\n",
- "ID t_range \n",
- "200001 [0.0, 1.0) 1 1 \n",
- " [1.0, 2.0) 1 1 \n",
- " [2.0, 3.0) 1 1 \n",
- " [3.0, 4.0) 1 0 \n",
- "200010 [0.0, 1.0) 0 0 \n",
- "... ... ... \n",
- "201125 [3.0, 4.0) 1 1 \n",
- "201128 [0.0, 1.0) 0 0 \n",
- " [1.0, 2.0) 1 1 \n",
- " [2.0, 3.0) 1 1 \n",
- " [3.0, 4.0) 1 1 \n",
- "\n",
- " SysBP_mean>=114.43333333333334 SysBP_mean>=125.0 \\\n",
+ "200001 [0.0, 1.0) 1 0 \n",
+ " [1.0, 2.0) 1 0 \n",
+ " [2.0, 3.0) 1 1 \n",
+ " [3.0, 4.0) 0 0 \n",
+ "200010 [0.0, 1.0) 0 0 \n",
+ "... ... ... \n",
+ "201125 [3.0, 4.0) 1 1 \n",
+ "201128 [0.0, 1.0) 0 0 \n",
+ " [1.0, 2.0) 1 1 \n",
+ " [2.0, 3.0) 1 1 \n",
+ " [3.0, 4.0) 1 1 \n",
+ "\n",
+ " SysBP_mean>125.0 SysBP_mean>138.0 SysBP_max>66.0 \\\n",
+ "ID t_range \n",
+ "200001 [0.0, 1.0) 0 0 1 \n",
+ " [1.0, 2.0) 0 0 1 \n",
+ " [2.0, 3.0) 0 0 1 \n",
+ " [3.0, 4.0) 0 0 1 \n",
+ "200010 [0.0, 1.0) 0 0 0 \n",
+ "... ... ... ... \n",
+ "201125 [3.0, 4.0) 0 0 1 \n",
+ "201128 [0.0, 1.0) 0 0 0 \n",
+ " [1.0, 2.0) 1 0 1 \n",
+ " [2.0, 3.0) 0 0 1 \n",
+ " [3.0, 4.0) 0 0 1 \n",
+ "\n",
+ " SysBP_max>105.0 SysBP_max>116.0 SysBP_max>127.0 \\\n",
"ID t_range \n",
- "200001 [0.0, 1.0) 0 0 \n",
- " [1.0, 2.0) 0 0 \n",
- " [2.0, 3.0) 1 0 \n",
- " [3.0, 4.0) 0 0 \n",
- "200010 [0.0, 1.0) 0 0 \n",
- "... ... ... \n",
- "201125 [3.0, 4.0) 1 0 \n",
- "201128 [0.0, 1.0) 0 0 \n",
- " [1.0, 2.0) 1 1 \n",
- " [2.0, 3.0) 1 0 \n",
- " [3.0, 4.0) 1 0 \n",
- "\n",
- " SysBP_mean>=138.0 SysBP_max>=66.0 SysBP_max>=105.0 \\\n",
- "ID t_range \n",
- "200001 [0.0, 1.0) 0 1 1 \n",
- " [1.0, 2.0) 0 1 1 \n",
- " [2.0, 3.0) 0 1 1 \n",
- " [3.0, 4.0) 0 1 0 \n",
- "200010 [0.0, 1.0) 0 0 0 \n",
- "... ... ... ... \n",
- "201125 [3.0, 4.0) 0 1 1 \n",
- "201128 [0.0, 1.0) 0 0 0 \n",
- " [1.0, 2.0) 0 1 1 \n",
- " [2.0, 3.0) 0 1 1 \n",
- " [3.0, 4.0) 0 1 1 \n",
- "\n",
- " SysBP_max>=116.0 SysBP_max>=127.0 SysBP_max>=141.0 \n",
- "ID t_range \n",
- "200001 [0.0, 1.0) 0 0 0 \n",
- " [1.0, 2.0) 0 0 0 \n",
- " [2.0, 3.0) 1 0 0 \n",
- " [3.0, 4.0) 0 0 0 \n",
- "200010 [0.0, 1.0) 0 0 0 \n",
- "... ... ... ... \n",
- "201125 [3.0, 4.0) 1 0 0 \n",
- "201128 [0.0, 1.0) 0 0 0 \n",
- " [1.0, 2.0) 1 1 0 \n",
- " [2.0, 3.0) 1 0 0 \n",
- " [3.0, 4.0) 1 0 0 \n",
+ "200001 [0.0, 1.0) 1 0 0 \n",
+ " [1.0, 2.0) 1 0 0 \n",
+ " [2.0, 3.0) 1 0 0 \n",
+ " [3.0, 4.0) 0 0 0 \n",
+ "200010 [0.0, 1.0) 0 0 0 \n",
+ "... ... ... ... \n",
+ "201125 [3.0, 4.0) 1 1 0 \n",
+ "201128 [0.0, 1.0) 0 0 0 \n",
+ " [1.0, 2.0) 1 1 1 \n",
+ " [2.0, 3.0) 1 1 0 \n",
+ " [3.0, 4.0) 1 1 0 \n",
+ "\n",
+ " SysBP_max>141.0 \n",
+ "ID t_range \n",
+ "200001 [0.0, 1.0) 0 \n",
+ " [1.0, 2.0) 0 \n",
+ " [2.0, 3.0) 0 \n",
+ " [3.0, 4.0) 0 \n",
+ "200010 [0.0, 1.0) 0 \n",
+ "... ... \n",
+ "201125 [3.0, 4.0) 0 \n",
+ "201128 [0.0, 1.0) 0 \n",
+ " [1.0, 2.0) 0 \n",
+ " [2.0, 3.0) 0 \n",
+ " [3.0, 4.0) 0 \n",
"\n",
"[800 rows x 3587 columns]"
]
@@ -2507,11 +2463,11 @@
"--------------------------------------------------------------------------------\n",
"(N × ^d) table :\t (200, 12)\n",
"number of missing entries :\t 4 out of 2400 total\n",
- "Time elapsed: 0.018502 seconds\n",
+ "Time elapsed: 0.011708 seconds\n",
"\n",
"Output\n",
"S_all, binary features :\t (200, 76)\n",
- "Time elapsed: 0.116800 seconds\n",
+ "Time elapsed: 0.123038 seconds\n",
"\n",
"--------------------------------------------------------------------------------\n",
"3-A) Post-filter time-invariant data\n",
@@ -2519,11 +2475,11 @@
"Original : 76\n",
"Nearly-constant: 0\n",
"Correlated : 7\n",
- "Time elapsed: 0.121063 seconds\n",
+ "Time elapsed: 0.126716 seconds\n",
"\n",
"Output\n",
"S: shape=(200, 69), density=0.162\n",
- "Total time: 0.125685 seconds\n",
+ "Total time: 0.129411 seconds\n",
"\n",
"\n",
"--------------------------------------------------------------------------------\n",
@@ -2537,8 +2493,8 @@
"\n",
"Transforming each example...\n",
"Batches of size 100: 2\n",
- "100%|█████████████████████████████████████████████| 2/2 [00:30<00:00, 15.46s/it]\n",
- "\u001b[0m\u001b[0m\u001b[0m\u001b[0m\n",
+ "100%|█████████████████████████████████████████████| 2/2 [00:23<00:00, 11.65s/it]\n",
+ "\n",
"Parallel processing done\n",
"DONE: Transforming each example...\n",
"(freq) number of missing entries :\t 996 out of 200×4×5=4000 total\n",
@@ -2547,16 +2503,16 @@
"(non-freq) number of missing entries :\t 1510389 out of 200×4×1953=1562400 total\n",
"\n",
"(N × L × ^D) table :\t (200, 4, 1983)\n",
- "Time elapsed: 32.386383 seconds\n",
+ "Time elapsed: 24.511847 seconds\n",
"Discretizing features...\n",
"\n",
"Discretizing categorical features...\n",
- "100%|██████████████████████████████████████| 1990/1990 [00:10<00:00, 190.17it/s]\n",
- "\u001b[0m\u001b[0m\u001b[0m\u001b[0mFinished discretizing features\n",
+ "100%|██████████████████████████████████████| 1990/1990 [00:07<00:00, 266.00it/s]\n",
+ "Finished discretizing features\n",
"\n",
"Output\n",
"X_all: shape=(200, 4, 2588), density=0.582\n",
- "Time elapsed: 46.796057 seconds\n",
+ "Time elapsed: 34.279819 seconds\n",
"\n",
"--------------------------------------------------------------------------------\n",
"3-B) Post-filter time-dependent data\n",
@@ -2564,7 +2520,7 @@
"(200, 4, 2588) 0.5818387751159196\n",
"Original : 2588\n",
"Nearly-constant: 1064\n",
- "*** time: 10.0768461227417\n",
+ "*** time: 5.1737799644470215\n",
"/Users/shengputang/Developer/FIDDLE/FIDDLE/helpers.py:426: RuntimeWarning: invalid value encountered in sqrt\n",
" coeffs = C / np.sqrt(np.outer(d, d))\n",
"/Users/shengputang/Developer/FIDDLE/FIDDLE/helpers.py:426: RuntimeWarning: divide by zero encountered in true_divide\n",
@@ -2574,18 +2530,17 @@
"/Users/shengputang/Developer/FIDDLE/FIDDLE/helpers.py:376: RuntimeWarning: invalid value encountered in multiply\n",
" self.corr_matrix *= np.tri(*self.corr_matrix.shape)\n",
"Correlated : 310\n",
- "*** time: 16.394930124282837\n",
+ "*** time: 8.826726913452148\n",
"\n",
"Output\n",
"X: shape=(200, 4, 1214), density=0.366\n",
"(200, 4, 1214) 0.366085255354201\n",
- "Time elapsed: 63.195710 seconds\n",
+ "Time elapsed: 43.112199 seconds\n",
"\n",
"Output\n",
"X: shape=(200, 4, 1214), density=0.366\n",
- "Total time: 63.452329 seconds\n",
- "\n",
- "\u001b[0m"
+ "Total time: 43.318430 seconds\n",
+ "\n"
]
}
],
@@ -3656,7 +3611,7 @@
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
- "version": "3.8.6"
+ "version": "3.8.5"
}
},
"nbformat": 4,
diff --git a/tests/small_test/Run-docker.ipynb b/tests/small_test/Run-docker.ipynb
index a18976b..c56e7c2 100644
--- a/tests/small_test/Run-docker.ipynb
+++ b/tests/small_test/Run-docker.ipynb
@@ -77,11 +77,11 @@
"--------------------------------------------------------------------------------\n",
"(N × ^d) table :\t (4, 3)\n",
"number of missing entries :\t 3 out of 12 total\n",
- "Time elapsed: 0.044580 seconds\n",
+ "Time elapsed: 0.037138 seconds\n",
"\n",
"Output\n",
"S_all, binary features :\t (4, 6)\n",
- "Time elapsed: 0.274032 seconds\n",
+ "Time elapsed: 0.098682 seconds\n",
"\n",
"--------------------------------------------------------------------------------\n",
"2-B) Transform time-dependent data\n",
@@ -93,7 +93,7 @@
"k = 3 ['min', 'max', 'mean']\n",
"\n",
"Transforming each example...\n",
- "100%|█████████████████████████████████████████████| 4/4 [00:01<00:00, 3.60it/s]\n",
+ "100%|█████████████████████████████████████████████| 4/4 [00:00<00:00, 7.10it/s]\n",
"DONE: Transforming each example...\n",
"(freq) number of missing entries :\t 5 out of 4×4×1=16 total\n",
"(freq) number of imputed entries :\t 4\n",
@@ -101,16 +101,16 @@
"(non-freq) number of missing entries :\t 41 out of 4×4×3=48 total\n",
"\n",
"(N × L × ^D) table :\t (4, 4, 9)\n",
- "Time elapsed: 1.221479 seconds\n",
+ "Time elapsed: 0.652093 seconds\n",
"Discretizing features...\n",
"\n",
"Discretizing categorical features...\n",
- "100%|████████████████████████████████████████████| 9/9 [00:00<00:00, 132.10it/s]\n",
+ "100%|████████████████████████████████████████████| 9/9 [00:00<00:00, 189.23it/s]\n",
"Finished discretizing features\n",
"\n",
"Output\n",
"X_all: shape=(4, 4, 12), density=0.599\n",
- "Time elapsed: 1.397339 seconds\n"
+ "Time elapsed: 0.780475 seconds\n"
]
}
],
@@ -705,11 +705,11 @@
"--------------------------------------------------------------------------------\n",
"(N × ^d) table :\t (4, 3)\n",
"number of missing entries :\t 3 out of 12 total\n",
- "Time elapsed: 0.057177 seconds\n",
+ "Time elapsed: 0.037977 seconds\n",
"\n",
"Output\n",
"S_all, binary features :\t (4, 10)\n",
- "Time elapsed: 0.212313 seconds\n",
+ "Time elapsed: 0.101355 seconds\n",
"\n",
"--------------------------------------------------------------------------------\n",
"2-B) Transform time-dependent data\n",
@@ -721,7 +721,7 @@
"k = 3 ['min', 'max', 'mean']\n",
"\n",
"Transforming each example...\n",
- "100%|█████████████████████████████████████████████| 4/4 [00:01<00:00, 2.82it/s]\n",
+ "100%|█████████████████████████████████████████████| 4/4 [00:00<00:00, 6.19it/s]\n",
"DONE: Transforming each example...\n",
"(freq) number of missing entries :\t 5 out of 4×4×1=16 total\n",
"(freq) number of imputed entries :\t 4\n",
@@ -729,19 +729,19 @@
"(non-freq) number of missing entries :\t 41 out of 4×4×3=48 total\n",
"\n",
"(N × L × ^D) table :\t (4, 4, 9)\n",
- "Time elapsed: 1.567708 seconds\n",
+ "Time elapsed: 0.732639 seconds\n",
"Discretizing features...\n",
"\n",
"Processing 8 non-boolean variable columns...\n",
" Computing bin edges for numeric variables...\n",
- "100%|█████████████████████████████████████████████| 8/8 [00:00<00:00, 72.63it/s]\n",
+ "100%|████████████████████████████████████████████| 8/8 [00:00<00:00, 323.78it/s]\n",
" Discretizing variables to binary features\n",
- "100%|█████████████████████████████████████████████| 8/8 [00:00<00:00, 28.40it/s]\n",
+ "100%|████████████████████████████████████████████| 8/8 [00:00<00:00, 110.27it/s]\n",
"Finished discretizing features\n",
"\n",
"Output\n",
"X_all: shape=(4, 4, 29), density=0.203\n",
- "Time elapsed: 2.102018 seconds\n"
+ "Time elapsed: 0.880507 seconds\n"
]
}
],
@@ -1627,11 +1627,11 @@
"--------------------------------------------------------------------------------\n",
"(N × ^d) table :\t (4, 3)\n",
"number of missing entries :\t 3 out of 12 total\n",
- "Time elapsed: 0.047925 seconds\n",
+ "Time elapsed: 0.023125 seconds\n",
"\n",
"Output\n",
"S_all, binary features :\t (4, 10)\n",
- "Time elapsed: 0.147781 seconds\n",
+ "Time elapsed: 0.106754 seconds\n",
"\n",
"--------------------------------------------------------------------------------\n",
"2-B) Transform time-dependent data\n",
@@ -1643,7 +1643,7 @@
"k = 3 ['min', 'max', 'mean']\n",
"\n",
"Transforming each example...\n",
- "100%|█████████████████████████████████████████████| 4/4 [00:01<00:00, 3.53it/s]\n",
+ "100%|█████████████████████████████████████████████| 4/4 [00:00<00:00, 4.61it/s]\n",
"DONE: Transforming each example...\n",
"(freq) number of missing entries :\t 5 out of 4×4×1=16 total\n",
"(freq) number of imputed entries :\t 4\n",
@@ -1651,19 +1651,19 @@
"(non-freq) number of missing entries :\t 41 out of 4×4×3=48 total\n",
"\n",
"(N × L × ^D) table :\t (4, 4, 9)\n",
- "Time elapsed: 1.239074 seconds\n",
+ "Time elapsed: 0.947634 seconds\n",
"Discretizing features...\n",
"\n",
"Processing 8 non-boolean variable columns...\n",
" Computing bin edges for numeric variables...\n",
- "100%|████████████████████████████████████████████| 8/8 [00:00<00:00, 165.76it/s]\n",
+ "100%|████████████████████████████████████████████| 8/8 [00:00<00:00, 190.83it/s]\n",
" Discretizing variables to binary features\n",
- "100%|█████████████████████████████████████████████| 8/8 [00:00<00:00, 24.97it/s]\n",
+ "100%|█████████████████████████████████████████████| 8/8 [00:00<00:00, 46.71it/s]\n",
"Finished discretizing features\n",
"\n",
"Output\n",
"X_all: shape=(4, 4, 29), density=0.474\n",
- "Time elapsed: 1.718451 seconds\n"
+ "Time elapsed: 1.240619 seconds\n"
]
}
],
@@ -2465,7 +2465,7 @@
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
- "version": "3.8.6"
+ "version": "3.8.5"
}
},
"nbformat": 4,
diff --git a/tests/small_test/Run.ipynb b/tests/small_test/Run.ipynb
index b9a073f..ac2f626 100644
--- a/tests/small_test/Run.ipynb
+++ b/tests/small_test/Run.ipynb
@@ -2484,7 +2484,7 @@
},
{
"cell_type": "code",
- "execution_count": 11,
+ "execution_count": 1,
"metadata": {},
"outputs": [],
"source": [
@@ -2493,7 +2493,7 @@
},
{
"cell_type": "code",
- "execution_count": 12,
+ "execution_count": 2,
"metadata": {},
"outputs": [
{
@@ -2545,11 +2545,11 @@
"--------------------------------------------------------------------------------\n",
"(N × ^d) table :\t (4, 3)\n",
"number of missing entries :\t 3 out of 12 total\n",
- "Time elapsed: 0.018871 seconds\n",
+ "Time elapsed: 0.015474 seconds\n",
"\n",
"Output\n",
- "s_all, binary features :\t (4, 10)\n",
- "Time elapsed: 0.061661 seconds\n",
+ "S_all, binary features :\t (4, 10)\n",
+ "Time elapsed: 0.057708 seconds\n",
"\n",
"--------------------------------------------------------------------------------\n",
"2-B) Transform time-dependent data\n",
@@ -2561,7 +2561,7 @@
"k = 3 ['min', 'max', 'mean']\n",
"\n",
"Transforming each example...\n",
- "100%|█████████████████████████████████████████████| 4/4 [00:00<00:00, 5.89it/s]\n",
+ "100%|█████████████████████████████████████████████| 4/4 [00:00<00:00, 8.43it/s]\n",
"DONE: Transforming each example...\n",
"(freq) number of missing entries :\t 5 out of 4×4×1=16 total\n",
"(freq) number of imputed entries :\t 4\n",
@@ -2569,20 +2569,19 @@
"(non-freq) number of missing entries :\t 41 out of 4×4×3=48 total\n",
"\n",
"(N × L × ^D) table :\t (4, 4, 9)\n",
- "Time elapsed: 0.735244 seconds\n",
+ "Time elapsed: 0.529465 seconds\n",
"Discretizing features...\n",
"\n",
"Processing 8 non-boolean variable columns...\n",
" Computing bin edges for numeric variables...\n",
- "100%|████████████████████████████████████████████| 8/8 [00:00<00:00, 313.93it/s]\n",
+ "100%|████████████████████████████████████████████| 8/8 [00:00<00:00, 501.69it/s]\n",
" Discretizing variables to binary features\n",
- "100%|█████████████████████████████████████████████| 8/8 [00:00<00:00, 38.42it/s]\n",
+ "100%|█████████████████████████████████████████████| 8/8 [00:00<00:00, 82.33it/s]\n",
"Finished discretizing features\n",
"\n",
"Output\n",
"X_all: shape=(4, 4, 29), density=0.420\n",
- "Time elapsed: 0.989317 seconds\n",
- "\u001b[0m"
+ "Time elapsed: 0.665394 seconds\n"
]
}
],
@@ -2601,7 +2600,7 @@
},
{
"cell_type": "code",
- "execution_count": 13,
+ "execution_count": 3,
"metadata": {},
"outputs": [
{
@@ -2625,11 +2624,11 @@
" \n",
" \n",
" | \n",
- " AGE_value>=33.0 | \n",
- " AGE_value>=35.8 | \n",
- " AGE_value>=38.6 | \n",
- " AGE_value>=42.0 | \n",
- " AGE_value>=46.0 | \n",
+ " AGE_value>33.0 | \n",
+ " AGE_value>35.8 | \n",
+ " AGE_value>38.6 | \n",
+ " AGE_value>42.0 | \n",
+ " AGE_value>46.0 | \n",
" ROOM_value__101 | \n",
" ROOM_value__102 | \n",
" ROOM_value__103 | \n",
@@ -2708,19 +2707,19 @@
""
],
"text/plain": [
- " AGE_value>=33.0 AGE_value>=35.8 AGE_value>=38.6 AGE_value>=42.0 \\\n",
- "ID \n",
- "1 1 1 1 1 \n",
- "2 0 0 0 0 \n",
- "3 1 1 1 0 \n",
- "4 0 0 0 0 \n",
+ " AGE_value>33.0 AGE_value>35.8 AGE_value>38.6 AGE_value>42.0 \\\n",
+ "ID \n",
+ "1 1 1 1 1 \n",
+ "2 0 0 0 0 \n",
+ "3 1 1 1 0 \n",
+ "4 0 0 0 0 \n",
"\n",
- " AGE_value>=46.0 ROOM_value__101 ROOM_value__102 ROOM_value__103 \\\n",
- "ID \n",
- "1 1 1 0 0 \n",
- "2 0 0 1 0 \n",
- "3 0 0 0 1 \n",
- "4 0 0 0 0 \n",
+ " AGE_value>46.0 ROOM_value__101 ROOM_value__102 ROOM_value__103 \\\n",
+ "ID \n",
+ "1 1 1 0 0 \n",
+ "2 0 0 1 0 \n",
+ "3 0 0 0 1 \n",
+ "4 0 0 0 0 \n",
"\n",
" SEX_value_F SEX_value_M \n",
"ID \n",
@@ -2762,20 +2761,20 @@
" DRUG_A_ROUTE_value_Oral | \n",
" LAB_X_value_5 | \n",
" LAB_X_value_<1 | \n",
- " HR_delta_time>=0.0 | \n",
- " HR_delta_time>=1.0 | \n",
- " HR_value>=61.0 | \n",
+ " HR_delta_time>0.0 | \n",
+ " HR_delta_time>1.0 | \n",
+ " HR_value>61.0 | \n",
" ... | \n",
- " HR_max>=61.0 | \n",
- " HR_max>=69.2 | \n",
- " HR_max>=73.6 | \n",
- " HR_max>=76.2 | \n",
- " HR_max>=82.00000000000001 | \n",
- " HR_mean>=60.333333333333336 | \n",
- " HR_mean>=68.80000000000001 | \n",
- " HR_mean>=73.6 | \n",
- " HR_mean>=75.2 | \n",
- " HR_mean>=82.00000000000001 | \n",
+ " HR_max>61.0 | \n",
+ " HR_max>69.2 | \n",
+ " HR_max>73.6 | \n",
+ " HR_max>76.2 | \n",
+ " HR_max>82.00000000000001 | \n",
+ " HR_mean>60.333333333333336 | \n",
+ " HR_mean>68.80000000000001 | \n",
+ " HR_mean>73.6 | \n",
+ " HR_mean>75.2 | \n",
+ " HR_mean>82.00000000000001 | \n",
"
\n",
" \n",
" ID | \n",
@@ -3236,100 +3235,100 @@
" [2.0, 3.0) 0 0 0 \n",
" [3.0, 4.0) 0 0 0 \n",
"\n",
- " LAB_X_value_<1 HR_delta_time>=0.0 HR_delta_time>=1.0 \\\n",
- "ID t_range \n",
- "1 [0.0, 1.0) 0 0 0 \n",
- " [1.0, 2.0) 0 0 0 \n",
- " [2.0, 3.0) 1 0 0 \n",
- " [3.0, 4.0) 0 0 0 \n",
- "2 [0.0, 1.0) 0 0 0 \n",
- " [1.0, 2.0) 0 1 0 \n",
- " [2.0, 3.0) 0 0 0 \n",
- " [3.0, 4.0) 0 0 0 \n",
- "3 [0.0, 1.0) 0 0 0 \n",
- " [1.0, 2.0) 0 0 0 \n",
- " [2.0, 3.0) 0 1 0 \n",
- " [3.0, 4.0) 0 1 1 \n",
- "4 [0.0, 1.0) 0 0 0 \n",
- " [1.0, 2.0) 0 1 0 \n",
- " [2.0, 3.0) 0 0 0 \n",
- " [3.0, 4.0) 0 0 0 \n",
+ " LAB_X_value_<1 HR_delta_time>0.0 HR_delta_time>1.0 \\\n",
+ "ID t_range \n",
+ "1 [0.0, 1.0) 0 0 0 \n",
+ " [1.0, 2.0) 0 0 0 \n",
+ " [2.0, 3.0) 1 0 0 \n",
+ " [3.0, 4.0) 0 0 0 \n",
+ "2 [0.0, 1.0) 0 0 0 \n",
+ " [1.0, 2.0) 0 1 0 \n",
+ " [2.0, 3.0) 0 0 0 \n",
+ " [3.0, 4.0) 0 0 0 \n",
+ "3 [0.0, 1.0) 0 0 0 \n",
+ " [1.0, 2.0) 0 0 0 \n",
+ " [2.0, 3.0) 0 1 0 \n",
+ " [3.0, 4.0) 0 1 1 \n",
+ "4 [0.0, 1.0) 0 0 0 \n",
+ " [1.0, 2.0) 0 1 0 \n",
+ " [2.0, 3.0) 0 0 0 \n",
+ " [3.0, 4.0) 0 0 0 \n",
"\n",
- " HR_value>=61.0 ... HR_max>=61.0 HR_max>=69.2 HR_max>=73.6 \\\n",
- "ID t_range ... \n",
- "1 [0.0, 1.0) 1 ... 1 1 0 \n",
- " [1.0, 2.0) 1 ... 1 1 0 \n",
- " [2.0, 3.0) 1 ... 1 1 1 \n",
- " [3.0, 4.0) 1 ... 1 1 1 \n",
- "2 [0.0, 1.0) 0 ... 0 0 0 \n",
- " [1.0, 2.0) 0 ... 0 0 0 \n",
- " [2.0, 3.0) 1 ... 1 1 1 \n",
- " [3.0, 4.0) 1 ... 1 1 1 \n",
- "3 [0.0, 1.0) 0 ... 0 0 0 \n",
- " [1.0, 2.0) 1 ... 1 1 1 \n",
- " [2.0, 3.0) 1 ... 1 1 1 \n",
- " [3.0, 4.0) 1 ... 1 1 1 \n",
- "4 [0.0, 1.0) 1 ... 1 1 1 \n",
- " [1.0, 2.0) 1 ... 1 1 1 \n",
- " [2.0, 3.0) 1 ... 1 0 0 \n",
- " [3.0, 4.0) 1 ... 1 1 0 \n",
+ " HR_value>61.0 ... HR_max>61.0 HR_max>69.2 HR_max>73.6 \\\n",
+ "ID t_range ... \n",
+ "1 [0.0, 1.0) 1 ... 1 1 0 \n",
+ " [1.0, 2.0) 1 ... 1 1 0 \n",
+ " [2.0, 3.0) 1 ... 1 1 1 \n",
+ " [3.0, 4.0) 1 ... 1 1 1 \n",
+ "2 [0.0, 1.0) 0 ... 0 0 0 \n",
+ " [1.0, 2.0) 0 ... 0 0 0 \n",
+ " [2.0, 3.0) 1 ... 1 1 1 \n",
+ " [3.0, 4.0) 1 ... 1 1 1 \n",
+ "3 [0.0, 1.0) 0 ... 0 0 0 \n",
+ " [1.0, 2.0) 1 ... 1 1 1 \n",
+ " [2.0, 3.0) 1 ... 1 1 1 \n",
+ " [3.0, 4.0) 1 ... 1 1 1 \n",
+ "4 [0.0, 1.0) 1 ... 1 1 1 \n",
+ " [1.0, 2.0) 1 ... 1 1 1 \n",
+ " [2.0, 3.0) 1 ... 1 0 0 \n",
+ " [3.0, 4.0) 1 ... 1 1 0 \n",
"\n",
- " HR_max>=76.2 HR_max>=82.00000000000001 \\\n",
- "ID t_range \n",
- "1 [0.0, 1.0) 0 0 \n",
- " [1.0, 2.0) 0 0 \n",
- " [2.0, 3.0) 0 0 \n",
- " [3.0, 4.0) 0 0 \n",
- "2 [0.0, 1.0) 0 0 \n",
- " [1.0, 2.0) 0 0 \n",
- " [2.0, 3.0) 1 0 \n",
- " [3.0, 4.0) 0 0 \n",
- "3 [0.0, 1.0) 0 0 \n",
- " [1.0, 2.0) 1 1 \n",
- " [2.0, 3.0) 1 1 \n",
- " [3.0, 4.0) 1 1 \n",
- "4 [0.0, 1.0) 1 0 \n",
- " [1.0, 2.0) 1 0 \n",
- " [2.0, 3.0) 0 0 \n",
- " [3.0, 4.0) 0 0 \n",
+ " HR_max>76.2 HR_max>82.00000000000001 \\\n",
+ "ID t_range \n",
+ "1 [0.0, 1.0) 0 0 \n",
+ " [1.0, 2.0) 0 0 \n",
+ " [2.0, 3.0) 0 0 \n",
+ " [3.0, 4.0) 0 0 \n",
+ "2 [0.0, 1.0) 0 0 \n",
+ " [1.0, 2.0) 0 0 \n",
+ " [2.0, 3.0) 1 0 \n",
+ " [3.0, 4.0) 0 0 \n",
+ "3 [0.0, 1.0) 0 0 \n",
+ " [1.0, 2.0) 1 1 \n",
+ " [2.0, 3.0) 1 1 \n",
+ " [3.0, 4.0) 1 1 \n",
+ "4 [0.0, 1.0) 1 0 \n",
+ " [1.0, 2.0) 1 0 \n",
+ " [2.0, 3.0) 0 0 \n",
+ " [3.0, 4.0) 0 0 \n",
"\n",
- " HR_mean>=60.333333333333336 HR_mean>=68.80000000000001 \\\n",
- "ID t_range \n",
- "1 [0.0, 1.0) 1 1 \n",
- " [1.0, 2.0) 1 1 \n",
- " [2.0, 3.0) 1 1 \n",
- " [3.0, 4.0) 1 1 \n",
- "2 [0.0, 1.0) 0 0 \n",
- " [1.0, 2.0) 1 0 \n",
- " [2.0, 3.0) 1 1 \n",
- " [3.0, 4.0) 1 1 \n",
- "3 [0.0, 1.0) 0 0 \n",
- " [1.0, 2.0) 1 1 \n",
- " [2.0, 3.0) 1 1 \n",
- " [3.0, 4.0) 1 1 \n",
- "4 [0.0, 1.0) 1 1 \n",
- " [1.0, 2.0) 1 1 \n",
- " [2.0, 3.0) 1 0 \n",
- " [3.0, 4.0) 1 1 \n",
+ " HR_mean>60.333333333333336 HR_mean>68.80000000000001 \\\n",
+ "ID t_range \n",
+ "1 [0.0, 1.0) 1 1 \n",
+ " [1.0, 2.0) 1 1 \n",
+ " [2.0, 3.0) 1 1 \n",
+ " [3.0, 4.0) 1 1 \n",
+ "2 [0.0, 1.0) 0 0 \n",
+ " [1.0, 2.0) 1 0 \n",
+ " [2.0, 3.0) 1 1 \n",
+ " [3.0, 4.0) 1 1 \n",
+ "3 [0.0, 1.0) 0 0 \n",
+ " [1.0, 2.0) 1 1 \n",
+ " [2.0, 3.0) 1 1 \n",
+ " [3.0, 4.0) 1 1 \n",
+ "4 [0.0, 1.0) 1 1 \n",
+ " [1.0, 2.0) 1 1 \n",
+ " [2.0, 3.0) 1 0 \n",
+ " [3.0, 4.0) 1 1 \n",
"\n",
- " HR_mean>=73.6 HR_mean>=75.2 HR_mean>=82.00000000000001 \n",
- "ID t_range \n",
- "1 [0.0, 1.0) 0 0 0 \n",
- " [1.0, 2.0) 0 0 0 \n",
- " [2.0, 3.0) 1 0 0 \n",
- " [3.0, 4.0) 1 0 0 \n",
- "2 [0.0, 1.0) 0 0 0 \n",
- " [1.0, 2.0) 0 0 0 \n",
- " [2.0, 3.0) 1 1 0 \n",
- " [3.0, 4.0) 1 0 0 \n",
- "3 [0.0, 1.0) 0 0 0 \n",
- " [1.0, 2.0) 1 1 1 \n",
- " [2.0, 3.0) 1 1 1 \n",
- " [3.0, 4.0) 1 1 1 \n",
- "4 [0.0, 1.0) 1 1 0 \n",
- " [1.0, 2.0) 1 1 0 \n",
- " [2.0, 3.0) 0 0 0 \n",
- " [3.0, 4.0) 0 0 0 \n",
+ " HR_mean>73.6 HR_mean>75.2 HR_mean>82.00000000000001 \n",
+ "ID t_range \n",
+ "1 [0.0, 1.0) 0 0 0 \n",
+ " [1.0, 2.0) 0 0 0 \n",
+ " [2.0, 3.0) 1 0 0 \n",
+ " [3.0, 4.0) 1 0 0 \n",
+ "2 [0.0, 1.0) 0 0 0 \n",
+ " [1.0, 2.0) 0 0 0 \n",
+ " [2.0, 3.0) 1 1 0 \n",
+ " [3.0, 4.0) 1 0 0 \n",
+ "3 [0.0, 1.0) 0 0 0 \n",
+ " [1.0, 2.0) 1 1 1 \n",
+ " [2.0, 3.0) 1 1 1 \n",
+ " [3.0, 4.0) 1 1 1 \n",
+ "4 [0.0, 1.0) 1 1 0 \n",
+ " [1.0, 2.0) 1 1 0 \n",
+ " [2.0, 3.0) 0 0 0 \n",
+ " [3.0, 4.0) 0 0 0 \n",
"\n",
"[16 rows x 29 columns]"
]
@@ -3382,7 +3381,7 @@
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
- "version": "3.8.6"
+ "version": "3.8.5"
}
},
"nbformat": 4,