PufferAI
diff --git a/build.sh b/build.sh
Lines changed: 2 additions & 2 deletions
diff --git a/constellation/cache_data.py b/constellation/cache_data.py
Lines changed: 37 additions & 25 deletions
@@ -34,6 +34,8 @@ CLANG_WARN="\
     -Wno-incompatible-pointer-types-discards-qualifiers \
     -Wno-error=array-parameter"
 
+PLATFORM="$(uname -s)"
+
 if [ -n "$DEBUG" ] || [ "$MODE" = "local" ]; then
     CLANG_OPT="-g -O0 $CLANG_WARN"
     NVCC_OPT="-O0 -g"
@@ -48,8 +50,6 @@ fi
 # ============================================================================
 # Platform + dependencies
 # ============================================================================
-
-PLATFORM="$(uname -s)"
 if [ -d "ocean/$ENV" ]; then
     SRC_DIR="ocean/$ENV"
 elif [ -d "$ENV" ]; then
 
@@ -5,13 +5,13 @@
 import os
 
 env_names = sorted([
-    #'breakout',
+    'breakout',
     #'impulse_wars',
     #'pacman',
     #'tetris',
     #'g2048',
     #'moba',
-    #'pong',
+    'pong',
     #'tower_climb',
     #'grid',
     'nmmo3',
@@ -35,7 +35,7 @@
     'train/eps',
     'train/prio_alpha',
     'train/prio_beta0',
-    #'train/horizon',
+    'train/horizon',
     'train/replay_ratio',
     'train/minibatch_size',
     'policy/hidden_size',
@@ -101,10 +101,6 @@ def cached_load(path, env_name, cache):
         for k in list(exp['metrics'].keys()):
             if 'loss' in k:
                 del exp['metrics'][k]
-        data_len = len(exp['metrics']['agent_steps'])
-        if data_len > 100:
-            print(f'Skipping {fpath} (len={data_len})')
-            continue
 
         if num_metrics == 0:
             num_metrics = len(exp['metrics'])
@@ -114,7 +110,6 @@ def cached_load(path, env_name, cache):
         metrics = exp['metrics']
 
         if len(metrics) != num_metrics:
-            breakpoint()
             print(f'Skipping {fpath} (num_metrics={len(metrics)} != {num_metrics})')
             continue
 
@@ -132,7 +127,6 @@ def cached_load(path, env_name, cache):
                 break
 
         if skip:
-            breakpoint()
             print(f'Skipping {fpath} (bad data)')
             continue
 
@@ -151,31 +145,34 @@ def cached_load(path, env_name, cache):
 
         for hyper in HYPERS:
             prefix, suffix = hyper.split('/')
-            if prefix not in sweep_metadata:
-                continue
+            #if prefix not in sweep_metadata:
+            #    continue
 
             group = sweep_metadata[prefix]
-            if suffix not in group:
-                continue
+            #if suffix not in group:
+            #    continue
 
-            param = group[suffix]
 
             key = f'{prefix}/{suffix}_norm'
             if key not in data:
                 data[key] = []
 
-            mmin = param['min']
-            mmax = param['max']
-            dist = param['distribution']
-            val = exp[prefix][suffix]
+            if suffix in group:
+                param = group[suffix]
+                mmin = param['min']
+                mmax = param['max']
+                dist = param['distribution']
+                val = exp[prefix][suffix]
 
-            if 'log' in dist or 'pow2' in dist:
-                mmin = np.log(mmin)
-                mmax = np.log(mmax)
-                val = np.log(val)
+                if 'log' in dist or 'pow2' in dist:
+                    mmin = np.log(mmin)
+                    mmax = np.log(mmax)
+                    val = np.log(val)
 
-            norm = (val - mmin) / (mmax - mmin)
-            data[key].append([norm]*n)
+                norm = (val - mmin) / (mmax - mmin)
+                data[key].append([norm]*n)
+            else:
+                data[key].append([1]*n)
 
     for k, v in data.items():
         data[k] = [item for sublist in v for item in sublist]
@@ -255,26 +252,41 @@ def compute_tsne():
     row = 0
     for env in env_names:
         sz = len(all_data[env]['agent_steps'])
+        all_data[env]['tsne1'] = reduced[row:row+sz, 0].tolist()
+        all_data[env]['tsne2'] = reduced[row:row+sz, 1].tolist()
+
+        '''
         if reduced is not None:
             all_data[env]['tsne1'] = reduced[row:row+sz, 0].tolist()
             all_data[env]['tsne2'] = reduced[row:row+sz, 1].tolist()
         else:
             all_data[env]['tsne1'] = np.random.rand(sz).tolist()
             all_data[env]['tsne2'] = np.random.rand(sz).tolist()
+        '''
 
         row += sz
         print(f'Env {env} has {sz} points')
 
     for env in all_data:
         dat = all_data[env]
-        dat = {k: v for k, v in dat.items() if k in ALL_KEYS}
+        dat = {k: v for k, v in dat.items() if isinstance(v, list)
+                and len(v) > 0 and isinstance(v[0], (int, float))
+                and (k == 'train/max_grad_norm' or not k.endswith('_norm'))}
         all_data[env] = dat
         for k, v in dat.items():
             try:
                 print(f'{env}/{k}: {len(v), min(v), max(v)}')
             except:
                 print(f'{env}/{k}: {len(v)}')
 
+    for env in all_data:
+        for k, v in all_data[env].items():
+            if isinstance(v, list):
+                try:
+                    all_data[env][k] = ','.join([f'{x:.6g}' for x in v])
+                except:
+                    breakpoint()
+
     json.dump(all_data, open('constellation/default.json', 'w'))
 
 if __name__ == '__main__':