From c517944ab8835abc8ed19b98f7acb296d1f38912 Mon Sep 17 00:00:00 2001
From: Hongyu Ren <hyren@cs.stanford.edu>
Date: Sun, 14 Nov 2021 00:16:59 +0000
Subject: [PATCH 1/5] make evaluation step consistent between 1p and multihop

---
 smore/training/train_process.py | 24 ++++++++----------------
 1 file changed, 8 insertions(+), 16 deletions(-)

diff --git a/smore/training/train_process.py b/smore/training/train_process.py
index 05b0810..9f83deb 100644
--- a/smore/training/train_process.py
+++ b/smore/training/train_process.py
@@ -98,7 +98,7 @@ def test_step_mp(model, args, train_sampler, test_dataloader, result_buffer, tra
     rank = dist.get_rank()
     step = 0
     total_steps = len(test_dataloader)
-    logs = collections.defaultdict(list)
+    logs = collections.defaultdict(collections.Counter)
     all_embed = None
     negative_sample_bias = None
 
@@ -153,27 +153,19 @@ def test_step_mp(model, args, train_sampler, test_dataloader, result_buffer, tra
                     h10 = torch.mean((cur_ranking <= 10).to(torch.float)).item()
                     h1m = ((cur_ranking[0] == 1).to(torch.float)).item()
 
-                logs[query_structure].append({
-                    'MRR': mrr,
-                    'HITS1': h1,
-                    'HITS3': h3,
-                    'HITS10': h10,
-                    'HITS1max': h1m,
-                    'num_hard_answer': num_hard,
-                })
+                logs[query_structure]['MRR'] += mrr
+                logs[query_structure]['HITS1'] += h1
+                logs[query_structure]['HITS3'] += h3
+                logs[query_structure]['HITS10'] += h10
+                logs[query_structure]['HITS1max'] += h1m
+                logs[query_structure]['num_hard_answer'] += 1
+                logs[query_structure]['num_queries'] += 1
 
             if step % args.test_log_steps == 0:
                 logging.info('Evaluating the model... (%d/%d)' % (step, total_steps))
 
             step += 1
 
-    # metrics = collections.defaultdict(lambda: collections.defaultdict(int))
-    # for query_structure in logs:
-    #     for metric in logs[query_structure][0].keys():
-    #         if metric in ['num_hard_answer']:
-    #             continue
-    #         metrics[query_structure][metric] = sum([log[metric] for log in logs[query_structure]])/len(logs[query_structure])
-    #     metrics[query_structure]['num_queries'] = len(logs[query_structure])
     result_buffer.put((logs, train_step))
 
 

From c1141da1d48ed8d6805bfb98c4a4a71955197fa6 Mon Sep 17 00:00:00 2001
From: Hongyu Ren <hyren@cs.stanford.edu>
Date: Mon, 15 Nov 2021 06:57:04 +0000
Subject: [PATCH 2/5] fix featurized bug

---
 smore/models/kg_reasoning.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/smore/models/kg_reasoning.py b/smore/models/kg_reasoning.py
index 82068f9..1c3cbbc 100644
--- a/smore/models/kg_reasoning.py
+++ b/smore/models/kg_reasoning.py
@@ -89,7 +89,7 @@ def attach_feature(self, name, feat, gpu_id, is_sparse):
         else:
             device = 'cuda:{}'.format(gpu_id)
         if is_sparse:
-            feat_read = EmbeddingReadOnly(feat, gpu_id=gpu_id, target_dtype=torch.float32)
+            feat_read = EmbeddingReadOnly(feat, gpu_id=gpu_id, target_dtype=feat.dtype)
             setattr(self, "%s_feat" % name, feat_read)
         else:
             setattr(self, "%s_feat" % name, feat.to(device))

From fdcd9ae62ca0e464c46b4e7542e56b2c2beabcc6 Mon Sep 17 00:00:00 2001
From: hyren <2950128563@qq.com>
Date: Mon, 14 Feb 2022 00:39:03 -0800
Subject: [PATCH 3/5] remove target dtype

---
 smore/common/embedding/embed_rw.py | 17 +++--------------
 smore/models/kg_reasoning.py       |  2 +-
 2 files changed, 4 insertions(+), 15 deletions(-)

diff --git a/smore/common/embedding/embed_rw.py b/smore/common/embedding/embed_rw.py
index 9698220..2084828 100644
--- a/smore/common/embedding/embed_rw.py
+++ b/smore/common/embedding/embed_rw.py
@@ -29,19 +29,11 @@ def sync(self):
 
 
 class EmbeddingReadOnly(object):
-    def __init__(self, embed, gpu_id=-1, target_dtype=None):
+    def __init__(self, embed, gpu_id=-1):
         super(EmbeddingReadOnly, self).__init__()
         self.embed = embed.data
         self.gpu_id = gpu_id
         self.embed_dim = embed.shape[1]
-        if target_dtype is None:
-            self.target_dtype = embed.dtype
-        else:
-            self.target_dtype = target_dtype
-        if target_dtype != embed.dtype:
-            self.type_cast = lambda x: x.type(self.target_dtype)
-        else:
-            self.type_cast = lambda x: x
         if gpu_id == -1:
             self.device = 'cpu'
         else:
@@ -74,15 +66,13 @@ def read(self, indices, name=None):
             t = self.embed.to(self.device)
             t.job_handle = self.dummy_job
             return t
-        if indices.numel() == self.embed.shape[0] and self.embed.is_cuda:  # TODO: make it more explicit
-            return self.embed
         if not self.embed.is_cuda:
             if name is not None and indices.numel() != self.embed.shape[0]:  # TODO: make it more explicit
                 return self.async_read(indices, name)
             for key in self.last_write_jobs:
                 self.last_write_jobs[key].sync()
         indices = indices.view(-1)
-        submat = self.type_cast(self.embed[indices].to(self.device))
+        submat = self.embed[indices].to(self.device)
         submat.job_handle = self.dummy_job
         return submat
 
@@ -97,7 +87,7 @@ def async_read(self, indices, name):
                                            self.embed,
                                            buf,
                                            out)
-            submat = self.type_cast(out[:indices.shape[0]])
+            submat = out[:indices.shape[0]]
             submat.job_handle = job_handle
         return submat
 
@@ -106,7 +96,6 @@ class EmbeddingRW(EmbeddingReadOnly):
     def __init__(self, embed, gpu_id=-1):
         super(EmbeddingRW, self).__init__(embed, gpu_id)
         self.write_thread_pool = self.read_thread_pool
-        assert self.target_dtype == self.embed.dtype 
         self.write_buf = {}        
         self.write_src_cache = {}
 
diff --git a/smore/models/kg_reasoning.py b/smore/models/kg_reasoning.py
index 1c3cbbc..4bc78c8 100644
--- a/smore/models/kg_reasoning.py
+++ b/smore/models/kg_reasoning.py
@@ -89,7 +89,7 @@ def attach_feature(self, name, feat, gpu_id, is_sparse):
         else:
             device = 'cuda:{}'.format(gpu_id)
         if is_sparse:
-            feat_read = EmbeddingReadOnly(feat, gpu_id=gpu_id, target_dtype=feat.dtype)
+            feat_read = EmbeddingReadOnly(feat, gpu_id=gpu_id)
             setattr(self, "%s_feat" % name, feat_read)
         else:
             setattr(self, "%s_feat" % name, feat.to(device))

From f7c5619c6c34c9ca80eb0f8ba2eb55df1d63b12c Mon Sep 17 00:00:00 2001
From: hyren <2950128563@qq.com>
Date: Mon, 14 Feb 2022 01:00:36 -0800
Subject: [PATCH 4/5] add automatic dataset downloading

---
 smore/common/util.py         | 76 +++++++++++++++++++++++++++++++++++-
 smore/training/main_train.py |  4 +-
 2 files changed, 77 insertions(+), 3 deletions(-)

diff --git a/smore/common/util.py b/smore/common/util.py
index 36d24a2..a385047 100755
--- a/smore/common/util.py
+++ b/smore/common/util.py
@@ -24,10 +24,15 @@
 from _thread import start_new_thread
 import traceback
 import logging
-import pdb
-
+import os
+from tqdm import tqdm
+import shutil
+import zipfile
+import urllib.request as ur
 from smore.common.config import name_query_dict, query_name_dict
 
+GBFACTOR = float(1 << 30)
+
 def cal_ent_loc(query_structure, idx):
     if query_structure[0] == '<':
         return cal_ent_loc(query_structure[1], idx)
@@ -236,6 +241,73 @@ def sample_negative_bidirectional(query, ent_in, ent_out, nent):
     pass
 
 
+def download_url(url, folder, log=True):
+    r"""Downloads the content of an URL to a specific folder.
+    Args:
+        url (string): The url.
+        folder (string): The folder.
+        log (bool, optional): If :obj:`False`, will not print anything to the
+            console. (default: :obj:`True`)
+    """
+
+    filename = url.rpartition('/')[2]
+    path = osp.join(folder, filename)
+
+    if osp.exists(path) and osp.getsize(path) > 0:  # pragma: no cover
+        if log:
+            print('Using exist file', filename)
+        return path
+
+    if log:
+        print('Downloading', url)
+
+    if not osp.exists(folder):
+        os.makedirs(folder)
+    data = ur.urlopen(url)
+
+    size = int(data.info()["Content-Length"])
+
+    chunk_size = 1024*1024
+    num_iter = int(size/chunk_size) + 2
+
+    downloaded_size = 0
+
+    try:
+        with open(path, 'wb') as f:
+            pbar = tqdm(range(num_iter))
+            for i in pbar:
+                chunk = data.read(chunk_size)
+                downloaded_size += len(chunk)
+                pbar.set_description("Downloaded {:.2f} GB".format(float(downloaded_size)/GBFACTOR))
+                f.write(chunk)
+    except:
+        if osp.exists(path):
+             os.remove(path)
+        raise RuntimeError('Stopped downloading due to interruption.')
+
+
+    return path
+
+def maybe_download_dataset(data_path):
+    data_name = data_path.split('/')[-1]
+    if data_name in ['FB15k', 'FB15k-237', 'NELL', "FB400k"]:
+        if not (osp.exists(data_path) and osp.exists(osp.join(data_path, "stats.txt"))):
+            url = "https://snap.stanford.edu/betae/%s.zip" % data_name
+            path = download_url(url, osp.split(osp.abspath(data_path))[0])
+            extract_zip(path, osp.split(osp.abspath(data_path))[0])
+            os.unlink(path)
+
+def extract_zip(path, folder):
+    r"""Extracts a zip archive to a specific folder.
+    Args:
+        path (string): The path to the tar archive.
+        folder (string): The folder.
+    """
+    print('Extracting', path)
+    with zipfile.ZipFile(path, 'r') as f:
+        f.extractall(folder)
+
+
 def thread_wrapped_func(func):
     """Wrapped func for torch.multiprocessing.Process.
 
diff --git a/smore/training/main_train.py b/smore/training/main_train.py
index 2eea6c2..c77c77c 100644
--- a/smore/training/main_train.py
+++ b/smore/training/main_train.py
@@ -33,7 +33,7 @@
 import math
 
 from smore.models import build_model
-from smore.common.util import flatten_query, list2tuple, parse_time, set_global_seed, eval_tuple, construct_graph, tuple2filterlist
+from smore.common.util import flatten_query, list2tuple, parse_time, set_global_seed, eval_tuple, construct_graph, tuple2filterlist, maybe_download_dataset
 from smore.common.config import parse_args, all_tasks, query_name_dict, name_query_dict
 from smore.common.embedding.embed_optimizer import get_optim_class
 from smore.cpp_sampler.sampler_clib import KGMem
@@ -305,6 +305,8 @@ def main(parser):
     set_global_seed(args.seed)
     gpus = [int(i) for i in args.gpus.split(".")]
     assert args.gpus == '.'.join([str(i) for i in range(len(gpus))]), 'only support continuous gpu ids starting from 0, please set CUDA_VISIBLE_DEVICES instead'
+    
+    maybe_download_dataset(args.data_path)
 
     setup_train_mode(args)
     

From be4d1a674351178707cf7210165c915c56acab43 Mon Sep 17 00:00:00 2001
From: hyren <2950128563@qq.com>
Date: Mon, 14 Feb 2022 01:14:58 -0800
Subject: [PATCH 5/5] update box/beta/vec scripts for the three small datset

---
 smore/training/beta_scripts/train_15k.sh  |  7 ++++---
 smore/training/beta_scripts/train_237.sh  |  9 +++++----
 smore/training/beta_scripts/train_nell.sh |  5 +++--
 smore/training/box_scripts/train_15k.sh   |  3 ++-
 smore/training/box_scripts/train_237.sh   |  9 +++++----
 smore/training/box_scripts/train_nell.sh  |  3 ++-
 smore/training/vec_scripts/train_15k.sh   |  5 +++--
 smore/training/vec_scripts/train_237.sh   | 11 ++++++-----
 smore/training/vec_scripts/train_nell.sh  |  7 ++++---
 9 files changed, 34 insertions(+), 25 deletions(-)

diff --git a/smore/training/beta_scripts/train_15k.sh b/smore/training/beta_scripts/train_15k.sh
index 1102035..940862d 100755
--- a/smore/training/beta_scripts/train_15k.sh
+++ b/smore/training/beta_scripts/train_15k.sh
@@ -21,19 +21,20 @@ eval_path=$data_folder/eval-betae
 export CUDA_VISIBLE_DEVICES=0,1,2,3
 
 #beta
-python ../main_train.py --do_test --gpus '0.1.2.3' \
+python ../main_train.py --do_train --do_test --gpus '0.1.2.3' \
  --data_path $data_folder --eval_path $eval_path \
  -n 1024 -b 512 -d 400 -g 60 \
  -a 0.5 -adv \
  -lr 0.0001 --max_steps 450001 --geo beta --valid_steps 15000 \
- -betam "(1600,2)" --tasks '1p.2p.3p.2i.3i.ip.pi.2u.up' --training_tasks '1p.2p.3p.2i.3i' \
+ -betam '(1600,2,fisher,0.055,layer,True)' --tasks '1p.2p.3p.2i.3i.ip.pi.2u.up' --training_tasks '1p.2p.3p.2i.3i' \
  --save_checkpoint_steps 150000 \
  --share_negative \
+ --logit_impl custom \
  --lr_schedule none \
  --sampler_type naive \
  --filter_test \
  --share_optim_stats \
- --port 29501 \
+ --port 29511 \
  --online_sample --prefix '../logs' --online_sample_mode '(500,0,w,wstruct,120)' \
  --train_online_mode '(single,3000,e,True,before)' --optim_mode '(aggr,adam,cpu,False,5)' --online_weighted_structure_prob '(20,20,20,10,10)' --print_on_screen \
  $@
diff --git a/smore/training/beta_scripts/train_237.sh b/smore/training/beta_scripts/train_237.sh
index bb58264..2b066e3 100755
--- a/smore/training/beta_scripts/train_237.sh
+++ b/smore/training/beta_scripts/train_237.sh
@@ -14,9 +14,9 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-data_name=FB15k-237-betae
+data_name=FB15k-237
 data_folder=$HOME/data/knowledge_graphs/$data_name
-eval_path=$data_folder/eval-original
+eval_path=$data_folder/eval-betae
 
 export CUDA_VISIBLE_DEVICES=0,1,2,3
 
@@ -26,14 +26,15 @@ python ../main_train.py --do_train --do_test --gpus '0.1.2.3' \
  -n 1024 -b 512 -d 400 -g 60 \
  -a 0.5 -adv \
  -lr 0.0001 --max_steps 450001 --geo beta --valid_steps 15000 \
- -betam "(1600,2)" --tasks '1p.2p.3p.2i.3i.ip.pi.2u.up' --training_tasks '1p.2p.3p.2i.3i' \
+ -betam '(1600,2,fisher,0.055,layer,True)' --tasks '1p.2p.3p.2i.3i.ip.pi.2u.up' --training_tasks '1p.2p.3p.2i.3i' \
  --save_checkpoint_steps 150000 \
  --share_negative \
  --lr_schedule none \
+ --logit_impl custom \
  --sampler_type naive \
  --filter_test \
  --share_optim_stats \
- --port 29500 \
+ --port 29510 \
  --online_sample --prefix '../logs' --online_sample_mode '(500,0,w,wstruct,120)' \
  --train_online_mode '(single,3000,e,True,before)' --optim_mode '(aggr,adam,cpu,False,5)' --online_weighted_structure_prob '(20,20,20,10,10)' --print_on_screen \
  $@
diff --git a/smore/training/beta_scripts/train_nell.sh b/smore/training/beta_scripts/train_nell.sh
index ec03505..d7ac05e 100755
--- a/smore/training/beta_scripts/train_nell.sh
+++ b/smore/training/beta_scripts/train_nell.sh
@@ -26,14 +26,15 @@ python ../main_train.py --do_train --do_test --gpus '0.1.2.3' \
  -n 1024 -b 512 -d 400 -g 60 \
  -a 0.5 -adv \
  -lr 0.0001 --max_steps 450001 --geo beta --valid_steps 15000 \
- -betam "(1600,2)" --tasks '1p.2p.3p.2i.3i.ip.pi.2u.up' --training_tasks '1p.2p.3p.2i.3i' \
+ -betam '(1600,2,fisher,0.055,layer,True)' --tasks '1p.2p.3p.2i.3i.ip.pi.2u.up' --training_tasks '1p.2p.3p.2i.3i' \
  --save_checkpoint_steps 150000 \
  --share_negative \
  --lr_schedule none \
+ --logit_impl custom \
  --sampler_type naive \
  --filter_test \
  --share_optim_stats \
- --port 29500 \
+ --port 29512 \
  --online_sample --prefix '../logs' --online_sample_mode '(500,0,w,wstruct,120)' \
  --train_online_mode '(single,3000,e,True,before)' --optim_mode '(aggr,adam,cpu,False,5)' --online_weighted_structure_prob '(20,20,20,10,10)' --print_on_screen \
  $@
diff --git a/smore/training/box_scripts/train_15k.sh b/smore/training/box_scripts/train_15k.sh
index f0e3752..dc0c62a 100755
--- a/smore/training/box_scripts/train_15k.sh
+++ b/smore/training/box_scripts/train_15k.sh
@@ -24,10 +24,11 @@ export CUDA_VISIBLE_DEVICES=0,1,2,3
 python ../main_train.py --do_train --do_test --gpus '0.1.2.3' \
  --data_path $data_folder --eval_path $eval_path \
  -n 1024 -b 512 -d 400 -g 24 \
- -lr 0.0001 --max_steps 1000001 --geo box --valid_steps 20000 \
+ -lr 0.0001 --max_steps 1500001 --geo box --valid_steps 20000 \
  -boxm '(none,0.02)' --tasks '1p.2p.3p.2i.3i.ip.pi.2u.up' --training_tasks '1p.2p.3p.2i.3i' \
  --save_checkpoint_steps 50000 \
  --sampler_type naive \
+ --logit_impl custom \
  --lr_schedule none \
  --port 29500 \
  --share_negative \
diff --git a/smore/training/box_scripts/train_237.sh b/smore/training/box_scripts/train_237.sh
index c960c77..55bb5ce 100755
--- a/smore/training/box_scripts/train_237.sh
+++ b/smore/training/box_scripts/train_237.sh
@@ -14,23 +14,24 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-data_name=FB15k-237-betae
+data_name=FB15k-237
 data_folder=$HOME/data/knowledge_graphs/$data_name
-eval_path=$data_folder/eval-original
+eval_path=$data_folder/eval-betae
 
 export CUDA_VISIBLE_DEVICES=0,1,2,3
 
 #box
-python ../main_train.py --do_test --gpus '0.1.2.3' \
+python ../main_train.py --do_train --do_test --gpus '0.1.2.3' \
  --data_path $data_folder --eval_path $eval_path \
  -n 1024 -b 512 -d 400 -g 24 \
  -lr 0.0001 --max_steps 450001 --geo box --valid_steps 15000 \
  -boxm '(none,0.02)' --tasks '1p.2p.3p.2i.3i.ip.pi.2u.up' --training_tasks '1p.2p.3p.2i.3i' \
  --save_checkpoint_steps 30000 \
+ --logit_impl custom \
  --share_negative \
  --filter_test \
  --share_optim_stats \
- --port 29500 \
+ --port 29502 \
  --online_sample --prefix '../logs' --online_sample_mode '(500,0,w,wstruct,120)' \
  --train_online_mode '(single,3000,e,True,before)' --optim_mode '(aggr,adam,cpu,False,5)' --online_weighted_structure_prob '(2,2,2,1,1)' --print_on_screen \
  $@
diff --git a/smore/training/box_scripts/train_nell.sh b/smore/training/box_scripts/train_nell.sh
index 81f8fc8..ba00618 100755
--- a/smore/training/box_scripts/train_nell.sh
+++ b/smore/training/box_scripts/train_nell.sh
@@ -24,10 +24,11 @@ export CUDA_VISIBLE_DEVICES=4,5,6,7
 python ../main_train.py --do_train --do_test --gpus '0.1.2.3' \
  --data_path $data_folder --eval_path $eval_path \
  -n 1024 -b 512 -d 400 -g 24 \
- -lr 0.0001 --max_steps 450001 --geo box --valid_steps 15000 \
+ -lr 0.0001 --max_steps 600001 --geo box --valid_steps 15000 \
  -boxm '(none,0.02)' --tasks '1p.2p.3p.2i.3i.ip.pi.2u.up' --training_tasks '1p.2p.3p.2i.3i' \
  --save_checkpoint_steps 30000 \
  --sampler_type naive \
+ --logit_impl custom \
  --port 29501 \
  --share_negative \
  --filter_test \
diff --git a/smore/training/vec_scripts/train_15k.sh b/smore/training/vec_scripts/train_15k.sh
index 85ea89f..7a2a25b 100755
--- a/smore/training/vec_scripts/train_15k.sh
+++ b/smore/training/vec_scripts/train_15k.sh
@@ -24,13 +24,14 @@ export CUDA_VISIBLE_DEVICES=0,1,2,3
 python ../main_train.py --do_train --do_test --gpus '0.1.2.3' \
  --data_path $data_folder --eval_path $eval_path \
  -n 1024 -b 512 -d 800 -g 24 \
- -lr 0.0001 --max_steps 450001 --geo vec --valid_steps 15000 \
+ -lr 0.0001 --max_steps 2000001 --geo vec --valid_steps 15000 \
  --tasks '1p.2p.3p.2i.3i.ip.pi.2u.up' --training_tasks '1p.2p.3p.2i.3i' \
  --save_checkpoint_steps 30000 \
  --sampler_type naive \
+ --logit_impl custom \
  --share_negative \
  --filter_test \
- --port 29500 \
+ --port 29503 \
  --share_optim_stats \
  --online_sample --prefix '../logs' --online_sample_mode '(500,0,w,wstruct,120)' \
  --train_online_mode '(single,3000,e,True,before)' --optim_mode '(aggr,adam,cpu,False,5)' --online_weighted_structure_prob '(2,2,2,1,1)' --print_on_screen \
diff --git a/smore/training/vec_scripts/train_237.sh b/smore/training/vec_scripts/train_237.sh
index b2a09ae..2818bac 100755
--- a/smore/training/vec_scripts/train_237.sh
+++ b/smore/training/vec_scripts/train_237.sh
@@ -14,9 +14,9 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-data_name=FB15k-237-betae
+data_name=FB15k-237
 data_folder=$HOME/data/knowledge_graphs/$data_name
-eval_path=$data_folder/eval-original
+eval_path=$data_folder/eval-betae
 
 export CUDA_VISIBLE_DEVICES=0,1,2,3
 
@@ -24,14 +24,15 @@ export CUDA_VISIBLE_DEVICES=0,1,2,3
 python ../main_train.py --do_train --do_test --gpus '0.1.2.3' \
  --data_path $data_folder --eval_path $eval_path \
  -n 1024 -b 512 -d 800 -g 24 \
- -lr 0.0001 --max_steps 750001 --geo vec --valid_steps 15000 \
+ -lr 0.0001 --max_steps 1500001 --geo vec --valid_steps 15000 \
  --tasks '1p.2p.3p.2i.3i.ip.pi.2u.up' --training_tasks '1p.2p.3p.2i.3i' \
  --save_checkpoint_steps 30000 \
  --lr_schedule none \
- --sampler_type sqrt \
+ --sampler_type naive \
+ --logit_impl custom \
  --share_negative \
  --filter_test \
- --port 29500 \
+ --port 29505 \
  --share_optim_stats \
  --online_sample --prefix '../logs' --online_sample_mode '(500,0,w,wstruct,120)' \
  --train_online_mode '(single,3000,e,True,before)' --optim_mode '(aggr,adam,cpu,False,5)' --online_weighted_structure_prob '(2,2,2,1,1)' --print_on_screen \
diff --git a/smore/training/vec_scripts/train_nell.sh b/smore/training/vec_scripts/train_nell.sh
index bc50c20..f40b15d 100755
--- a/smore/training/vec_scripts/train_nell.sh
+++ b/smore/training/vec_scripts/train_nell.sh
@@ -24,14 +24,15 @@ export CUDA_VISIBLE_DEVICES=0,1,2,3
 python ../main_train.py --do_train --do_test --gpus '0.1.2.3' \
  --data_path $data_folder --eval_path $eval_path \
  -n 1024 -b 512 -d 800 -g 24 \
- -lr 0.0001 --max_steps 800001 --geo vec --valid_steps 20000 \
+ -lr 0.0001 --max_steps 2000001 --geo vec --valid_steps 20000 \
  --tasks '1p.2p.3p.2i.3i.ip.pi.2u.up' --training_tasks '1p.2p.3p.2i.3i' \
  --save_checkpoint_steps 40000 \
- --lr_schedule step \
+ --lr_schedule none \
  --sampler_type naive \
+ --logit_impl custom \
  --share_negative \
  --filter_test \
- --port 29500 \
+ --port 29504 \
  --share_optim_stats \
  --online_sample --prefix '../logs' --online_sample_mode '(500,0,w,wstruct,120)' \
  --train_online_mode '(single,3000,e,True,before)' --optim_mode '(aggr,adam,cpu,False,5)' --online_weighted_structure_prob '(2,2,2,1,1)' --print_on_screen \