Commit 7784d7a (1 parent: 20bd6ad)

🎉 working sick example

File tree

11 files changed: +745 −199 lines


.gitignore

Lines changed: 3 additions & 1 deletion
@@ -1 +1,3 @@
-model/
+model/
+*.pyc
+__pycache__/

README.md

Lines changed: 26 additions & 16 deletions
@@ -25,13 +25,19 @@ Data must be in the `str` format as detailed in the example below:
 from pytree.data import prepare_input_from_constituency_tree
 
 parse_tree_example = '(TOP (S (NP (_ I)) (VP (_ saw) (NP (_ Sarah)) (PP (_ with) (NP (_ a) (_ telescope)))) (_ .)))'
-input_test, head_idx_test = prepare_input_from_constituency_tree(parse_tree_example)
+input_test, head_idx_test, head_idx_r_test, head_idx_l_test = prepare_input_from_constituency_tree(parse_tree_example)
 
 print(input_test)
 # ['[CLS]', 'I', 'saw', 'Sarah', 'with', 'a', 'telescope', '.', '[S]', '[S]', '[VP]', '[VP]', '[PP]', '[NP]']
 
 print(head_idx_test)
-# [0, 8, 10, 10, 11, 12, 12, 7, 0, 7, 8, 9, 9, 11]
+# [0, 9, 11, 11, 12, 13, 13, 8, 0, 8, 9, 10, 10, 12]
+
+print(head_idx_r_test)
+# [0, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0]
+
+print(head_idx_l_test)
+# [0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1]
 ```
 
 ### Prepare dependency tree data
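The new head indices differ from the old ones by a uniform one-position offset, apparently switching from 0-based to 1-based head positions so that 0 unambiguously marks a root, and each non-root node now carries exactly one of the right/left flags. A quick pure-Python check (the helper name `shift_heads` is ours, not part of pytree):

```python
def shift_heads(head_idx, offset=1):
    # 0 marks a root and stays 0; every other parent pointer moves by `offset`
    return [h + offset if h != 0 else 0 for h in head_idx]

old_heads = [0, 8, 10, 10, 11, 12, 12, 7, 0, 7, 8, 9, 9, 11]
new_heads = [0, 9, 11, 11, 12, 13, 13, 8, 0, 8, 9, 10, 10, 12]
print(shift_heads(old_heads) == new_heads)  # True

# Every non-root node is flagged as exactly one of right/left child:
head_idx_r = [0, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0]
head_idx_l = [0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1]
print(all(r + l == 1
          for r, l, h in zip(head_idx_r, head_idx_l, new_heads)
          if h != 0))  # True
```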
@@ -68,17 +74,19 @@ from pytree.data.glove_tokenizer import GloveTokenizer
 glove_tokenizer = GloveTokenizer(glove_file_path='./glove.6B.300d.txt', vocab_size=10000)
 input_test = glove_tokenizer.convert_tokens_to_ids(input_test)
 print(input_test)
-# [1, 1, 824, 1, 19, 9, 1, 4, 1, 1, 1, 1, 1, 1]
+# [1, 1, 824, 1, 19, 9, 1, 4]
 ```
 
 Then prepare the data:
 
 ```python
-tree_ids_test, tree_ids_test_r, tree_ids_test_l = build_tree_ids_n_ary(head_idx_test)
+from pytree.data.utils import build_tree_ids_n_ary
+
+tree_ids_test, tree_ids_test_r, tree_ids_test_l = build_tree_ids_n_ary(head_idx_test, head_idx_r_test, head_idx_l_test)
 inputs = {'input_ids': torch.tensor(input_test).unsqueeze(0),
-          'packed_tree': torch.tensor(tree_ids_test).unsqueeze(0),
-          'packed_tree_r': torch.tensor(tree_ids_test_r).unsqueeze(0),
-          'packed_tree_l': torch.tensor(tree_ids_test_l).unsqueeze(0)}
+          'tree_ids': torch.tensor(tree_ids_test).unsqueeze(0),
+          'tree_ids_r': torch.tensor(tree_ids_test_r).unsqueeze(0),
+          'tree_ids_l': torch.tensor(tree_ids_test_l).unsqueeze(0)}
 ```
 
 And apply the model:
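`build_tree_ids_n_ary` packs the head arrays into tensors the encoder consumes; the exact packing is internal to pytree, but the general idea behind such tree ids (evaluate the tree bottom-up, one whole level per batched step) can be sketched with a hypothetical helper on a toy head array:

```python
def bottom_up_levels(head_idx):
    """Group nodes into levels that can be processed in parallel, deepest first.

    head_idx[i] is the 1-based position of node i+1's head; 0 marks a root.
    Hypothetical illustration only, not pytree's actual encoding.
    """
    n = len(head_idx)
    depth = [0] * n

    def node_depth(i):  # i is 0-based
        if depth[i] == 0:
            h = head_idx[i]
            depth[i] = 1 if h == 0 else node_depth(h - 1) + 1
        return depth[i]

    for i in range(n):
        node_depth(i)
    # Deepest nodes come first: children must be computed before their heads.
    return [[i + 1 for i in range(n) if depth[i] == d]
            for d in range(max(depth), 0, -1)]

# Toy tree: node 3 is the root, nodes 1 and 2 hang off node 3, node 4 off node 1.
print(bottom_up_levels([3, 3, 0, 1]))
# [[4], [1, 2], [3]]
```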
@@ -89,17 +97,19 @@ from pytree.models import NaryConfig, NaryTree
 config = NaryConfig()
 tree_encoder = NaryTree(config)
 
-tree_encoder(inputs)
+(h, c), h_root = tree_encoder(inputs)
+print(h)
 # tensor([[[ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
-#          [ 0.0012,  0.0015, -0.0026,  ..., -0.0001,  0.0002, -0.0043],
-#          [ 0.0022,  0.0024, -0.0035,  ..., -0.0002,  0.0003, -0.0058],
+#          [ 0.0113, -0.0066,  0.0089,  ...,  0.0064,  0.0076, -0.0048],
+#          [ 0.0110, -0.0073,  0.0110,  ...,  0.0070,  0.0046, -0.0049],
 #          ...,
-#          [ 0.0028,  0.0023, -0.0035,  ..., -0.0002,  0.0003, -0.0057],
-#          [ 0.0020,  0.0016, -0.0023,  ..., -0.0001,  0.0002, -0.0036],
-#          [ 0.0019,  0.0015, -0.0024,  ..., -0.0001,  0.0002, -0.0039]]],
-#         grad_fn=<MaskedScatterBackward>)
+#          [ 0.0254, -0.0138,  0.0224,  ...,  0.0131,  0.0148, -0.0143],
+#          [ 0.0346, -0.0172,  0.0281,  ...,  0.0140,  0.0198, -0.0267],
+#          [ 0.0247, -0.0126,  0.0201,  ...,  0.0116,  0.0162, -0.0184]]],
+#         grad_fn=<SWhereBackward>)
 
-print(tree_encoder(inputs).shape)
-# tree_encoder(inputs).shape
+print(h_root.shape)
+# torch.Size([150])
 ```
 
+We also provide a full demonstration with the SICK dataset and batched processing in the [examples folder](https://github.com/AntoineSimoulin/pytree/tree/main/examples).

examples/README.md

Lines changed: 58 additions & 7 deletions
@@ -1,21 +1,72 @@
 Implementation of ([Tai et al., 2015](#tai-2015))
 
+For the Constituency TreeLSTM, you can run the following script:
 
 ```bash
-python pytree/examples/run_sick.py \
-  --glove_file_path ./glove.6B.300d.txt \
+python examples/run_sick_n_ary.py \
+  --glove_file_path glove.840B.300d.txt \
   --do_train \
   --do_eval \
+  --do_predict \
   --output_dir './model' \
   --dataset_name 'sick' \
-  --remove_unused_columns False \
-  --learning_rate 0.025 \
-  --per_device_train_batch_size 25 \
-  --num_train_epochs 20
+  --remove_unused_columns false \
+  --learning_rate 0.05 \
+  --per_device_train_batch_size 25 \
+  --num_train_epochs 10 \
+  --weight_decay 1e-4 \
+  --lr_scheduler_type constant \
+  --overwrite_cache false \
+  --overwrite_output_dir \
+  --evaluation_strategy epoch
 ```
 
+You should get the following results:
+
+```bash
+***** predict metrics *****
+  predict_samples         = 4906
+  test_loss               = 0.6236
+  test_mse                = 31.8074
+  test_pearson            = 83.2404
+  test_runtime            = 0:00:13.02
+  test_samples_per_second = 376.716
+  test_spearman           = 77.1604
+  test_steps_per_second   = 47.147
 ```
-CUDA_VISIBLE_DEVICES=2 python examples/run_sick.py --glove_file_path /data/asimouli/GLOVE/glove.6B.300d.txt --do_train --do_eval --output_dir './model' --dataset_name 'sick' --remove_unused_columns False --learning_rate 0.05 --per_device_train_batch_size 25 --num_train_epochs 15 --weight_decay 1e-4 --lr_scheduler_type constant --do_predict --overwrite_cache True --overwrite_output_dir
+
+For the Dependency TreeLSTM, you can run the following script:
+
+```bash
+python examples/run_sick_child_sum.py \
+  --glove_file_path glove.840B.300d.txt \
+  --do_train \
+  --do_eval \
+  --do_predict \
+  --output_dir './model' \
+  --dataset_name 'sick' \
+  --remove_unused_columns false \
+  --learning_rate 0.05 \
+  --per_device_train_batch_size 25 \
+  --num_train_epochs 5 \
+  --weight_decay 1e-4 \
+  --lr_scheduler_type constant \
+  --overwrite_cache true \
+  --overwrite_output_dir
+```
+
+You should get the following results:
+
+```bash
+***** predict metrics *****
+  predict_samples         = 4906
+  test_loss               = 0.5228
+  test_mse                = 26.4252
+  test_pearson            = 86.3953
+  test_runtime            = 0:00:05.74
+  test_samples_per_second = 854.158
+  test_spearman           = 80.3738
+  test_steps_per_second   = 106.9
 ```
 
 ## References
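The `test_pearson` and `test_spearman` figures above are the standard SICK relatedness metrics, correlation coefficients scaled by 100. A minimal, dependency-free sketch of the Pearson computation on toy scores (the helper name is ours):

```python
import math

def pearson(xs, ys):
    # Sample Pearson correlation between gold and predicted score lists.
    n = len(xs)
    mx, my = sum(xs) / n, sum(ys) / n
    cov = sum((x - mx) * (y - my) for x, y in zip(xs, ys))
    sx = math.sqrt(sum((x - mx) ** 2 for x in xs))
    sy = math.sqrt(sum((y - my) ** 2 for y in ys))
    return cov / (sx * sy)

gold = [1.0, 2.0, 3.0, 4.0, 5.0]   # toy relatedness labels
pred = [1.2, 1.9, 3.4, 3.8, 5.1]   # toy model outputs
print(100 * pearson(gold, pred))   # close to 100 for near-perfect predictions
```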
