Minh Q. Le committed on
Commit
b63a495
·
1 Parent(s): 9250417
Files changed (34) hide show
  1. Model/COSMIC/feature_extraction/comet/config/atomic/changes.json +16 -0
  2. Model/COSMIC/feature_extraction/comet/config/atomic/config_0.json +79 -0
  3. Model/COSMIC/feature_extraction/comet/config/atomic/default.json +16 -0
  4. Model/COSMIC/feature_extraction/comet/config/atomic/eval_changes.json +25 -0
  5. Model/COSMIC/feature_extraction/comet/config/conceptnet/changes.json +16 -0
  6. Model/COSMIC/feature_extraction/comet/config/conceptnet/config_0.json +61 -0
  7. Model/COSMIC/feature_extraction/comet/config/conceptnet/default.json +23 -0
  8. Model/COSMIC/feature_extraction/comet/config/conceptnet/eval_changes.json +17 -0
  9. Model/COSMIC/feature_extraction/comet/config/default.json +54 -0
  10. Model/COSMIC/feature_extraction/comet/data/atomic/README.md +33 -0
  11. Model/COSMIC/feature_extraction/comet/data/atomic/sap2019atomic.pdf +0 -0
  12. Model/COSMIC/feature_extraction/comet/model/encoder_bpe_40000.json +0 -0
  13. Model/COSMIC/feature_extraction/comet/model/params_0.npy +3 -0
  14. Model/COSMIC/feature_extraction/comet/model/params_1.npy +3 -0
  15. Model/COSMIC/feature_extraction/comet/model/params_2.npy +3 -0
  16. Model/COSMIC/feature_extraction/comet/model/params_3.npy +3 -0
  17. Model/COSMIC/feature_extraction/comet/model/params_4.npy +3 -0
  18. Model/COSMIC/feature_extraction/comet/model/params_5.npy +3 -0
  19. Model/COSMIC/feature_extraction/comet/model/params_6.npy +3 -0
  20. Model/COSMIC/feature_extraction/comet/model/params_7.npy +3 -0
  21. Model/COSMIC/feature_extraction/comet/model/params_8.npy +3 -0
  22. Model/COSMIC/feature_extraction/comet/model/params_9.npy +3 -0
  23. Model/COSMIC/feature_extraction/comet/model/params_shapes.json +1 -0
  24. Model/COSMIC/feature_extraction/comet/model/vocab_40000.bpe +0 -0
  25. Model/COSMIC/feature_extraction/epik-bin/input0/dict.txt +0 -0
  26. Model/COSMIC/feature_extraction/epik-bin/input0/train.bin +3 -0
  27. Model/COSMIC/feature_extraction/epik-bin/input0/train.idx +0 -0
  28. Model/COSMIC/feature_extraction/epik-bin/input0/valid.bin +3 -0
  29. Model/COSMIC/feature_extraction/epik-bin/input0/valid.idx +0 -0
  30. Model/COSMIC/feature_extraction/epik-bin/label/dict.txt +20 -0
  31. Model/COSMIC/feature_extraction/epik-bin/label/train.bin +3 -0
  32. Model/COSMIC/feature_extraction/epik-bin/label/train.idx +0 -0
  33. Model/COSMIC/feature_extraction/epik-bin/label/valid.bin +3 -0
  34. Model/COSMIC/feature_extraction/epik-bin/label/valid.idx +0 -0
Model/COSMIC/feature_extraction/comet/config/atomic/changes.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "base": {
3
+ "0": {
4
+ "gpu_index": 0
5
+ },
6
+ "1": {
7
+ "gpu_index": 1
8
+ },
9
+ "2": {
10
+ "gpu_index": 2
11
+ },
12
+ "3": {
13
+ "gpu_index": 3
14
+ }
15
+ }
16
+ }
Model/COSMIC/feature_extraction/comet/config/atomic/config_0.json ADDED
@@ -0,0 +1,79 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "gpu_mode": "T",
3
+ "gpu_index": 0,
4
+ "gpu_indices": [
5
+ 0,
6
+ 1
7
+ ],
8
+ "multigpu": "F",
9
+ "topk_size": 10,
10
+ "beam_size": 1,
11
+ "gen_seqlength": 40,
12
+ "eval_sampler": "greedy",
13
+ "num_sequences": 1,
14
+ "generate_sequences": "full",
15
+ "evaluate_sequences": "full",
16
+ "random_seed": 123,
17
+ "optimizer": "adam",
18
+ "batch_size": 64,
19
+ "learning_rate": 6.25e-05,
20
+ "clip": 1,
21
+ "loss": "nll",
22
+ "weight_decay": 0,
23
+ "adam": {
24
+ "b2": 0.999,
25
+ "b1": 0.9,
26
+ "e": 1e-08
27
+ },
28
+ "model": "transformer",
29
+ "pretrain": "gpt",
30
+ "hidden_dim": 768,
31
+ "num_layers": 12,
32
+ "num_heads": 12,
33
+ "embedding_dropout": 0.1,
34
+ "attention_dropout": 0.1,
35
+ "residual_dropout": 0.1,
36
+ "output_dropout": 0.1,
37
+ "activation": "gelu",
38
+ "init": "pt",
39
+ "trainer": "iteration",
40
+ "iterations": 50000,
41
+ "cycle": 500,
42
+ "save_strategy": "best",
43
+ "epochs": 20,
44
+ "toy": "F",
45
+ "do_gen": "F",
46
+ "save": "T",
47
+ "test_save": "F",
48
+ "dataset": "atomic",
49
+ "categories": [
50
+ "oReact",
51
+ "oEffect",
52
+ "oWant",
53
+ "xAttr",
54
+ "xEffect",
55
+ "xIntent",
56
+ "xNeed",
57
+ "xReact",
58
+ "xWant"
59
+ ],
60
+ "eval_categories": [
61
+ "oReact",
62
+ "oEffect",
63
+ "oWant",
64
+ "xAttr",
65
+ "xEffect",
66
+ "xIntent",
67
+ "xNeed",
68
+ "xReact",
69
+ "xWant"
70
+ ],
71
+ "exp": "generation",
72
+ "labels": "individual",
73
+ "encoder_path": "model/encoder_bpe_40000.json",
74
+ "bpe_path": "model/vocab_40000.bpe",
75
+ "learning_rate_schedule": "warmup_linear",
76
+ "learning_rate_warmup": 0.002,
77
+ "l2": 0.01,
78
+ "vector_l2": "T"
79
+ }
Model/COSMIC/feature_extraction/comet/config/atomic/default.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+
3
+ "dataset": "atomic",
4
+ "categories": ["oReact", "oEffect", "oWant", "xAttr", "xEffect", "xIntent", "xNeed", "xReact", "xWant"],
5
+ "eval_categories": ["oReact", "oEffect", "oWant", "xAttr", "xEffect", "xIntent", "xNeed", "xReact", "xWant"],
6
+ "exp": "generation",
7
+ "labels": "individual",
8
+ "encoder_path": "model/encoder_bpe_40000.json",
9
+ "bpe_path": "model/vocab_40000.bpe",
10
+ "batch_size": 64,
11
+ "learning_rate_schedule": "warmup_linear",
12
+ "learning_rate_warmup": 0.002,
13
+ "l2": 0.01,
14
+ "vector_l2": "T",
15
+ "evaluate_sequences": 10000
16
+ }
Model/COSMIC/feature_extraction/comet/config/atomic/eval_changes.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+
3
+ "base": {
4
+ "0": {
5
+ "gpu_index": 0,
6
+ "generate_sequences": "full",
7
+ "evaluate_sequences": "full"
8
+ },
9
+ "1": {
10
+ "gpu_index": 1,
11
+ "generate_sequences": "full",
12
+ "evaluate_sequences": "full"
13
+ },
14
+ "2": {
15
+ "gpu_index": 2,
16
+ "generate_sequences": "full",
17
+ "evaluate_sequences": "full"
18
+ },
19
+ "3": {
20
+ "gpu_index": 3,
21
+ "generate_sequences": "full",
22
+ "evaluate_sequences": "full"
23
+ }
24
+ }
25
+ }
Model/COSMIC/feature_extraction/comet/config/conceptnet/changes.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "base": {
3
+ "0": {
4
+ "gpu_index": 0
5
+ },
6
+ "1": {
7
+ "gpu_index": 1
8
+ },
9
+ "2": {
10
+ "gpu_index": 2
11
+ },
12
+ "3": {
13
+ "gpu_index": 3
14
+ }
15
+ }
16
+ }
Model/COSMIC/feature_extraction/comet/config/conceptnet/config_0.json ADDED
@@ -0,0 +1,61 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "gpu_mode": "T",
3
+ "gpu_index": 0,
4
+ "gpu_indices": [
5
+ 0,
6
+ 1
7
+ ],
8
+ "multigpu": "F",
9
+ "topk_size": 10,
10
+ "beam_size": 1,
11
+ "gen_seqlength": 40,
12
+ "eval_sampler": "greedy",
13
+ "num_sequences": 1,
14
+ "generate_sequences": "full",
15
+ "evaluate_sequences": "full",
16
+ "random_seed": 123,
17
+ "optimizer": "adam",
18
+ "batch_size": 64,
19
+ "learning_rate": 1e-05,
20
+ "clip": 1,
21
+ "loss": "nll",
22
+ "weight_decay": 0,
23
+ "adam": {
24
+ "b2": 0.999,
25
+ "b1": 0.9,
26
+ "e": 1e-08
27
+ },
28
+ "model": "transformer",
29
+ "pretrain": "gpt",
30
+ "hidden_dim": 768,
31
+ "num_layers": 12,
32
+ "num_heads": 12,
33
+ "embedding_dropout": 0.1,
34
+ "attention_dropout": 0.1,
35
+ "residual_dropout": 0.1,
36
+ "output_dropout": 0.1,
37
+ "activation": "gelu",
38
+ "init": "pt",
39
+ "trainer": "iteration",
40
+ "iterations": 100000,
41
+ "cycle": 500,
42
+ "save_strategy": "best",
43
+ "epochs": 20,
44
+ "toy": "F",
45
+ "do_gen": "T",
46
+ "save": "T",
47
+ "test_save": "F",
48
+ "dataset": "conceptnet",
49
+ "exp": "generation",
50
+ "encoder_path": "model/encoder_bpe_40000.json",
51
+ "bpe_path": "model/vocab_40000.bpe",
52
+ "learning_rate_schedule": "warmup_linear",
53
+ "learning_rate_warmup": 0.002,
54
+ "l2": 0.01,
55
+ "vector_l2": "T",
56
+ "relation_format": "language",
57
+ "training_set_size": 100,
58
+ "development_set_versions_to_use": "12",
59
+ "max_event_1_size": 10,
60
+ "max_event_2_size": 15
61
+ }
Model/COSMIC/feature_extraction/comet/config/conceptnet/default.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+
3
+ "dataset": "conceptnet",
4
+ "exp": "generation",
5
+ "do_gen": "T",
6
+ "encoder_path": "model/encoder_bpe_40000.json",
7
+ "bpe_path": "model/vocab_40000.bpe",
8
+ "batch_size": 64,
9
+ "learning_rate_schedule": "warmup_linear",
10
+ "learning_rate_warmup": 0.002,
11
+ "l2": 0.01,
12
+ "vector_l2": "T",
13
+ "generate_sequences": "full",
14
+ "evaluate_sequences": "full",
15
+ "relation_format": "language",
16
+ "training_set_size": 100,
17
+ "development_set_versions_to_use": "12",
18
+ "max_event_1_size": 10,
19
+ "max_event_2_size": 15,
20
+ "eval_sampler": "greedy",
21
+ "iterations": 100000,
22
+ "learning_rate": 1e-5
23
+ }
Model/COSMIC/feature_extraction/comet/config/conceptnet/eval_changes.json ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+
3
+ "base": {
4
+ "0": {
5
+ "gpu_index": 0
6
+ },
7
+ "1": {
8
+ "gpu_index": 1
9
+ },
10
+ "2": {
11
+ "gpu_index": 2
12
+ },
13
+ "3": {
14
+ "gpu_index": 3
15
+ }
16
+ }
17
+ }
Model/COSMIC/feature_extraction/comet/config/default.json ADDED
@@ -0,0 +1,54 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "gpu_mode": "T",
3
+ "gpu_index": 0,
4
+ "gpu_indices": [0, 1],
5
+ "multigpu": "F",
6
+
7
+ "topk_size": 10,
8
+ "beam_size": 1,
9
+ "gen_seqlength": 40,
10
+ "eval_sampler": "greedy",
11
+ "num_sequences": 1,
12
+ "generate_sequences": 1000,
13
+ "evaluate_sequences": 10000,
14
+
15
+ "random_seed": 123,
16
+ "optimizer": "adam",
17
+ "batch_size": 64,
18
+ "learning_rate": 6.25e-5,
19
+
20
+ "clip": 1,
21
+ "loss": "nll",
22
+ "weight_decay": 0,
23
+
24
+ "adam": {
25
+ "b2": 0.999,
26
+ "b1": 0.9,
27
+ "e": 1e-8
28
+ },
29
+
30
+ "model": "transformer",
31
+ "pretrain": "gpt",
32
+ "hidden_dim": 768,
33
+ "num_layers": 12,
34
+ "num_heads": 12,
35
+ "embedding_dropout": 0.1,
36
+ "attention_dropout": 0.1,
37
+ "residual_dropout": 0.1,
38
+ "output_dropout": 0.1,
39
+ "activation": "gelu",
40
+ "init": "pt",
41
+
42
+ "trainer": "iteration",
43
+
44
+ "iterations": 50000,
45
+ "cycle": 500,
46
+
47
+ "save_strategy": "best",
48
+
49
+ "epochs": 20,
50
+ "toy": "F",
51
+ "do_gen": "F",
52
+ "save": "T",
53
+ "test_save": "F"
54
+ }
Model/COSMIC/feature_extraction/comet/data/atomic/README.md ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # ATOMIC
2
+
3
+ This tarball contains the ATOMIC knowledge graph.
4
+ Files present:
5
+ - `v4_atomic_all_agg.csv`: contains one event per line, with all annotations aggregated into one list (but not de-duplicated, so there might be repeats).
6
+ - `v4_atomic_all.csv`: keeps track of which worker did which annotations. Each line is the answers from one worker only, so there are multiple lines for the same event.
7
+ - `v4_atomic_trn.csv`, `v4_atomic_dev.csv`, `v4_atomic_tst.csv`: same as above, but divided according to the train/dev/test split.
8
+
9
+ All files are CSVs containing the following columns:
10
+ - event: just a string representation of the event.
11
+ - oEffect,oReact,oWant,xAttr,xEffect,xIntent,xNeed,xReact,xWant: annotations for each of the dimensions, stored in a json-dumped list of strings.
12
+ **Note**: `[""none""]` means the worker explicitly responded with the empty response, whereas `[]` means the worker did not annotate this dimension.
13
+ - prefix: json-dumped list that represents the prefix of content words (used to make a better trn/dev/tst split).
14
+ - split: string representation of which split the event belongs to.
15
+
16
+ Suggested code for loading the data into a pandas dataframe:
17
+ ```python
18
+ import pandas as pd
19
+ import json
20
+
21
+ df = pd.read_csv("v4_atomic_all.csv",index_col=0)
22
+ df.iloc[:,:9] = df.iloc[:,:9].apply(lambda col: col.apply(json.loads))
23
+ ```
24
+
25
+ **_Disclaimer/Content warning_**: the events in ATOMIC have been automatically extracted from blogs, stories, and books written at various times.
26
+ The events might depict violent or problematic actions, which we left in the corpus for the sake of learning the (probably negative but still important) commonsense implications associated with the events.
27
+ We removed a small set of truly outdated events, but might have missed some, so please email us ([email protected]) if you have any concerns.
28
+
29
+ ## Paper
30
+ Please cite the following work when using this data:
31
+
32
+ > Maarten Sap, Ronan LeBras, Emily Allaway, Chandra Bhagavatula, Nicholas Lourie, Hannah Rashkin, Brendan Roof, Noah A. Smith & Yejin Choi (2019).
33
+ > ATOMIC: An Atlas of Machine Commonsense for If-Then Reasoning. AAAI
Model/COSMIC/feature_extraction/comet/data/atomic/sap2019atomic.pdf ADDED
Binary file (745 kB). View file
 
Model/COSMIC/feature_extraction/comet/model/encoder_bpe_40000.json ADDED
The diff for this file is too large to render. See raw diff
 
Model/COSMIC/feature_extraction/comet/model/params_0.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d9cd095b901dfbfbe0ce5e01d151dfe0b791e955d71149969ba65a6eab4480f
3
+ size 46614044
Model/COSMIC/feature_extraction/comet/model/params_1.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca074893c040fa69cbf2fc95c06feda45a4e1492d03b645e2076e89ccf7ddd9f
3
+ size 46614044
Model/COSMIC/feature_extraction/comet/model/params_2.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:966c25fbd632f0df18c4d4380ba57f23410f43311a96616f00b3d05ae6592f58
3
+ size 46614044
Model/COSMIC/feature_extraction/comet/model/params_3.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40df0d328f5d3d1b2bec768855a5d2eeeaf2b2124758ef98116f76a02526fd92
3
+ size 46614044
Model/COSMIC/feature_extraction/comet/model/params_4.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:139f098dcd620ccf0200530e9ce9ff1c342714ff881a0c7258ac9faac4a06e6a
3
+ size 46614040
Model/COSMIC/feature_extraction/comet/model/params_5.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad27b5cb245db9a29657270ff637d3ff1c15fd9df3683324a2936674cef8c3c5
3
+ size 46614040
Model/COSMIC/feature_extraction/comet/model/params_6.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af5bb5c76ddfea50683e0b9895fe704ae689853ed8bb3f1b3fee4daff2f27d45
3
+ size 46614040
Model/COSMIC/feature_extraction/comet/model/params_7.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27f55501d895ce1adb9b254aa762519a242edf2bcd2b43298b89538b5591566c
3
+ size 46614040
Model/COSMIC/feature_extraction/comet/model/params_8.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17a2b695128ea0aae98a360351b92769b879bc0f2835862949b6405b0ce88569
3
+ size 46614040
Model/COSMIC/feature_extraction/comet/model/params_9.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1355fcd519db223f65db7fa7b79dcaf9b4c653915ffe4bd417d87f7903225c1
3
+ size 46614040
Model/COSMIC/feature_extraction/comet/model/params_shapes.json ADDED
@@ -0,0 +1 @@
 
 
1
+ [[512, 768], [40478, 768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768]]
Model/COSMIC/feature_extraction/comet/model/vocab_40000.bpe ADDED
The diff for this file is too large to render. See raw diff
 
Model/COSMIC/feature_extraction/epik-bin/input0/dict.txt ADDED
The diff for this file is too large to render. See raw diff
 
Model/COSMIC/feature_extraction/epik-bin/input0/train.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed51da33e9e82f6caf591795fdd8113dbc0c4a53a418f7eeb06b114f5f5b6b28
3
+ size 1775332
Model/COSMIC/feature_extraction/epik-bin/input0/train.idx ADDED
Binary file (820 kB). View file
 
Model/COSMIC/feature_extraction/epik-bin/input0/valid.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bb9cf83ea51adf9bdf7bbb90186d232b7d8c5e8c6fa5d4fa75daf61b1ba0707
3
+ size 223948
Model/COSMIC/feature_extraction/epik-bin/input0/valid.idx ADDED
Binary file (105 kB). View file
 
Model/COSMIC/feature_extraction/epik-bin/label/dict.txt ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 0 14125
2
+ 1 7674
3
+ 2 7674
4
+ 3 6735
5
+ 4 5564
6
+ 5 4875
7
+ 6 3589
8
+ 7 3475
9
+ 8 3045
10
+ 9 2900
11
+ 10 2823
12
+ 11 1918
13
+ 12 1616
14
+ 13 1423
15
+ 14 931
16
+ madeupword0000 0
17
+ madeupword0001 0
18
+ madeupword0002 0
19
+ madeupword0003 0
20
+ madeupword0004 0
Model/COSMIC/feature_extraction/epik-bin/label/train.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84917004eb53f27db1e68c2b6ff14eafb193e5f3c43cbe995a6fc1cf22a4b442
3
+ size 273468
Model/COSMIC/feature_extraction/epik-bin/label/train.idx ADDED
Binary file (820 kB). View file
 
Model/COSMIC/feature_extraction/epik-bin/label/valid.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5637d7a2e1353adf06ec34cdfeaf6ce2f002b0de466ef15afe84e2c0dd3f24a6
3
+ size 35136
Model/COSMIC/feature_extraction/epik-bin/label/valid.idx ADDED
Binary file (105 kB). View file