Spaces:
Sleeping
Sleeping
Minh Q. Le
committed on
Commit
·
b63a495
1
Parent(s):
9250417
Push data
Browse files- Model/COSMIC/feature_extraction/comet/config/atomic/changes.json +16 -0
- Model/COSMIC/feature_extraction/comet/config/atomic/config_0.json +79 -0
- Model/COSMIC/feature_extraction/comet/config/atomic/default.json +16 -0
- Model/COSMIC/feature_extraction/comet/config/atomic/eval_changes.json +25 -0
- Model/COSMIC/feature_extraction/comet/config/conceptnet/changes.json +16 -0
- Model/COSMIC/feature_extraction/comet/config/conceptnet/config_0.json +61 -0
- Model/COSMIC/feature_extraction/comet/config/conceptnet/default.json +23 -0
- Model/COSMIC/feature_extraction/comet/config/conceptnet/eval_changes.json +17 -0
- Model/COSMIC/feature_extraction/comet/config/default.json +54 -0
- Model/COSMIC/feature_extraction/comet/data/atomic/README.md +33 -0
- Model/COSMIC/feature_extraction/comet/data/atomic/sap2019atomic.pdf +0 -0
- Model/COSMIC/feature_extraction/comet/model/encoder_bpe_40000.json +0 -0
- Model/COSMIC/feature_extraction/comet/model/params_0.npy +3 -0
- Model/COSMIC/feature_extraction/comet/model/params_1.npy +3 -0
- Model/COSMIC/feature_extraction/comet/model/params_2.npy +3 -0
- Model/COSMIC/feature_extraction/comet/model/params_3.npy +3 -0
- Model/COSMIC/feature_extraction/comet/model/params_4.npy +3 -0
- Model/COSMIC/feature_extraction/comet/model/params_5.npy +3 -0
- Model/COSMIC/feature_extraction/comet/model/params_6.npy +3 -0
- Model/COSMIC/feature_extraction/comet/model/params_7.npy +3 -0
- Model/COSMIC/feature_extraction/comet/model/params_8.npy +3 -0
- Model/COSMIC/feature_extraction/comet/model/params_9.npy +3 -0
- Model/COSMIC/feature_extraction/comet/model/params_shapes.json +1 -0
- Model/COSMIC/feature_extraction/comet/model/vocab_40000.bpe +0 -0
- Model/COSMIC/feature_extraction/epik-bin/input0/dict.txt +0 -0
- Model/COSMIC/feature_extraction/epik-bin/input0/train.bin +3 -0
- Model/COSMIC/feature_extraction/epik-bin/input0/train.idx +0 -0
- Model/COSMIC/feature_extraction/epik-bin/input0/valid.bin +3 -0
- Model/COSMIC/feature_extraction/epik-bin/input0/valid.idx +0 -0
- Model/COSMIC/feature_extraction/epik-bin/label/dict.txt +20 -0
- Model/COSMIC/feature_extraction/epik-bin/label/train.bin +3 -0
- Model/COSMIC/feature_extraction/epik-bin/label/train.idx +0 -0
- Model/COSMIC/feature_extraction/epik-bin/label/valid.bin +3 -0
- Model/COSMIC/feature_extraction/epik-bin/label/valid.idx +0 -0
Model/COSMIC/feature_extraction/comet/config/atomic/changes.json
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"base": {
|
3 |
+
"0": {
|
4 |
+
"gpu_index": 0
|
5 |
+
},
|
6 |
+
"1": {
|
7 |
+
"gpu_index": 1
|
8 |
+
},
|
9 |
+
"2": {
|
10 |
+
"gpu_index": 2
|
11 |
+
},
|
12 |
+
"3": {
|
13 |
+
"gpu_index": 3
|
14 |
+
}
|
15 |
+
}
|
16 |
+
}
|
Model/COSMIC/feature_extraction/comet/config/atomic/config_0.json
ADDED
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"gpu_mode": "T",
|
3 |
+
"gpu_index": 0,
|
4 |
+
"gpu_indices": [
|
5 |
+
0,
|
6 |
+
1
|
7 |
+
],
|
8 |
+
"multigpu": "F",
|
9 |
+
"topk_size": 10,
|
10 |
+
"beam_size": 1,
|
11 |
+
"gen_seqlength": 40,
|
12 |
+
"eval_sampler": "greedy",
|
13 |
+
"num_sequences": 1,
|
14 |
+
"generate_sequences": "full",
|
15 |
+
"evaluate_sequences": "full",
|
16 |
+
"random_seed": 123,
|
17 |
+
"optimizer": "adam",
|
18 |
+
"batch_size": 64,
|
19 |
+
"learning_rate": 6.25e-05,
|
20 |
+
"clip": 1,
|
21 |
+
"loss": "nll",
|
22 |
+
"weight_decay": 0,
|
23 |
+
"adam": {
|
24 |
+
"b2": 0.999,
|
25 |
+
"b1": 0.9,
|
26 |
+
"e": 1e-08
|
27 |
+
},
|
28 |
+
"model": "transformer",
|
29 |
+
"pretrain": "gpt",
|
30 |
+
"hidden_dim": 768,
|
31 |
+
"num_layers": 12,
|
32 |
+
"num_heads": 12,
|
33 |
+
"embedding_dropout": 0.1,
|
34 |
+
"attention_dropout": 0.1,
|
35 |
+
"residual_dropout": 0.1,
|
36 |
+
"output_dropout": 0.1,
|
37 |
+
"activation": "gelu",
|
38 |
+
"init": "pt",
|
39 |
+
"trainer": "iteration",
|
40 |
+
"iterations": 50000,
|
41 |
+
"cycle": 500,
|
42 |
+
"save_strategy": "best",
|
43 |
+
"epochs": 20,
|
44 |
+
"toy": "F",
|
45 |
+
"do_gen": "F",
|
46 |
+
"save": "T",
|
47 |
+
"test_save": "F",
|
48 |
+
"dataset": "atomic",
|
49 |
+
"categories": [
|
50 |
+
"oReact",
|
51 |
+
"oEffect",
|
52 |
+
"oWant",
|
53 |
+
"xAttr",
|
54 |
+
"xEffect",
|
55 |
+
"xIntent",
|
56 |
+
"xNeed",
|
57 |
+
"xReact",
|
58 |
+
"xWant"
|
59 |
+
],
|
60 |
+
"eval_categories": [
|
61 |
+
"oReact",
|
62 |
+
"oEffect",
|
63 |
+
"oWant",
|
64 |
+
"xAttr",
|
65 |
+
"xEffect",
|
66 |
+
"xIntent",
|
67 |
+
"xNeed",
|
68 |
+
"xReact",
|
69 |
+
"xWant"
|
70 |
+
],
|
71 |
+
"exp": "generation",
|
72 |
+
"labels": "individual",
|
73 |
+
"encoder_path": "model/encoder_bpe_40000.json",
|
74 |
+
"bpe_path": "model/vocab_40000.bpe",
|
75 |
+
"learning_rate_schedule": "warmup_linear",
|
76 |
+
"learning_rate_warmup": 0.002,
|
77 |
+
"l2": 0.01,
|
78 |
+
"vector_l2": "T"
|
79 |
+
}
|
Model/COSMIC/feature_extraction/comet/config/atomic/default.json
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
|
3 |
+
"dataset": "atomic",
|
4 |
+
"categories": ["oReact", "oEffect", "oWant", "xAttr", "xEffect", "xIntent", "xNeed", "xReact", "xWant"],
|
5 |
+
"eval_categories": ["oReact", "oEffect", "oWant", "xAttr", "xEffect", "xIntent", "xNeed", "xReact", "xWant"],
|
6 |
+
"exp": "generation",
|
7 |
+
"labels": "individual",
|
8 |
+
"encoder_path": "model/encoder_bpe_40000.json",
|
9 |
+
"bpe_path": "model/vocab_40000.bpe",
|
10 |
+
"batch_size": 64,
|
11 |
+
"learning_rate_schedule": "warmup_linear",
|
12 |
+
"learning_rate_warmup": 0.002,
|
13 |
+
"l2": 0.01,
|
14 |
+
"vector_l2": "T",
|
15 |
+
"evaluate_sequences": 10000
|
16 |
+
}
|
Model/COSMIC/feature_extraction/comet/config/atomic/eval_changes.json
ADDED
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
|
3 |
+
"base": {
|
4 |
+
"0": {
|
5 |
+
"gpu_index": 0,
|
6 |
+
"generate_sequences": "full",
|
7 |
+
"evaluate_sequences": "full"
|
8 |
+
},
|
9 |
+
"1": {
|
10 |
+
"gpu_index": 1,
|
11 |
+
"generate_sequences": "full",
|
12 |
+
"evaluate_sequences": "full"
|
13 |
+
},
|
14 |
+
"2": {
|
15 |
+
"gpu_index": 2,
|
16 |
+
"generate_sequences": "full",
|
17 |
+
"evaluate_sequences": "full"
|
18 |
+
},
|
19 |
+
"3": {
|
20 |
+
"gpu_index": 3,
|
21 |
+
"generate_sequences": "full",
|
22 |
+
"evaluate_sequences": "full"
|
23 |
+
}
|
24 |
+
}
|
25 |
+
}
|
Model/COSMIC/feature_extraction/comet/config/conceptnet/changes.json
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"base": {
|
3 |
+
"0": {
|
4 |
+
"gpu_index": 0
|
5 |
+
},
|
6 |
+
"1": {
|
7 |
+
"gpu_index": 1
|
8 |
+
},
|
9 |
+
"2": {
|
10 |
+
"gpu_index": 2
|
11 |
+
},
|
12 |
+
"3": {
|
13 |
+
"gpu_index": 3
|
14 |
+
}
|
15 |
+
}
|
16 |
+
}
|
Model/COSMIC/feature_extraction/comet/config/conceptnet/config_0.json
ADDED
@@ -0,0 +1,61 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"gpu_mode": "T",
|
3 |
+
"gpu_index": 0,
|
4 |
+
"gpu_indices": [
|
5 |
+
0,
|
6 |
+
1
|
7 |
+
],
|
8 |
+
"multigpu": "F",
|
9 |
+
"topk_size": 10,
|
10 |
+
"beam_size": 1,
|
11 |
+
"gen_seqlength": 40,
|
12 |
+
"eval_sampler": "greedy",
|
13 |
+
"num_sequences": 1,
|
14 |
+
"generate_sequences": "full",
|
15 |
+
"evaluate_sequences": "full",
|
16 |
+
"random_seed": 123,
|
17 |
+
"optimizer": "adam",
|
18 |
+
"batch_size": 64,
|
19 |
+
"learning_rate": 1e-05,
|
20 |
+
"clip": 1,
|
21 |
+
"loss": "nll",
|
22 |
+
"weight_decay": 0,
|
23 |
+
"adam": {
|
24 |
+
"b2": 0.999,
|
25 |
+
"b1": 0.9,
|
26 |
+
"e": 1e-08
|
27 |
+
},
|
28 |
+
"model": "transformer",
|
29 |
+
"pretrain": "gpt",
|
30 |
+
"hidden_dim": 768,
|
31 |
+
"num_layers": 12,
|
32 |
+
"num_heads": 12,
|
33 |
+
"embedding_dropout": 0.1,
|
34 |
+
"attention_dropout": 0.1,
|
35 |
+
"residual_dropout": 0.1,
|
36 |
+
"output_dropout": 0.1,
|
37 |
+
"activation": "gelu",
|
38 |
+
"init": "pt",
|
39 |
+
"trainer": "iteration",
|
40 |
+
"iterations": 100000,
|
41 |
+
"cycle": 500,
|
42 |
+
"save_strategy": "best",
|
43 |
+
"epochs": 20,
|
44 |
+
"toy": "F",
|
45 |
+
"do_gen": "T",
|
46 |
+
"save": "T",
|
47 |
+
"test_save": "F",
|
48 |
+
"dataset": "conceptnet",
|
49 |
+
"exp": "generation",
|
50 |
+
"encoder_path": "model/encoder_bpe_40000.json",
|
51 |
+
"bpe_path": "model/vocab_40000.bpe",
|
52 |
+
"learning_rate_schedule": "warmup_linear",
|
53 |
+
"learning_rate_warmup": 0.002,
|
54 |
+
"l2": 0.01,
|
55 |
+
"vector_l2": "T",
|
56 |
+
"relation_format": "language",
|
57 |
+
"training_set_size": 100,
|
58 |
+
"development_set_versions_to_use": "12",
|
59 |
+
"max_event_1_size": 10,
|
60 |
+
"max_event_2_size": 15
|
61 |
+
}
|
Model/COSMIC/feature_extraction/comet/config/conceptnet/default.json
ADDED
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
|
3 |
+
"dataset": "conceptnet",
|
4 |
+
"exp": "generation",
|
5 |
+
"do_gen": "T",
|
6 |
+
"encoder_path": "model/encoder_bpe_40000.json",
|
7 |
+
"bpe_path": "model/vocab_40000.bpe",
|
8 |
+
"batch_size": 64,
|
9 |
+
"learning_rate_schedule": "warmup_linear",
|
10 |
+
"learning_rate_warmup": 0.002,
|
11 |
+
"l2": 0.01,
|
12 |
+
"vector_l2": "T",
|
13 |
+
"generate_sequences": "full",
|
14 |
+
"evaluate_sequences": "full",
|
15 |
+
"relation_format": "language",
|
16 |
+
"training_set_size": 100,
|
17 |
+
"development_set_versions_to_use": "12",
|
18 |
+
"max_event_1_size": 10,
|
19 |
+
"max_event_2_size": 15,
|
20 |
+
"eval_sampler": "greedy",
|
21 |
+
"iterations": 100000,
|
22 |
+
"learning_rate": 1e-5
|
23 |
+
}
|
Model/COSMIC/feature_extraction/comet/config/conceptnet/eval_changes.json
ADDED
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
|
3 |
+
"base": {
|
4 |
+
"0": {
|
5 |
+
"gpu_index": 0
|
6 |
+
},
|
7 |
+
"1": {
|
8 |
+
"gpu_index": 1
|
9 |
+
},
|
10 |
+
"2": {
|
11 |
+
"gpu_index": 2
|
12 |
+
},
|
13 |
+
"3": {
|
14 |
+
"gpu_index": 3
|
15 |
+
}
|
16 |
+
}
|
17 |
+
}
|
Model/COSMIC/feature_extraction/comet/config/default.json
ADDED
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"gpu_mode": "T",
|
3 |
+
"gpu_index": 0,
|
4 |
+
"gpu_indices": [0, 1],
|
5 |
+
"multigpu": "F",
|
6 |
+
|
7 |
+
"topk_size": 10,
|
8 |
+
"beam_size": 1,
|
9 |
+
"gen_seqlength": 40,
|
10 |
+
"eval_sampler": "greedy",
|
11 |
+
"num_sequences": 1,
|
12 |
+
"generate_sequences": 1000,
|
13 |
+
"evaluate_sequences": 10000,
|
14 |
+
|
15 |
+
"random_seed": 123,
|
16 |
+
"optimizer": "adam",
|
17 |
+
"batch_size": 64,
|
18 |
+
"learning_rate": 6.25e-5,
|
19 |
+
|
20 |
+
"clip": 1,
|
21 |
+
"loss": "nll",
|
22 |
+
"weight_decay": 0,
|
23 |
+
|
24 |
+
"adam": {
|
25 |
+
"b2": 0.999,
|
26 |
+
"b1": 0.9,
|
27 |
+
"e": 1e-8
|
28 |
+
},
|
29 |
+
|
30 |
+
"model": "transformer",
|
31 |
+
"pretrain": "gpt",
|
32 |
+
"hidden_dim": 768,
|
33 |
+
"num_layers": 12,
|
34 |
+
"num_heads": 12,
|
35 |
+
"embedding_dropout": 0.1,
|
36 |
+
"attention_dropout": 0.1,
|
37 |
+
"residual_dropout": 0.1,
|
38 |
+
"output_dropout": 0.1,
|
39 |
+
"activation": "gelu",
|
40 |
+
"init": "pt",
|
41 |
+
|
42 |
+
"trainer": "iteration",
|
43 |
+
|
44 |
+
"iterations": 50000,
|
45 |
+
"cycle": 500,
|
46 |
+
|
47 |
+
"save_strategy": "best",
|
48 |
+
|
49 |
+
"epochs": 20,
|
50 |
+
"toy": "F",
|
51 |
+
"do_gen": "F",
|
52 |
+
"save": "T",
|
53 |
+
"test_save": "F"
|
54 |
+
}
|
Model/COSMIC/feature_extraction/comet/data/atomic/README.md
ADDED
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# ATOMIC
|
2 |
+
|
3 |
+
This tarball contains the ATOMIC knowledge graph.
|
4 |
+
Files present:
|
5 |
+
- `v4_atomic_all_agg.csv`: contains one event per line, with all annotations aggregated into one list (but not de-duplicated, so there might be repeats).
|
6 |
+
- `v4_atomic_all.csv`: keeps track of which worker did which annotations. Each line is the answers from one worker only, so there are multiple lines for the same event.
|
7 |
+
- `v4_atomic_trn.csv`, `v4_atomic_dev.csv`, `v4_atomic_tst.csv`: same as above, but partitioned according to the train/dev/test split.
|
8 |
+
|
9 |
+
All files are CSVs containing the following columns:
|
10 |
+
- event: just a string representation of the event.
|
11 |
+
- oEffect,oReact,oWant,xAttr,xEffect,xIntent,xNeed,xReact,xWant: annotations for each of the dimensions, stored in a json-dumped list of strings.
|
12 |
+
**Note**: `[""none""]` means the worker explicitly responded with the empty response, whereas `[]` means the worker did not annotate this dimension.
|
13 |
+
- prefix: json-dumped list that represents the prefix of content words (used to make a better trn/dev/tst split).
|
14 |
+
- split: string naming the split (train/dev/test) that the event belongs to.
|
15 |
+
|
16 |
+
Suggested code for loading the data into a pandas dataframe:
|
17 |
+
```python
|
18 |
+
import pandas as pd
|
19 |
+
import json
|
20 |
+
|
21 |
+
df = pd.read_csv("v4_atomic_all.csv",index_col=0)
|
22 |
+
df.iloc[:,:9] = df.iloc[:,:9].apply(lambda col: col.apply(json.loads))
|
23 |
+
```
|
24 |
+
|
25 |
+
**_Disclaimer/Content warning_**: the events in ATOMIC have been automatically extracted from blogs, stories and books written at various times.
|
26 |
+
The events might depict violent or problematic actions, which we left in the corpus for the sake of learning the (probably negative but still important) commonsense implications associated with the events.
|
27 |
+
We removed a small set of truly out-dated events, but might have missed some so please email us ([email protected]) if you have any concerns.
|
28 |
+
|
29 |
+
## Paper
|
30 |
+
Please cite the following work when using this data:
|
31 |
+
|
32 |
+
> Maarten Sap, Ronan LeBras, Emily Allaway, Chandra Bhagavatula, Nicholas Lourie, Hannah Rashkin, Brendan Roof, Noah A. Smith & Yejin Choi (2019).
|
33 |
+
> ATOMIC: An Atlas of Machine Commonsense for If-Then Reasoning. AAAI
|
Model/COSMIC/feature_extraction/comet/data/atomic/sap2019atomic.pdf
ADDED
Binary file (745 kB). View file
|
|
Model/COSMIC/feature_extraction/comet/model/encoder_bpe_40000.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
Model/COSMIC/feature_extraction/comet/model/params_0.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d9cd095b901dfbfbe0ce5e01d151dfe0b791e955d71149969ba65a6eab4480f
|
3 |
+
size 46614044
|
Model/COSMIC/feature_extraction/comet/model/params_1.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca074893c040fa69cbf2fc95c06feda45a4e1492d03b645e2076e89ccf7ddd9f
|
3 |
+
size 46614044
|
Model/COSMIC/feature_extraction/comet/model/params_2.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:966c25fbd632f0df18c4d4380ba57f23410f43311a96616f00b3d05ae6592f58
|
3 |
+
size 46614044
|
Model/COSMIC/feature_extraction/comet/model/params_3.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40df0d328f5d3d1b2bec768855a5d2eeeaf2b2124758ef98116f76a02526fd92
|
3 |
+
size 46614044
|
Model/COSMIC/feature_extraction/comet/model/params_4.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:139f098dcd620ccf0200530e9ce9ff1c342714ff881a0c7258ac9faac4a06e6a
|
3 |
+
size 46614040
|
Model/COSMIC/feature_extraction/comet/model/params_5.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad27b5cb245db9a29657270ff637d3ff1c15fd9df3683324a2936674cef8c3c5
|
3 |
+
size 46614040
|
Model/COSMIC/feature_extraction/comet/model/params_6.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af5bb5c76ddfea50683e0b9895fe704ae689853ed8bb3f1b3fee4daff2f27d45
|
3 |
+
size 46614040
|
Model/COSMIC/feature_extraction/comet/model/params_7.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27f55501d895ce1adb9b254aa762519a242edf2bcd2b43298b89538b5591566c
|
3 |
+
size 46614040
|
Model/COSMIC/feature_extraction/comet/model/params_8.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17a2b695128ea0aae98a360351b92769b879bc0f2835862949b6405b0ce88569
|
3 |
+
size 46614040
|
Model/COSMIC/feature_extraction/comet/model/params_9.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1355fcd519db223f65db7fa7b79dcaf9b4c653915ffe4bd417d87f7903225c1
|
3 |
+
size 46614040
|
Model/COSMIC/feature_extraction/comet/model/params_shapes.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
[[512, 768], [40478, 768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768], [1, 768, 2304], [2304], [1, 768, 768], [768], [768], [768], [1, 768, 3072], [3072], [1, 3072, 768], [768], [768], [768]]
|
Model/COSMIC/feature_extraction/comet/model/vocab_40000.bpe
ADDED
The diff for this file is too large to render.
See raw diff
|
|
Model/COSMIC/feature_extraction/epik-bin/input0/dict.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
Model/COSMIC/feature_extraction/epik-bin/input0/train.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed51da33e9e82f6caf591795fdd8113dbc0c4a53a418f7eeb06b114f5f5b6b28
|
3 |
+
size 1775332
|
Model/COSMIC/feature_extraction/epik-bin/input0/train.idx
ADDED
Binary file (820 kB). View file
|
|
Model/COSMIC/feature_extraction/epik-bin/input0/valid.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bb9cf83ea51adf9bdf7bbb90186d232b7d8c5e8c6fa5d4fa75daf61b1ba0707
|
3 |
+
size 223948
|
Model/COSMIC/feature_extraction/epik-bin/input0/valid.idx
ADDED
Binary file (105 kB). View file
|
|
Model/COSMIC/feature_extraction/epik-bin/label/dict.txt
ADDED
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
0 14125
|
2 |
+
1 7674
|
3 |
+
2 7674
|
4 |
+
3 6735
|
5 |
+
4 5564
|
6 |
+
5 4875
|
7 |
+
6 3589
|
8 |
+
7 3475
|
9 |
+
8 3045
|
10 |
+
9 2900
|
11 |
+
10 2823
|
12 |
+
11 1918
|
13 |
+
12 1616
|
14 |
+
13 1423
|
15 |
+
14 931
|
16 |
+
madeupword0000 0
|
17 |
+
madeupword0001 0
|
18 |
+
madeupword0002 0
|
19 |
+
madeupword0003 0
|
20 |
+
madeupword0004 0
|
Model/COSMIC/feature_extraction/epik-bin/label/train.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84917004eb53f27db1e68c2b6ff14eafb193e5f3c43cbe995a6fc1cf22a4b442
|
3 |
+
size 273468
|
Model/COSMIC/feature_extraction/epik-bin/label/train.idx
ADDED
Binary file (820 kB). View file
|
|
Model/COSMIC/feature_extraction/epik-bin/label/valid.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5637d7a2e1353adf06ec34cdfeaf6ce2f002b0de466ef15afe84e2c0dd3f24a6
|
3 |
+
size 35136
|
Model/COSMIC/feature_extraction/epik-bin/label/valid.idx
ADDED
Binary file (105 kB). View file
|
|