cpi-connect commited on
Commit
77eacb7
·
1 Parent(s): 6d09a34

Upload model

Browse files
Files changed (5) hide show
  1. .gitattributes +1 -0
  2. config.json +14 -0
  3. configuration.py +16 -0
  4. model.py +66 -0
  5. pytorch_model.bin +3 -0
.gitattributes ADDED
@@ -0,0 +1 @@
 
 
1
+ pytorch_model.bin filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "CybersecurityKnowledgeGraphModel"
4
+ ],
5
+ "auto_map": {
6
+ "AutoConfig": "configuration.CybersecurityKnowledgeGraphConfig",
7
+ "AutoModelForTokenClassification": "model.CybersecurityKnowledgeGraphModel"
8
+ },
9
+ "event_argument_model_path": "cybersecurity_knowledge_graph/argument_model_state_dict.pth",
10
+ "event_nugget_model_path": "cybersecurity_knowledge_graph/nugget_model_state_dict.pth",
11
+ "event_realis_model_path": "cybersecurity_knowledge_graph/realis_model_state_dict.pth",
12
+ "torch_dtype": "float32",
13
+ "transformers_version": "4.33.2"
14
+ }
configuration.py ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from transformers import PretrainedConfig
2
+ import torch
3
+
4
+ class CybersecurityKnowledgeGraphConfig(PretrainedConfig):
5
+
6
+ def __init__(
7
+ self,
8
+ event_nugget_model_path : str = "nugget_model_state_dict.pth",
9
+ event_argument_model_path : str = "argument_model_state_dict.pth",
10
+ event_realis_model_path : str = "realis_model_state_dict.pth",
11
+ **kwargs,
12
+ ):
13
+ self.event_nugget_model_path = event_nugget_model_path
14
+ self.event_argument_model_path = event_argument_model_path
15
+ self.event_realis_model_path = event_realis_model_path
16
+ super().__init__(**kwargs)
model.py ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from transformers import PreTrainedModel
2
+ import torch
3
+
4
+ from cybersecurity_knowledge_graph.nugget_model_utils import CustomRobertaWithPOS as NuggetModel
5
+ from cybersecurity_knowledge_graph.args_model_utils import CustomRobertaWithPOS as ArgumentModel
6
+ from cybersecurity_knowledge_graph.realis_model_utils import CustomRobertaWithPOS as RealisModel
7
+
8
+ from cybersecurity_knowledge_graph.configuration import CybersecurityKnowledgeGraphConfig
9
+
10
+ from cybersecurity_knowledge_graph.event_nugget_predict import create_dataloader as event_nugget_dataloader
11
+ from cybersecurity_knowledge_graph.event_realis_predict import create_dataloader as event_realis_dataloader
12
+ from cybersecurity_knowledge_graph.event_arg_predict import create_dataloader as event_argument_dataloader
13
+
14
+ class CybersecurityKnowledgeGraphModel(PreTrainedModel):
15
+ config_class = CybersecurityKnowledgeGraphConfig
16
+
17
+ def __init__(self, config):
18
+ super().__init__(config)
19
+ self.event_nugget_model_path = config.event_nugget_model_path
20
+ self.event_argument_model_path = config.event_argument_model_path
21
+ self.event_realis_model_path = config.event_realis_model_path
22
+
23
+ self.event_nugget_dataloader = event_nugget_dataloader
24
+ self.event_argument_dataloader = event_argument_dataloader
25
+ self.event_realis_dataloader = event_realis_dataloader
26
+
27
+ self.event_nugget_model = NuggetModel(num_classes = 11)
28
+ self.event_argument_model = ArgumentModel(num_classes = 43)
29
+ self.event_realis_model = RealisModel(num_classes_realis = 4)
30
+
31
+ self.event_nugget_model.load_state_dict(torch.load(self.event_nugget_model_path))
32
+ self.event_realis_model.load_state_dict(torch.load(self.event_realis_model_path))
33
+ self.event_argument_model.load_state_dict(torch.load(self.event_argument_model_path))
34
+
35
+
36
+ def forward(self, text):
37
+ nugget_dataloader, _ = self.event_nugget_dataloader(text)
38
+ argument_dataloader, _ = self.event_argument_dataloader(text)
39
+ realis_dataloader, _ = self.event_realis_dataloader(text)
40
+
41
+ nugget_pred = self.forward_model(self.event_nugget_model, nugget_dataloader)
42
+ no_nuggets = torch.all(nugget_pred == 0, dim=1)
43
+
44
+ argument_preds = torch.empty(nugget_pred.size())
45
+ realis_preds = torch.empty(nugget_pred.size())
46
+ for idx, (batch, no_nugget) in enumerate(zip(nugget_pred, no_nuggets)):
47
+ if no_nugget:
48
+ argument_pred, realis_pred = torch.zeros(batch.size()), torch.zeros(batch.size())
49
+ else:
50
+ argument_pred = self.forward_model(self.event_argument_model, argument_dataloader)
51
+ realis_pred = self.forward_model(self.event_realis_model, realis_dataloader)
52
+ argument_preds[idx] = argument_pred
53
+ realis_preds[idx] = realis_pred
54
+
55
+ return {"nugget" : nugget_pred, "argument" : argument_pred, "realis" : realis_pred}
56
+
57
+ def forward_model(self, model, dataloader):
58
+ predicted_label = []
59
+ for batch in dataloader:
60
+ with torch.no_grad():
61
+ print(batch.keys())
62
+ logits = model(**batch)
63
+
64
+ batch_predicted_label = logits.argmax(-1)
65
+ predicted_label.append(batch_predicted_label)
66
+ return torch.cat(predicted_label, dim=-1)
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fef48b6b9271dd45d7102c4efd5a90a3e2897daeb2393dcbd6e4fc3aa94494c5
3
+ size 1496163441