igor committed on
Commit
554833e
1 Parent(s): 2db91ae

Added ONNX model (fake-quantized) compatible with TRT

Browse files
Files changed (3) hide show
  1. .gitattributes +1 -0
  2. gptj-i8.data +3 -0
  3. gptj-i8.onnx +3 -0
.gitattributes CHANGED
@@ -3,6 +3,7 @@
3
  *.bin filter=lfs diff=lfs merge=lfs -text
4
  *.bz2 filter=lfs diff=lfs merge=lfs -text
5
  *.ckpt filter=lfs diff=lfs merge=lfs -text
 
6
  *.engine filter=lfs diff=lfs merge=lfs -text
7
  *.ftz filter=lfs diff=lfs merge=lfs -text
8
  *.gz filter=lfs diff=lfs merge=lfs -text
 
3
  *.bin filter=lfs diff=lfs merge=lfs -text
4
  *.bz2 filter=lfs diff=lfs merge=lfs -text
5
  *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.data filter=lfs diff=lfs merge=lfs -text
7
  *.engine filter=lfs diff=lfs merge=lfs -text
8
  *.ftz filter=lfs diff=lfs merge=lfs -text
9
  *.gz filter=lfs diff=lfs merge=lfs -text
gptj-i8.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f63ee9c5642110c58e63a3e92bce93c6034221679b245f910a46eda8d98f1514
3
+ size 24326843360
gptj-i8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d90c5e2d1aab516d3727a92415a5b691fb5debf512b6b8311f91f7cdf17a6e5
3
+ size 1605007