lvj committed on
Commit
b56721a
·
1 Parent(s): 8aeab33

Upload folder using huggingface_hub

Browse files
Files changed (3) hide show
  1. .gitattributes +2 -0
  2. config.json +27 -11
  3. training_args.bin +0 -0
.gitattributes ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ pytorch_model.bin filter=lfs diff=lfs merge=lfs -text
2
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
config.json CHANGED
@@ -129,25 +129,41 @@
129
  },
130
  "model.embed_tokens": {
131
  "_data": {
132
- "activation_quantization": "int8_asym_per_token",
133
- "b": 2,
134
- "granularity": {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
135
  "_data": {
136
  "axis": 0
137
  },
138
  "_type": "PerAxis",
139
  "_version": 1
140
  },
141
- "layout": {
142
- "_data": {},
143
- "_type": "QDQLayout",
144
- "_version": 1
145
  },
146
- "quant_max": 1.5,
147
- "quant_min": -1.5,
148
- "scale_dtype": null
149
  },
150
- "_type": "StretchedIntxWeightConfig",
151
  "_version": 2
152
  }
153
  }
 
129
  },
130
  "model.embed_tokens": {
131
  "_data": {
132
+ "act_mapping_type": {
133
+ "_data": "ASYMMETRIC",
134
+ "_type": "MappingType"
135
+ },
136
+ "intx_choose_qparams_algorithm": {
137
+ "_data": "AFFINE",
138
+ "_type": "IntxChooseQParamsAlgorithm"
139
+ },
140
+ "intx_packing_format": {
141
+ "_data": "UNPACKED_TO_INT8",
142
+ "_type": "IntxPackingFormat"
143
+ },
144
+ "layout": {
145
+ "_data": {},
146
+ "_type": "QDQLayout",
147
+ "_version": 1
148
+ },
149
+ "weight_dtype": {
150
+ "_data": "int4",
151
+ "_type": "torch.dtype"
152
+ },
153
+ "weight_granularity": {
154
  "_data": {
155
  "axis": 0
156
  },
157
  "_type": "PerAxis",
158
  "_version": 1
159
  },
160
+ "weight_mapping_type": {
161
+ "_data": "SYMMETRIC",
162
+ "_type": "MappingType"
 
163
  },
164
+ "weight_scale_dtype": null
 
 
165
  },
166
+ "_type": "Int8DynamicActivationIntxWeightConfig",
167
  "_version": 2
168
  }
169
  }
training_args.bin CHANGED
Binary files a/training_args.bin and b/training_args.bin differ