Text Generation
gpt2
KuroFg1 committed on
Commit
469dcf2
·
verified ·
1 Parent(s): 9c3c814

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +28 -2
config.json CHANGED
@@ -1,3 +1,29 @@
1
  {
2
- "model_type": "qwen 2.5 72B"
3
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  {
2
+ "model_type": "gpt2",
3
+ "architectures": ["GPT2LMHeadModel"],
4
+ "vocab_size": 50257,
5
+ "n_positions": 1024,
6
+ "n_ctx": 1024,
7
+ "n_embd": 768,
8
+ "n_layer": 12,
9
+ "n_head": 12,
10
+ "activation_function": "gelu_new",
11
+ "resid_pdrop": 0.1,
12
+ "embd_pdrop": 0.1,
13
+ "attn_pdrop": 0.1,
14
+ "layer_norm_epsilon": 1e-5,
15
+ "bos_token_id": 50256,
16
+ "eos_token_id": 50256,
17
+ "pad_token_id": 50256,
18
+ "task_specific_params": {
19
+ "text-generation": {
20
+ "do_sample": true,
21
+ "max_length": 512,
22
+ "temperature": 0.8,
23
+ "top_p": 0.95,
24
+ "top_k": 50
25
+ }
26
+ },
27
+ "use_cache": true,
28
+ "summary": "ChatGPT-style conversational model fine-tuned from GPT-2 for dialogue and instruction-following."
29
+ }