Or4cl3-1 committed on
Commit
46216fd
1 Parent(s): 280875b

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +42 -35
config.json CHANGED
@@ -1,37 +1,44 @@
1
  {
2
- "model_type": "auto",
3
- "model_name_or_path": "Or4cl3-1/Daedalus_1",
4
- "tokenizer_name_or_path": "Or4cl3-1/Daedalus_1",
5
- "pad_to_max_length": true,
6
- "max_length": 1024,
7
- "num_beams": 4,
8
- "eos_token_id": 2,
9
- "length_penalty": 2.0,
10
- "no_repeat_ngram_size": 3,
11
- "early_stopping": True,
12
- "skip_special_tokens": True,
13
- "use_cache": True,
14
- "output_hidden_states": False,
15
- "output_attentions": False,
16
- "return_dict_in_generate": True,
17
- "forced_bos_token_id": 0,
18
- "forced_eos_token_id": 2,
19
- "remove_invalid_values": False,
20
- "torchscript": False,
21
- "use_multiprocessing": False,
22
- "bfloat16": False,
23
- "past_index": -1,
24
- "task_specific_params": {
25
- "summarization": {
26
- "num_beams": 8,
27
- "length_penalty": 1.0,
28
- "max_length": 128
29
  },
30
- "question-answering": {
31
- "num_beams": 8,
32
- "length_penalty": 1.0,
33
- "max_length": 384
34
- }
35
- }
36
- }
37
-
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  {
2
+ "model_name": "Daedalus_1: The Forge of Visionary Innovation",
3
+ "description": "A cutting-edge AI model blending CodeBERT, Codex, T5, SAM, Gemini, and Megatron for transformative innovation.",
4
+ "version": "1.0",
5
+ "author": "Or4cl3 AI Solutions",
6
+ "framework": "PyTorch",
7
+ "python_version": "3.x",
8
+ "deep_learning_framework": "PyTorch",
9
+ "constituent_models": [
10
+ {
11
+ "name": "Or4cl3-1/code-slerp",
12
+ "description": "Empowers Daedalus_1 with expertise in software engineering, code generation, and task-oriented language understanding."
13
+ },
14
+ {
15
+ "name": "Or4cl3-1/SAM-Gemini-BLOOM-OPT-Gopher-Megatron-slerp",
16
+ "description": "Provides Daedalus_1 with a deep, multifaceted understanding of complex concepts, human-like reasoning, and creativity."
17
+ }
18
+ ],
19
+ "architectural_design": {
20
+ "merge_method": "SLERP (Spherical Linear Interpolation)",
21
+ "selected_layers": 32
 
 
 
 
 
 
 
22
  },
23
+ "capabilities": [
24
+ "Rapid Prototyping and Code Generation",
25
+ "Multidisciplinary Understanding",
26
+ "Adaptability and Continuous Improvement",
27
+ "Ethical Considerations"
28
+ ],
29
+ "applications": [
30
+ "Software Development",
31
+ "Scientific Research",
32
+ "Creative Problem-Solving"
33
+ ],
34
+ "training_data": "Internal and External Datasets",
35
+ "training_steps": 200000,
36
+ "batch_size": 32,
37
+ "learning_rate": 0.0001,
38
+ "max_sequence_length": 1024,
39
+ "num_layers": 24,
40
+ "num_heads": 16,
41
+ "hidden_size": 1024,
42
+ "dropout_rate": 0.2,
43
+ "num_epochs": 20
44
+ }