fdaudens HF staff committed on
Commit
12f90f1
·
verified ·
1 Parent(s): 119c95e

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -21,81 +21,39 @@
21
  "hidden_activation": "gelu",
22
  "hidden_size": 768,
23
  "id2label": {
24
- "0": "AI Applications",
25
- "1": "AI Infrastructure",
26
- "2": "Agents",
27
- "3": "Argilla",
28
- "4": "Audio",
29
- "5": "Cloud Deployment",
30
- "6": "Code",
31
- "7": "Computer Vision",
32
- "8": "Data Engineering",
33
- "9": "Data Science",
34
- "10": "Deep Learning",
35
- "11": "Embeddings",
36
- "12": "Ethics",
37
- "13": "Evaluation",
38
- "14": "Fine-Tuning",
39
- "15": "Gaming",
40
- "16": "Generative AI",
41
- "17": "Gradio",
42
- "18": "Hardware",
43
- "19": "Hugging Face",
44
- "20": "Image",
45
- "21": "LLMs",
46
- "22": "ML Theory",
47
- "23": "MLOps",
48
- "24": "Model Optimization",
49
- "25": "Multimodal",
50
- "26": "NLP",
51
- "27": "Reinforcement Learning",
52
- "28": "Research Papers",
53
- "29": "Robotics",
54
- "30": "Security",
55
- "31": "Time Series",
56
- "32": "Tutorials",
57
- "33": "Video",
58
- "34": "XetHub"
59
  },
60
  "initializer_cutoff_factor": 2.0,
61
  "initializer_range": 0.02,
62
  "intermediate_size": 1152,
63
  "label2id": {
64
- "AI Applications": 0,
65
- "AI Infrastructure": 1,
66
- "Agents": 2,
67
- "Argilla": 3,
68
- "Audio": 4,
69
- "Cloud Deployment": 5,
70
- "Code": 6,
71
- "Computer Vision": 7,
72
- "Data Engineering": 8,
73
- "Data Science": 9,
74
- "Deep Learning": 10,
75
- "Embeddings": 11,
76
- "Ethics": 12,
77
- "Evaluation": 13,
78
- "Fine-Tuning": 14,
79
- "Gaming": 15,
80
- "Generative AI": 16,
81
- "Gradio": 17,
82
- "Hardware": 18,
83
- "Hugging Face": 19,
84
- "Image": 20,
85
- "LLMs": 21,
86
- "ML Theory": 22,
87
- "MLOps": 23,
88
- "Model Optimization": 24,
89
- "Multimodal": 25,
90
- "NLP": 26,
91
- "Reinforcement Learning": 27,
92
- "Research Papers": 28,
93
- "Robotics": 29,
94
- "Security": 30,
95
- "Time Series": 31,
96
- "Tutorials": 32,
97
- "Video": 33,
98
- "XetHub": 34
99
  },
100
  "layer_norm_eps": 1e-05,
101
  "local_attention": 128,
@@ -110,12 +68,13 @@
110
  "num_hidden_layers": 22,
111
  "pad_token_id": 50283,
112
  "position_embedding_type": "absolute",
113
- "problem_type": "multi_label_classification",
114
  "reference_compile": true,
 
115
  "sep_token_id": 50282,
116
  "sparse_pred_ignore_index": -100,
117
  "sparse_prediction": false,
118
  "torch_dtype": "float32",
119
- "transformers_version": "4.48.0.dev0",
120
  "vocab_size": 50368
121
  }
 
21
  "hidden_activation": "gelu",
22
  "hidden_size": 768,
23
  "id2label": {
24
+ "0": "embeddings",
25
+ "1": "ai ethics",
26
+ "10": "data engineering",
27
+ "11": "robotics",
28
+ "12": "speech & audio",
29
+ "13": "code models",
30
+ "2": "game development",
31
+ "3": "llm evaluation",
32
+ "4": "rlhf",
33
+ "5": "deployment & infrastructure",
34
+ "6": "ml fundamentals",
35
+ "7": "vision & multimodal",
36
+ "8": "diffusion models",
37
+ "9": "hub & platform"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
38
  },
39
  "initializer_cutoff_factor": 2.0,
40
  "initializer_range": 0.02,
41
  "intermediate_size": 1152,
42
  "label2id": {
43
+ "ai ethics": "1",
44
+ "code models": "13",
45
+ "data engineering": "10",
46
+ "deployment & infrastructure": "5",
47
+ "diffusion models": "8",
48
+ "embeddings": "0",
49
+ "game development": "2",
50
+ "hub & platform": "9",
51
+ "llm evaluation": "3",
52
+ "ml fundamentals": "6",
53
+ "rlhf": "4",
54
+ "robotics": "11",
55
+ "speech & audio": "12",
56
+ "vision & multimodal": "7"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
57
  },
58
  "layer_norm_eps": 1e-05,
59
  "local_attention": 128,
 
68
  "num_hidden_layers": 22,
69
  "pad_token_id": 50283,
70
  "position_embedding_type": "absolute",
71
+ "problem_type": "single_label_classification",
72
  "reference_compile": true,
73
+ "repad_logits_with_grad": false,
74
  "sep_token_id": 50282,
75
  "sparse_pred_ignore_index": -100,
76
  "sparse_prediction": false,
77
  "torch_dtype": "float32",
78
+ "transformers_version": "4.48.0",
79
  "vocab_size": 50368
80
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d194be30d181b8cfb9202739e9f4b26972d406990975b65d04cc0e9f175d81bb
3
- size 598541300
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fdd5f191f0e54fd9c60d9f2b38a1aa12a1d66bafca92d538ad9a94b50f06a95
3
+ size 598476704
runs/Jan10_22-03-30_5e4eb05f69bb/events.out.tfevents.1736546616.5e4eb05f69bb.2578.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b524508fd26c66247528b91dd993a3591a54c36cfb9bbe651bb37e5bd3119dee
3
+ size 6862
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25bd22ddc0517daf7682a75eb884fa14c040494f0abb64be5908371babad56b0
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3c3573a3c15332c8382d24b442b2669b4d887d5b323de39035c48466545d860
3
  size 5432