Reinforcement Learning
kauiu committed on
Commit
867c0ac
·
verified ·
1 Parent(s): 16fe285

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +30 -5
README.md CHANGED
@@ -3,13 +3,12 @@ license: bsd
3
  datasets:
4
  - open-thoughts/OpenThoughts-114k
5
  - PJMixers-Dev/open-thoughts_OpenThoughts-114k-CustomShareGPT
6
- language:
7
- - aa
8
- - an
9
  base_model:
10
  - deepseek-ai/DeepSeek-V3
11
  - deepseek-ai/DeepSeek-R1
12
- pipeline_tag: text-generation
 
13
  ---
14
  # Model Card for Model ID
15
 
@@ -204,4 +203,30 @@ Carbon emissions can be estimated using the [Machine Learning Impact calculator]
204
 
205
  ## Model Card Contact
206
 
207
- [More Information Needed]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3
  datasets:
4
  - open-thoughts/OpenThoughts-114k
5
  - PJMixers-Dev/open-thoughts_OpenThoughts-114k-CustomShareGPT
6
+ - open-r1/OpenR1-Math-220k
 
 
7
  base_model:
8
  - deepseek-ai/DeepSeek-V3
9
  - deepseek-ai/DeepSeek-R1
10
+ pipeline_tag: question-answering
11
+ new_version: deepseek-ai/DeepSeek-R1
12
  ---
13
  # Model Card for Model ID
14
 
 
203
 
204
  ## Model Card Contact
205
 
206
+ [More Information Needed]
207
+ filter: [
208
+ {
209
+ bool: {
210
+ /// Include documents that match at least one of the following rules
211
+ should: [
212
+ /// Downloaded from diffusers lib
213
+ {
214
+ term: { path: "model_index.json" },
215
+ },
216
+ /// Direct downloads (LoRa, Auto1111 and others)
217
+ /// Filter out nested safetensors and pickle weights to avoid double counting downloads from the diffusers lib
218
+ {
219
+ regexp: { path: "[^/]*\\.safetensors" },
220
+ },
221
+ {
222
+ regexp: { path: "[^/]*\\.ckpt" },
223
+ },
224
+ {
225
+ regexp: { path: "[^/]*\\.bin" },
226
+ },
227
+ ],
228
+ minimum_should_match: 1,
229
+ },
230
+ },
231
+ ]
232
+ }