mserras committed on
Commit
0704cb2
·
1 Parent(s): 6dbcc57

Update load_data.py

Browse files
Files changed (1) hide show
  1. load_data.py +3 -2
load_data.py CHANGED
@@ -11,6 +11,7 @@ from argilla.listeners import listener
11
 
12
  HF_TOKEN = os.environ.get("HF_TOKEN")
13
  HUB_DATASET_NAME = "mserras/alpaca-es-hackaton"
 
14
 
15
  @listener(
16
  dataset="somos-alpaca-es",
@@ -23,7 +24,7 @@ def save_validated_to_hub(records, ctx):
23
  if HF_TOKEN:
24
  print("Pushing the dataset")
25
  print(ds)
26
- ds.push_to_hub(HUB_DATASET_NAME, token=HF_TOKEN)
27
  else:
28
  print("SET HF_TOKEN and HUB_DATASET_NAME TO SYNC YOUR DATASET!!!")
29
  else:
@@ -70,7 +71,7 @@ class LoadDatasets:
70
  rg.log(
71
  records,
72
  name="somos-alpaca-es",
73
- tags={"description": "SomosNLP Hackathon dataset"},
74
  batch_size=200
75
  )
76
 
 
11
 
12
  HF_TOKEN = os.environ.get("HF_TOKEN")
13
  HUB_DATASET_NAME = "mserras/alpaca-es-hackaton"
14
+ HUB_DATASET_NAME_VAL = "mserras/alpaca-es-hackaton-validated"
15
 
16
  @listener(
17
  dataset="somos-alpaca-es",
 
24
  if HF_TOKEN:
25
  print("Pushing the dataset")
26
  print(ds)
27
+ ds.push_to_hub(HUB_DATASET_NAME_VAL, token=HF_TOKEN)
28
  else:
29
  print("SET HF_TOKEN and HUB_DATASET_NAME TO SYNC YOUR DATASET!!!")
30
  else:
 
71
  rg.log(
72
  records,
73
  name="somos-alpaca-es",
74
+ tags={"description": "SomosNLP Hackathon dataset - instruction filtering version"},
75
  batch_size=200
76
  )
77